-
Notifications
You must be signed in to change notification settings - Fork 6
/
nextflow.config
162 lines (115 loc) · 3.78 KB
/
nextflow.config
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
manifest {
description = 'PhIP-Seq common analysis workflows'
nextflowVersion = '>= 20.07.0'
}
// PIPELINE KNOBS
params{
/*
sample reads options
*/
// Stream Function
// Set this as 'cat' if fastq files not g'zipped
fastq_stream_func = 'zcat'
/*
output options
*/
// Dataset Name Prefix
dataset_prefix = 'data'
// Output Xarray pickle
output_pickle_xarray = true
// Output tall format ds
output_tall_csv = false
// Output wide format ds
output_wide_csv = true
/*
alignment options
*/
// read length for align
read_length = 125
// peptide oligo encoding length for alignment
oligo_tile_length = 117
// mismatches allowed (end-to-end)
n_mismatches = 2
// other bowtie options
bowtie_optional_args = '--tryhard --nomaqround --norc --best --sam --quiet'
// Flag for replicating counts for replicate sequences
replicate_sequence_counts = true
/*
Optional workflows
*/
run_cpm_enr_workflow = false
run_zscore_fit_predict = false
run_edgeR = true
// WARNING: This functionality has not been fully tested
run_BEER = false
/*
Options for grouping results by organism (e.g. VirScan)
*/
// Flag used to control the summary of results by organism
summarize_by_organism = false
// Column in the peptide table indicating the organism for each peptide
peptide_org_col = "organism"
// Column in the peptide table containing the peptide sequence
// (used to match against public epitopes, and to filter overlapping peptides)
peptide_seq_col = "seq"
// Maximum allowed overlap between detected peptides
max_overlap = 7
// Minimum z-score threshold
zscore_threshold = 2.5
// Maximum edgeR threshold (BH-adjusted p-value)
edgeR_threshold = 0.05
// Column in the sample table used for mapping replicates to samples
sample_grouping_col = ""
// Optional, a CSV containing public epitopes
public_epitopes_csv = "$projectDir/templates/public_epitope_template.csv"
// In the public epitopes CSV, the column containing the translated amino acid sequence
public_epitopes_col = "peptide_translate"
}
// Set the container which can be used for all processes
process {
// Default for any processes which do not match the selectors below
container = 'quay.io/matsengrp/phip-flow:latest'
withName: 'run_edgeR|run_BEER' {
container = 'quay.io/biocontainers/bioconductor-beer:1.2.0--r42hdfd78af_0'
}
}
profiles {
// Run locally assuming all deps available in current environment
standard {
}
// Run locally assuming docker is installed with the latest image
docker {
docker.enabled = true
}
singularity {
singularity.enabled = true
singularity.autoMounts = true
//singularity.cacheDir = 'singularity_cache'
singularity.runOptions = '--contain -W /tmp/ -B ${HOME},${PWD}'
}
apptainer {
apptainer.enabled = true
apptainer.autoMounts = true
//apptainer.cacheDir = 'apptainer_cache'
apptainer.runOptions = '--contain -W /tmp/ -B ${HOME},${PWD}'
}
// Run batch submission assuming docker is installed with the latest image
cluster {
singularity {
enabled = true
autoMounts = true
cacheDir = 'singularity_cache'
runOptions = '--contain -W /tmp/ -B ${HOME},${PWD}'
}
process {
executor = 'slurm'
queue = 'campus-new'
cpus = 1
memory = 16.GB
time = '1h'
clusterOptions = '-A overbaugh_j'
withLabel: mem_large { memory = 48.GB }
withLabel: mem_xlarge { memory = 64.GB }
}
}
}