-
Notifications
You must be signed in to change notification settings - Fork 8
/
Copy pathminiex.config
133 lines (122 loc) · 4.12 KB
/
miniex.config
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
////////////////////////////////
// MINI-EX CONFIGURATION FILE //
////////////////////////////////
// SPECIFY THE SYSTEM EXECUTOR //
executor {
name = 'slurm'
// --> common examples: local, slurm, sge, azurebatch
queueSize = 5
}
// SINGULARITY CONTAINERS SETTINGS // (not to be adapted)
process.container = "vibpsb/mini-ex:latest"
singularity {
enabled = true
cacheDir = "singularity_cache"
autoMounts = true
}
params {
// INPUT FILES DERIVED FROM SINGLE-CELL DATASETS //
expressionMatrix = "$baseDir/example/INPUTS/*_matrix.tsv"
markersOut = "$baseDir/example/INPUTS/*_allMarkers.tsv"
cellsToClusters = "$baseDir/example/INPUTS/*_cells2clusters.tsv"
clustersToIdentities = "$baseDir/example/INPUTS/*_identities.tsv"
// CACHED FILES // (allows to reuse the initial coexpression network)
grnboostOut = "/$baseDir/example/OUTPUTS/grnboost2/*_grnboost2.tsv"
// --> to infer coexpression network de novo, replace the line above by: grnboostOut = null
// SPECIES SPECIFIC INFORMATION //
tfList = "$baseDir/data/ath/ath_TF_list.tsv"
geneAliases = "$baseDir/data/ath/ath_gene_aliases.tsv"
// --> if gene aliases are not available, replace the line above by: geneAliases = null
infoTf = "$baseDir/data/ath/ath_TF2fam2mot.tsv"
featureFileMotifs = "$baseDir/data/ath/ath_2021.1_motifMapping.out.gz"
goFile = "$baseDir/data/ath/ath_full_BP_expcur_ext_names.tsv"
// --> if GO data is not available, replace the line above by: goFile = null
// (when doing so, termsOfInterest should also be set to <null>)
// PARAMETERS //
doMotifAnalysis = true
// --> set to <false> if no motif mapping data is available
// [CAUTION: without motif data MINI-EX is less reliable]
termsOfInterest = "$baseDir/example/INPUTS/GOsIwant.tsv"
// --> to use the standard ranking procedure, replace the line above by: termsOfInterest = null
topMarkers = "700"
expressionFilter = "10"
motifFilter = "TF-F_motifs"
// --> to use the motifs of the TF family: motifFilter = "TF-F_motifs"
// --> to only use the motifs known for a TF: motifFilter = "TF_motifs"
topRegulons = "150"
enrichmentBackground = null
// --> to specify an enrichment background: enrichmentBackground = "pathToTheFile", with file containing one gene id per line
// (when not specified, the background defaults to the list of genes that are present in the expression matrix)
// SPECIFY OUTPUT DIRECTORY //
outputDir = "$baseDir/output"
}
// SPECIFY MEMORY AND CPUS FOR EACH PROCESS //
process {
withName: check_user_input {
memory = '1 GB'
}
withName: get_expressed_genes {
memory = '1 GB'
}
withName: run_grnboost {
memory = '20 GB'
cpus = 5
}
withName: unzip_motif_mappings {
executor = 'local'
}
withName: run_enricher_motifs {
memory = '4 GB'
}
withName: filter_motifs {
memory = '20 GB'
}
withName: filter_motifs_dummy {
executor = 'local'
}
withName: get_top_degs {
memory = '10 GB'
}
withName: run_enricher_cluster {
memory = '4 GB'
}
withName: filter_expression {
memory = '20 GB'
}
withName: make_info_file {
memory = '10 GB'
}
withName: make_regulon_clustermap {
memory = '20 GB'
}
withName: get_network_centrality {
memory = '20 GB'
}
withName: make_go_enrichment_files {
memory = '10 GB'
}
withName: run_enricher_go {
memory = '4 GB'
}
withName: select_borda_procedure {
memory = '10 GB'
}
withName: make_ranking_dataframe {
memory = '10 GB'
}
withName: make_borda {
memory = '10 GB'
}
withName: score_edges {
memory = '15 GB'
}
withName: make_top_regulons_heatmaps {
memory = '20 GB'
}
withName: make_regmaps {
memory = '20 GB'
}
withName: make_log_file {
executor = 'local'
}
}