-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathconfig.yaml
35 lines (29 loc) · 1.41 KB
/
config.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
# This file should contain everything to configure the workflow on a global scale.
# In case of sample based data are in metadata.tsv file that contains one row per sample and with following column headers. Also no comments (#) are allowed in it.
# ID: column in Metadata file for sample name
# Group: column in Metadata file for Group (treatment)
# R1: column in Metadata file for R1 rawdata path
# R2: column in METADATA file for R2 rawdata path
# Merged: column in Metadata file for Merged (by flash or pandaseq) rawdata path
Project: test
Metadata: metadata.tsv # use absolute path to avoid trouble; relative path should be relative to Workdir, including paths within metadata.tsv.
Workdir: # the directory where ssusearch is run if not specified
# --------------------------------
# Parameters
# --------------------------------
#
### search step:
Gene: ssu
Cpu: 4 # max threads for each process/task
# pick start and end of a region in V4 for de novo clustering
# the default numbers are for 150bp reads
# rule of thumb is pick a region with more reads with larger overlap
# change to Start=577, End=657, Len_cutoff=75 for 100bp reads
Start: 577
End: 727
Len_cutoff: 100 # min length for reads picked for the region
### clust step
Java_xmx: 4g # depends on data size; Increase this if you see error like "java.lang.OutOfMemoryError"
Otu_dist_cutoff: 0.05
# Refdir defaults to the same directory as Snakefile
Refdir: