-
Notifications
You must be signed in to change notification settings - Fork 15
/
pepatac_input_schema.yaml
executable file
·110 lines (110 loc) · 3.66 KB
/
pepatac_input_schema.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
description: A PEP for ATAC-seq samples for the PEPATAC pipeline.
imports:
- https://schema.databio.org/pep/2.0.0.yaml # Use a web-based schema source file
#- PEP_schema.yaml # Use a local (current directory) schema source file
properties:
samples:
type: array
items:
type: object
properties:
sample_name:
type: string
description: "Name of the sample"
organism:
type: string
description: "Organism"
protocol:
type: string
description: "Must be an ATAC-seq or DNAse-seq sample"
genome:
type: string
description: "Refgenie genome registry identifier"
prealignments:
type: ["array"]
descrption: "Refgenie genome registry identifiers"
read_type:
type: string
description: "Is this single or paired-end data?"
enum: ["SINGLE", "single", "PAIRED", "paired"]
read1:
type: string
description: "Fastq file for read 1"
read2:
type: string
description: "Fastq file for read 2 (for paired-end experiments)"
extend:
type: string
description: "Length to extend fixed width peaks around summit"
frip_ref_peaks:
type: string
description: "Path to a reference peak set"
aligner:
type: string
description: "Specify the read alignment tool"
enum: ["bowtie2", "bwa"]
peak_caller:
type: string
description: "Specify the peak calling tool"
enum: ["fseq", "genrich", "hmmratac", "homer", "macs3"]
genome_size:
type: string
description: "MACS2 effective genome size"
trimmer:
type: string
description: "Specify the read trimming tool"
enum: ["trimmomatic", "pyadapt", "skewer"]
deduplicator:
type: string
description: "Specify the read deduplication tool"
enum: ["picard", "samblaster", "samtools"]
peak_type:
type: string
description: "Call variable or fixed width peaks"
enum: ["fixed", "variable"]
anno_name:
type: string
description: "Genomic partitions annotation file (by default uses Refgenie asset)"
blacklist:
type: string
description: "Path to file of blacklisted genomic regions (by default uses Refgenie asset)"
TSS_name:
type: string
description: "TSS annotation file (by default uses Refgenie asset)"
motif:
type: boolean
description: "Use HOMER to perform motif enrichment analysis"
sob:
type: boolean
description: "Use seqOutBias to generate signal tracks"
no_scale:
type: boolean
description: "Do not scale signal tracks"
prioritize:
type: boolean
description: "Plot cFRiF/FRiF using mutually exclusive priority ranked features based on the order of feature appearance in the feature annotation asset"
keep:
type: boolean
description: "Keep prealignment BAM files"
noFIFO:
type: boolean
description: "Do NOT use named pipes during prealignments"
lite:
type: boolean
description: "Remove all intermediate file types"
skipqc:
type: boolean
description: "Do not use FastQC even if available"
required:
- sample_name
- protocol
- read_type
- read1
- genome
required_files:
- read1
files:
- read1
- read2
required:
- samples