3 label: WGS processing workflow for single sample
6 SubworkflowFeatureRequirement: {}
11 format: edam:format_1930 # FASTQ
12 label: One of set of pair-end FASTQs (R1)
15 format: edam:format_1930 # FASTQ
16 label: One of set of pair-end FASTQs (R2)
19 format: edam:format_1929 # FASTA
20 label: Reference genome
31 label: Full list of intervals to operate over
37 format: edam:format_3016 # VCF
38 label: VCF of known polymorphic sites for BQSR
43 label: Desired split for variant calling
46 format: edam:format_3016 # VCF
47 label: Reference VCF for ClinVar
50 label: Function used to create HTML report
53 format: edam:format_2331 # HTML
54 label: Header for HTML report
57 format: edam:format_2331 # HTML
58 label: Footer for HTML report
63 label: FASTQ QC reports
64 format: edam:format_2331 # HTML
65 outputSource: fastqc/out-html
68 label: Zip files of FASTQ QC report and associated data
69 outputSource: fastqc/out-zip
72 outputSource: haplotypecaller/gatheredgvcf
73 format: edam:format_3016 # GVCF
74 label: GVCF generated from GATK Haplotype Caller
77 outputSource: generate-report/report
78 format: edam:format_2331 # HTML
79 label: ClinVar variant report
87 out: [out-html, out-zip]
89 run: bwamem-samtools-view.cwl
97 run: samtools-sort.cwl
99 bam: bwamem-samtools-view/bam
103 run: mark-duplicates.cwl
105 bam: samtools-sort/sortedbam
106 out: [dupbam,dupmetrics]
108 run: samtools-index.cwl
110 bam: mark-duplicates/dupbam
113 run: scatter-gatk-wf-with-interval.cwl
116 fullintervallist: fullintervallist
117 bam: samtools-index/indexedbam
119 scattercount: scattercount
120 knownsites: knownsites
125 gvcf: haplotypecaller/gatheredgvcf
127 clinvarvcf: clinvarvcf
128 reportfunc: reportfunc
133 s:codeRepository: https://github.com/arvados/arvados-tutorial
134 s:license: https://www.gnu.org/licenses/agpl-3.0.en.html
137 s: https://schema.org/
138 edam: http://edamontology.org/
141 # - https://schema.org/version/latest/schema.rdf
142 # - http://edamontology.org/EDAM_1.18.owl