cwlVersion: v1.1 class: Workflow label: Variant calling workflow for given interval requirements: SubworkflowFeatureRequirement: {} inputs: bam: type: File format: edam:format_2572 # BAM label: Indexed sorted BAM with labeled duplicates secondaryFiles: - .bai reference: type: File format: edam:format_1929 # FASTA label: Reference genome secondaryFiles: - .amb - .ann - .bwt - .pac - .sa - .fai - ^.dict sample: type: string label: Sample Name knownsites1: type: File format: edam:format_3016 # VCF label: VCF of known SNPS sites for BQSR secondaryFiles: - .idx knownsites2: type: File format: edam:format_3016 # VCF label: VCF of known indel sites for BQSR secondaryFiles: - .tbi intervallist: type: File label: Scatter intervals file outputs: gvcf: type: File format: edam:format_3016 # GVCF label: Given interval filtered GVCF outputSource: selectvariants/filteredgvcf steps: basecalibrator: run: gatk-baserecalibrator-with-interval.cwl in: bam: bam reference: reference sample: sample knownsites1: knownsites1 knownsites2: knownsites2 intervallist: intervallist out: [recaltable] applyBQSR: run: gatk-applyBSQR-with-interval.cwl in: reference: reference bam: bam sample: sample intervallist: intervallist recaltable: basecalibrator/recaltable out: [recalbam] haplotypecaller: run: gatk-haplotypecaller-with-interval.cwl in: reference: reference bam: applyBQSR/recalbam sample: sample intervallist: intervallist out: [gvcf] selectvariants: run: gatk-selectvariants.cwl in: gvcf: haplotypecaller/gvcf reference: reference sample: sample out: [filteredgvcf] s:codeRepository: https://github.com/arvados/arvados-tutorial s:license: https://www.gnu.org/licenses/agpl-3.0.en.html $namespaces: s: https://schema.org/ edam: http://edamontology.org/ #$schemas: # - https://schema.org/version/latest/schema.rdf # - http://edamontology.org/EDAM_1.18.owl