Updating cwl and yml for intervals and other changes
[arvados-tutorial.git] / WGS-processing / cwl / wgs-processing-wf.cwl
index 0f8f8ccb78885eee9c1cf29c264199837b296c73..8cbcf5ee03b17f7d5800b611fd29a4d69cfcc105 100644 (file)
@@ -1,14 +1,19 @@
 cwlVersion: v1.1
 class: Workflow
+label: WGS processing workflow scattered over samples
 
 requirements:
   - class: SubworkflowFeatureRequirement
   - class: ScatterFeatureRequirement
 
 inputs:
-  fastqdir: Directory 
+  fastqdir:
+    type: Directory 
+    label: Directory of paired FASTQ files
   reference:
     type: File
+    format: edam:format_1929 # FASTA
+    label: Reference genome 
     secondaryFiles:
       - .amb
       - .ann
@@ -17,24 +22,44 @@ inputs:
       - .sa
       - .fai
       - ^.dict
-  sample: string
+  fullintervallist:
+    type: File
   knownsites:
     type: File
+    format: edam:format_3016 # VCF
+    label: VCF of known polymorphic sites for BQSR
     secondaryFiles:
       - .tbi   
-  scattercount: string
-  clinvarvcf: File
-  reportfunc: File
-  headhtml: File
-  tailhtml: File
+  scattercount: 
+    type: string
+    label: Desired split for variant calling
+  clinvarvcf: 
+    type: File
+    format: edam:format_3016 # VCF
+    label: Reference VCF for ClinVar
+  reportfunc: 
+    type: File
+    label: Function used to create HTML report
+  headhtml: 
+    type: File
+    format: edam:format_2331 # HTML 
+    label: Header for HTML report
+  tailhtml: 
+    type: File
+    format: edam:format_2331 # HTML
+    label: Footer for HTML report
 
 outputs:
   gvcf:
     type: File[]
     outputSource: bwamem-gatk-report/gvcf
+    format: edam:format_3016 # VCF (GVCF)
+    label: GVCFs generated from GATK 
   report:
     type: File[]  
     outputSource: bwamem-gatk-report/report
+    format: edam:format_2331 # HTML
+    label: ClinVar variant reports 
 
 steps:
   getfastq:
@@ -51,6 +76,7 @@ steps:
       fastq1: getfastq/fastq1
       fastq2: getfastq/fastq2
       reference: reference
+      fullintervallist: fullintervallist
       sample: getfastq/sample
       knownsites: knownsites
       scattercount: scattercount
@@ -64,4 +90,9 @@ s:codeRepository: https://github.com/arvados/arvados-tutorial
 s:license: https://www.gnu.org/licenses/agpl-3.0.en.html
 
 $namespaces:
-  s: https://schema.org/
+ s: https://schema.org/
+ edam: http://edamontology.org/
+
+#$schemas:
+# - https://schema.org/version/latest/schema.rdf
+# - http://edamontology.org/EDAM_1.18.owl