Adding labels
authorSarah Wait Zaranek <swz@curii.com>
Wed, 24 Jun 2020 17:10:55 +0000 (17:10 +0000)
committerSarah Wait Zaranek <swz@curii.com>
Wed, 24 Jun 2020 17:10:55 +0000 (17:10 +0000)
Arvados-DCO-1.1-Signed-off-by: Sarah Wait Zaranek <swz@curii.com>
no issue #

WGS-processing/cwl/helper/bwamem-gatk-report-wf.cwl
WGS-processing/cwl/helper/getfastq.cwl
WGS-processing/cwl/wgs-processing-wf.cwl

index dbe5cf05f88dbdfa6e1014b98306b344f2238589..f1cfad4cac14af5825c1cd14209e82ed075b1f93 100644 (file)
@@ -1,14 +1,23 @@
 cwlVersion: v1.1
 class: Workflow
+label: WGS processing workflow for single sample
 
 requirements:
   - class: SubworkflowFeatureRequirement
 
 inputs:
-  fastq1: File
-  fastq2: File
+  fastq1: 
+    type: File
+    format: edam:format_1930 # FASTQ
+    label: One of set of pair-end FASTQs (R1)
+  fastq2: 
+    type: File
+    format: edam:format_1930 # FASTQ
+    label: One of set of pair-end FASTQs (R2)
   reference:
     type: File
+    format: edam:format_1929 # FASTA
+    label: Reference genome
     secondaryFiles:
       - .amb
       - .ann
@@ -17,30 +26,55 @@ inputs:
       - .sa
       - .fai
       - ^.dict
-  sample: string
+  sample: 
+    type: string
+    label: Sample Name
   knownsites:
     type: File
+    format: edam:format_3016 # VCF
+    label: VCF of known polymorphic sites for BQSR
     secondaryFiles:
       - .tbi   
-  scattercount: string
-  clinvarvcf: File
-  reportfunc: File
-  headhtml: File
-  tailhtml: File
+  scattercount: 
+    type: string
+    label: Desired split for variant calling
+  clinvarvcf:
+    type: File
+    format: edam:format_3016 # VCF
+    label: Reference VCF for ClinVar
+  reportfunc:
+    type: File
+    label: Function used to create HTML report
+  headhtml:
+    type: File
+    format: edam:format_1964 # HTML
+    label: Header for HTML report
+  tailhtml:
+    type: File
+    format: edam:format_1964 # HTML
+    label: Footer for HTML report
 
 outputs:
   qc-html:
     type: File[]
+    label: FASTQ QC report
+    format: edam:format_1964 # HTML
     outputSource: fastqc/out-html
   qc-zip:
     type: File[]
+    label: Zip file of FASTQ QC report and associated data
     outputSource: fastqc/out-zip 
   gvcf:
     type: File
     outputSource: haplotypecaller/gatheredgvcf
+    format: edam:format_3016 # GVCF
+    label: GVCF generated from GATK 
   report:
     type: File  
     outputSource: generate-report/report
+    format: edam:format_1964 # HTML
+    label: ClinVar variant report
+
 steps:
   fastqc:
     run: fastqc.cwl
@@ -91,3 +125,14 @@ steps:
       headhtml: headhtml
       tailhtml: tailhtml
     out: [report] 
+
+s:codeRepository: https://github.com/arvados/arvados-tutorial
+s:license: https://www.gnu.org/licenses/agpl-3.0.en.html
+
+$namespaces:
+ s: https://schema.org/
+ edam: http://edamontology.org/
+
+$schemas:
+ - https://schema.org/version/latest/schema.rdf
+ - http://edamontology.org/EDAM_1.18.owl
index c651771389f2720614f5e33fcab54e325f3a5305..e2aaa887eb27a4efe8239dcd52434673e39b7365 100644 (file)
@@ -1,23 +1,28 @@
-$namespaces:
-  arv: "http://arvados.org/cwl#"
-  cwltool: "http://commonwl.org/cwltool#"
 class: ExpressionTool
 cwlVersion: v1.1
-label: Create array of gvcfs to process
+label: Find matching FASTQ pairs 
 requirements:
   InlineJavascriptRequirement: {}
+
 inputs:
   fastqdir:
     type: Directory
-    label: Input directory of fastqs
+    label: Input directory of FASTQs
     loadListing: 'shallow_listing' 
+
 outputs:
   fastq1: 
     type: File[]
+    format: edam:format_1930 # FASTQ
+    label: Half set of pair-end FASTQs (R1)
   fastq2:
     type: File[]
+    format: edam:format_1930 # FASTQ
+    label: Half set of pair-end FASTQs (R2)
   sample:
     type: string[]
+    label: Sample Names
+
 expression: |
   ${function compare(a, b) {
     var baseA = a.basename;
@@ -58,3 +63,17 @@ expression: |
  
     return {"fastq1": fastq1, "fastq2": fastq2, "sample": sample};
   }
+
+
+s:codeRepository: https://github.com/arvados/arvados-tutorial
+s:license: https://www.gnu.org/licenses/agpl-3.0.en.html
+
+$namespaces:
+ s: https://schema.org/
+ edam: http://edamontology.org/
+ arv: "http://arvados.org/cwl#"
+ cwltool: "http://commonwl.org/cwltool#"
+
+$schemas:
+ - https://schema.org/version/latest/schema.rdf
+ - http://edamontology.org/EDAM_1.18.owl
index a6218bdaa79bd28f83a2cd91087fca673999cf8a..58e38cbf2d6453908bfb5b4c4564daa439996988 100644 (file)
@@ -22,9 +22,6 @@ inputs:
       - .sa
       - .fai
       - ^.dict
-  sample: 
-    type: string
-    label: Sample name
   knownsites:
     type: File
     format: edam:format_3016 # VCF
@@ -55,7 +52,7 @@ outputs:
     type: File[]
     outputSource: bwamem-gatk-report/gvcf
     format: edam:format_3016 # GVCF
-    label: GVCFs generated from sets of fastqs
+    label: GVCFs generated from GATK 
     
   report:
     type: File[]