RNA-Seq/cwl/helper/fastqc_2.cwl

   1 #!/usr/bin/env cwl-runner
   2 cwlVersion: v1.0
   3 class: CommandLineTool
   4
   5 hints:
   6   DockerRequirement:
   7     dockerPull: quay.io/biocontainers/fastqc:0.11.9--hdfd78af_1
   8   SoftwareRequirement:
   9     packages:
  10       fastqc:
  11         specs: [ "http://identifiers.org/biotools/fastqc" ]
  12         version: [ "0.11.9--hdfd78af_1", "0.11.9" ]
  13
  14 inputs:
  15
  16   reads_file:
  17     type: File
  18     inputBinding:
  19       position: 50
  20     doc: |
  21       Input bam,sam,bam_mapped,sam_mapped or fastq file
  22
  23   format_enum:
  24     type:
  25       - "null"
  26       - type: enum
  27         name: "format"
  28         symbols: ['bam','sam','bam_mapped','sam_mapped','fastq']
  29     inputBinding:
  30       position: 6
  31       prefix: '--format'
  32     doc: |
  33       Bypasses the normal sequence file format detection and
  34       forces the program to use the specified format.  Valid
  35       formats are bam,sam,bam_mapped,sam_mapped and fastq
  36
  37   threads:
  38     type: int?
  39     inputBinding:
  40       position: 7
  41       prefix: '--threads'
  42     doc: |
  43       Specifies the number of files which can be processed
  44       simultaneously.  Each thread will be allocated 250MB of
  45       memory so you shouldn't run more threads than your
  46       available memory will cope with, and not more than
  47       6 threads on a 32 bit machine
  48
  49   contaminants:
  50     type: File?
  51     inputBinding:
  52       position: 8
  53       prefix: '--contaminants'
  54     doc: |
  55       Specifies a non-default file which contains the list of
  56       contaminants to screen overrepresented sequences against.
  57       The file must contain sets of named contaminants in the
  58       form name[tab]sequence.  Lines prefixed with a hash will
  59       be ignored.
  60
  61   adapters:
  62     type: File?
  63     inputBinding:
  64       position: 9
  65       prefix: '--adapters'
  66     doc: |
  67       Specifies a non-default file which contains the list of
  68       adapter sequences which will be explicity searched against
  69       the library. The file must contain sets of named adapters
  70       in the form name[tab]sequence.  Lines prefixed with a hash
  71       will be ignored.
  72
  73   limits:
  74     type: File?
  75     inputBinding:
  76       position: 10
  77       prefix: '--limits'
  78     doc: |
  79       Specifies a non-default file which contains a set of criteria
  80       which will be used to determine the warn/error limits for the
  81       various modules.  This file can also be used to selectively
  82       remove some modules from the output all together.  The format
  83       needs to mirror the default limits.txt file found in the
  84       Configuration folder.
  85
  86   kmers:
  87     type: int?
  88     inputBinding:
  89       position: 11
  90       prefix: '--kmers'
  91     doc: |
  92       Specifies the length of Kmer to look for in the Kmer content
  93       module. Specified Kmer length must be between 2 and 10. Default
  94       length is 7 if not specified.
  95
  96   casava:
  97     type: boolean?
  98     inputBinding:
  99       position: 13
 100       prefix: '--casava'
 101     doc: |
 102       Files come from raw casava output. Files in the same sample
 103       group (differing only by the group number) will be analysed
 104       as a set rather than individually. Sequences with the filter
 105       flag set in the header will be excluded from the analysis.
 106       Files must have the same names given to them by casava
 107       (including being gzipped and ending with .gz) otherwise they
 108       won't be grouped together correctly.
 109
 110   nofilter:
 111     type: boolean?
 112     inputBinding:
 113       position: 14
 114       prefix: '--nofilter'
 115     doc: |
 116       If running with --casava then don't remove read flagged by
 117       casava as poor quality when performing the QC analysis.
 118
 119   hide_group:
 120     type: boolean?
 121     inputBinding:
 122       position: 15
 123       prefix: '--nogroup'
 124     doc: |
 125       Disable grouping of bases for reads >50bp. All reports will
 126       show data for every base in the read.  WARNING: Using this
 127       option will cause fastqc to crash and burn if you use it on
 128       really long reads, and your plots may end up a ridiculous size.
 129       You have been warned!
 130
 131 outputs:
 132
 133   zipped_file:
 134     type: File
 135     outputBinding:
 136       glob: '*.zip'
 137   html_file:
 138     type: File
 139     outputBinding:
 140       glob: '*.html'
 141   summary_file:
 142     type: File
 143     outputBinding:
 144       glob: "*/summary.txt"
 145
 146 baseCommand: [fastqc, --extract, --outdir, .]
 147
 148 $namespaces:
 149   s: http://schema.org/
 150
 151 $schemas:
 152 - https://github.com/schemaorg/schemaorg/raw/main/data/releases/11.01/schemaorg-current-http.rdf
 153
 154 s:name: "fastqc_2"
 155 s:license: http://www.apache.org/licenses/LICENSE-2.0
 156
 157 s:creator:
 158 - class: s:Organization
 159   s:legalName: "Cincinnati Children's Hospital Medical Center"
 160   s:location:
 161   - class: s:PostalAddress
 162     s:addressCountry: "USA"
 163     s:addressLocality: "Cincinnati"
 164     s:addressRegion: "OH"
 165     s:postalCode: "45229"
 166     s:streetAddress: "3333 Burnet Ave"
 167     s:telephone: "+1(513)636-4200"
 168   s:logo: "https://www.cincinnatichildrens.org/-/media/cincinnati%20childrens/global%20shared/childrens-logo-new.png"
 169   s:department:
 170   - class: s:Organization
 171     s:legalName: "Allergy and Immunology"
 172     s:department:
 173     - class: s:Organization
 174       s:legalName: "Barski Research Lab"
 175       s:member:
 176       - class: s:Person
 177         s:name: Michael Kotliar
 178         s:email: mailto:misha.kotliar@gmail.com
 179         s:sameAs:
 180         - id: http://orcid.org/0000-0002-6486-3898
 181
 182 doc: |
 183   Tool runs FastQC from Babraham Bioinformatics