|
| 1 | +#!/usr/bin/env cwl-runner |
| 2 | +cwlVersion: 'v1.0' |
| 3 | +class: CommandLineTool |
| 4 | +id: "seqtk_seq" |
| 5 | +label: "Convert to FASTA (seqtk)" |
| 6 | +hints: |
| 7 | + DockerRequirement: |
| 8 | + dockerPull: quay.io/biocontainers/seqtk:1.2--1 |
| 9 | + SoftwareRequirement: |
| 10 | + packages: |
| 11 | + - package: seqtk |
| 12 | + version: |
| 13 | + - "1.2" |
| 14 | +inputs: |
| 15 | + input1: |
| 16 | + type: File |
| 17 | + doc: | |
| 18 | + Input FASTA file. |
| 19 | + inputBinding: |
| 20 | + position: 1 |
| 21 | + prefix: "-a" |
| 22 | +outputs: |
| 23 | + output1: |
| 24 | + type: File |
| 25 | + outputBinding: |
| 26 | + glob: out |
| 27 | +baseCommand: |
| 28 | + - "seqtk" |
| 29 | + - "seq" |
| 30 | +arguments: [] |
| 31 | +stdout: out |
| 32 | +doc: | |
| 33 | + |
| 34 | + Usage: seqtk seq [options] <in.fq>|<in.fa> |
| 35 | + |
| 36 | + Options: -q INT mask bases with quality lower than INT [0] |
| 37 | + -X INT mask bases with quality higher than INT [255] |
| 38 | + -n CHAR masked bases converted to CHAR; 0 for lowercase [0] |
| 39 | + -l INT number of residues per line; 0 for 2^32-1 [0] |
| 40 | + -Q INT quality shift: ASCII-INT gives base quality [33] |
| 41 | + -s INT random seed (effective with -f) [11] |
| 42 | + -f FLOAT sample FLOAT fraction of sequences [1] |
| 43 | + -M FILE mask regions in BED or name list FILE [null] |
| 44 | + -L INT drop sequences with length shorter than INT [0] |
| 45 | + -c mask complement region (effective with -M) |
| 46 | + -r reverse complement |
| 47 | + -A force FASTA output (discard quality) |
| 48 | + -C drop comments at the header lines |
| 49 | + -N drop sequences containing ambiguous bases |
| 50 | + -1 output the 2n-1 reads only |
| 51 | + -2 output the 2n reads only |
| 52 | + -V shift quality by '(-Q) - 33' |
| 53 | + -U convert all bases to uppercases |
| 54 | + -S strip of white spaces in sequences |
| 55 | + |
| 56 | +$namespaces: |
| 57 | + s: http://schema.org/ |
| 58 | +$schemas: |
| 59 | +- http://schema.org/docs/schema_org_rdfa.html |
| 60 | + |
| 61 | +s:mainEntity: |
| 62 | + class: s:SoftwareSourceCode |
| 63 | + s:name: seqtk |
| 64 | + s:about: 'Toolkit for processing sequences in FASTA/Q formats' |
| 65 | + s:url: https://github.com/lh3/seqtk |
| 66 | + s:codeRepository: https://github.com/lh3/seqtk |
| 67 | + |
| 68 | + s:license: |
| 69 | + - https://opensource.org/licenses/MIT |
| 70 | + |
| 71 | + s:targetProduct: |
| 72 | + class: s:SoftwareApplication |
| 73 | + s:softwareVersion: "1.2" |
| 74 | + s:applicationCategory: commandline tool |
| 75 | + s:programmingLanguage: C |
| 76 | + s:publication: |
| 77 | + - class: s:ScholarlyArticle |
| 78 | + id: http://dx.doi.org/10.1093/bioinformatics/bts635 |
| 79 | + |
| 80 | + s:author: |
| 81 | + - class: s:Person |
| 82 | + s:name: "Heng Li" |
| 83 | + s:sameAs: |
| 84 | + - id: https://orcid.org/0000-0003-4874-2874 |
| 85 | + |
| 86 | +s:downloadUrl: https://github.com/galaxyproject/planemo/blob/master/project_templates/seqtk_complete_cwl/seqtk_seq.cwl |
| 87 | +s:codeRepository: https://github.com/galaxyproject/planemo |
| 88 | + |
| 89 | +s:author: |
| 90 | + class: s:Person |
| 91 | + s:name: John Chilton |
| 92 | + s:email: mailto:jmchilton@gmail.com |
| 93 | + s:sameAs: |
| 94 | + - id: https://orcid.org/0000-0002-6794-0756 |
0 commit comments