Skip to content

Commit cd3b054

Browse files
authored
Merge pull request #2960 from nsoranzo/minia
Add minimal wrapper for minia
2 parents 6de23fe + 5110437 commit cd3b054

5 files changed

Lines changed: 118 additions & 3 deletions

File tree

tools/minia/.shed.yml

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,11 @@
1+
categories:
2+
- Assembly
3+
description: Short-read assembler based on a de Bruijn graph
4+
long_description: |
5+
Minia is capable of assembling a human genome on a desktop computer in a day.
6+
The output of Minia is a set of contigs.
7+
name: minia
8+
owner: iuc
9+
remote_repository_url: https://github.com/galaxyproject/tools-iuc/tree/master/tools/minia
10+
homepage_url: https://gatb.inria.fr/software/minia/
11+
type: unrestricted

tools/minia/minia.xml

Lines changed: 55 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,55 @@
1+
<tool id="minia" name="Minia" version="@TOOL_VERSION@">
2+
<description>Short-read assembler based on a de Bruijn graph</description>
3+
<macros>
4+
<token name="@TOOL_VERSION@">3.2.1</token>
5+
</macros>
6+
<requirements>
7+
<requirement type="package" version="@TOOL_VERSION@">minia</requirement>
8+
</requirements>
9+
<command detect_errors="exit_code"><![CDATA[
10+
#set input = 'infile.' + $in.ext
11+
ln -s '$in' '$input' &&
12+
13+
minia
14+
-in '$input'
15+
-kmer-size $kmer_size
16+
#if str($abundance_min):
17+
-abundance-min $abundance_min
18+
#end if
19+
#if str($abundance_max):
20+
-abundance-min $abundance_max
21+
#end if
22+
-nb-cores \${GALAXY_SLOTS:-1}
23+
-out output
24+
]]></command>
25+
<inputs>
26+
<param argument="-in" type="data" format="fasta,fastqsanger,fastqsanger.gz,fasta.gz" label="Reads in FASTA or FASTQ format" />
27+
<param argument="-kmer-size" type="integer" value="31" min="1" label="Size of a kmer" />
28+
<param argument="-abundance-min" type="integer" value="" optional="true" min="0" label="Min abundance threshold for solid kmers (default: 2)" />
29+
<param argument="-abundance-max" type="integer" value="" optional="true" label="Max abundance threshold for solid kmers" />
30+
</inputs>
31+
<outputs>
32+
<data name="output" format="fasta" label="${tool.name} on ${on_string}" from_work_dir="output.contigs.fa" />
33+
</outputs>
34+
<tests>
35+
<test>
36+
<param name="in" value="ec.fa" />
37+
<param name="kmer_size" value="21" />
38+
<param name="abundance_min" value="1" />
39+
<output name="output" ftype="fasta">
40+
<assert_contents>
41+
<has_text text="LN:i:460 KC:i:2200 km:f:5.000"/>
42+
<has_text text="LN:i:637 KC:i:3085 km:f:5.000"/>
43+
<has_n_lines n="4"/>
44+
</assert_contents>
45+
</output>
46+
</test>
47+
</tests>
48+
<help><![CDATA[
49+
Minia is a short-read assembler based on a de Bruijn graph, capable of assembling a human genome on a desktop computer in a day.
50+
The output of Minia is a set of contigs.
51+
]]></help>
52+
<citations>
53+
<citation type="doi">10.1186/1748-7188-8-22</citation>
54+
</citations>
55+
</tool>

tools/minia/test-data/ec.fa

Lines changed: 49 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,49 @@
1+
>works well for k=21; part of genome10K.fasta
2+
CATCGATGCGAGACGCCTGTCGCGGGGAATTGTGGGGCGGACCACGCTCTGGCTAACGAGCTACCGTTTCCTTTAACCTGCCAGACGGTGACCAGGGCCGTTCGGCGTTGCATCGAGCGGTGTCGCTAGCGCAATGCGCAAGATTTTGACATTTACAAGGCAACATTGCAGCGTCCGATGGTCCGGTGGCCTCCAGATAGTGTCCAGTCGCTCTAACTGTATGGAGACCATAGGCATTTACCTTATTCTCATCGCCACGCCCCAAGATCTTTAGGACCCAGCATTCCTTTAACCACTAACATAACGCGTGTCATCTAGTTCAACAACC
3+
>remaining part
4+
TGTCATCTAGTTCAACAACCGTTATGCCGTCCGACTCTTGCGCTCGGATGTCCGCAATGGGTTATCCCTATGTTCCGGTAATCTCTCATCTACTAAGCGCCCTAAAGGTCGTATGGTTGGAGGGCGGTTACACACCCTTAAGTACCGAACGATAGAGCACCCGTCTAGGAGGGCGTGCAGGGTCTCCCGCTAGCTAATGGTCACGGCCTCTCTGGGAAAGCTGAACAACGGATGATACCCATACTGCCACTCCAGTACCTGGGCCGCGTGTTGTACGCTGTGTATCTTGAGAGCGTTTCCAGCAGATAGAACAGGATCACATGTACATG
5+
>that's the EC
6+
TGTCATCTAGTTCAACAACCAAAAAAA
7+
>contig that is split in two by the EC, containing the last kmer of the ec (CTAGTTCAACAACCAAAAAAA)
8+
GGTGAACAGCACATCTTTTCGTCCTGAGGCCATATTAATTCTACTCAGATTGTCTGTAACCGGAGCTTCGGGCGTATTTTTGCGTAAGACACTGCCTAAAGGGAACATATGTGTCCAGAATAGGGTTCAACGGTGTATGAGCAAA
9+
CTAGTTCAACAACCAAAAAAA
10+
TTGTGTGCAAGCTACTTCTAGACCTTATTAAGTGCCCAGGAATTCCTAGGAAGGCGCGCAGCTCAAGCAATCATACATGGCGGAATGCCTGTCCACCGGGGGTTCTACTGTACCACAGTGGCCTGGATAGCTAAGCAGGTCCTGGATTGGCATGTCATCCGGAGTGATAGGCACTGCTCACGACCAGCTTGCGGACAAACGGGGTGCCCGCGCCTGCGTCCGGTAGACGAGCGATGGATTTAGACCGTTCACTGAACCCTCTAATAGGACCTCTTGCCCATCCGAGGCTTAAGC
11+
>the rest below is just repeated for coverage reasons
12+
A
13+
>the rest below is just repeated for coverage reasons
14+
A
15+
>the rest below is just repeated for coverage reasons
16+
A
17+
>contig that is split in two by the EC, containing the last kmer of the ec (CTAGTTCAACAACCAAAAAAA)
18+
GGTGAACAGCACATCTTTTCGTCCTGAGGCCATATTAATTCTACTCAGATTGTCTGTAACCGGAGCTTCGGGCGTATTTTTGCGTAAGACACTGCCTAAAGGGAACATATGTGTCCAGAATAGGGTTCAACGGTGTATGAGCAAA
19+
CTAGTTCAACAACCAAAAAAA
20+
TTGTGTGCAAGCTACTTCTAGACCTTATTAAGTGCCCAGGAATTCCTAGGAAGGCGCGCAGCTCAAGCAATCATACATGGCGGAATGCCTGTCCACCGGGGGTTCTACTGTACCACAGTGGCCTGGATAGCTAAGCAGGTCCTGGATTGGCATGTCATCCGGAGTGATAGGCACTGCTCACGACCAGCTTGCGGACAAACGGGGTGCCCGCGCCTGCGTCCGGTAGACGAGCGATGGATTTAGACCGTTCACTGAACCCTCTAATAGGACCTCTTGCCCATCCGAGGCTTAAGC
21+
>contig that is split in two by the EC, containing the last kmer of the ec (CTAGTTCAACAACCAAAAAAA)
22+
GGTGAACAGCACATCTTTTCGTCCTGAGGCCATATTAATTCTACTCAGATTGTCTGTAACCGGAGCTTCGGGCGTATTTTTGCGTAAGACACTGCCTAAAGGGAACATATGTGTCCAGAATAGGGTTCAACGGTGTATGAGCAAA
23+
CTAGTTCAACAACCAAAAAAA
24+
TTGTGTGCAAGCTACTTCTAGACCTTATTAAGTGCCCAGGAATTCCTAGGAAGGCGCGCAGCTCAAGCAATCATACATGGCGGAATGCCTGTCCACCGGGGGTTCTACTGTACCACAGTGGCCTGGATAGCTAAGCAGGTCCTGGATTGGCATGTCATCCGGAGTGATAGGCACTGCTCACGACCAGCTTGCGGACAAACGGGGTGCCCGCGCCTGCGTCCGGTAGACGAGCGATGGATTTAGACCGTTCACTGAACCCTCTAATAGGACCTCTTGCCCATCCGAGGCTTAAGC
25+
>works well for k=21; part of genome10K.fasta
26+
CATCGATGCGAGACGCCTGTCGCGGGGAATTGTGGGGCGGACCACGCTCTGGCTAACGAGCTACCGTTTCCTTTAACCTGCCAGACGGTGACCAGGGCCGTTCGGCGTTGCATCGAGCGGTGTCGCTAGCGCAATGCGCAAGATTTTGACATTTACAAGGCAACATTGCAGCGTCCGATGGTCCGGTGGCCTCCAGATAGTGTCCAGTCGCTCTAACTGTATGGAGACCATAGGCATTTACCTTATTCTCATCGCCACGCCCCAAGATCTTTAGGACCCAGCATTCCTTTAACCACTAACATAACGCGTGTCATCTAGTTCAACAACC
27+
>remaining part
28+
TGTCATCTAGTTCAACAACCGTTATGCCGTCCGACTCTTGCGCTCGGATGTCCGCAATGGGTTATCCCTATGTTCCGGTAATCTCTCATCTACTAAGCGCCCTAAAGGTCGTATGGTTGGAGGGCGGTTACACACCCTTAAGTACCGAACGATAGAGCACCCGTCTAGGAGGGCGTGCAGGGTCTCCCGCTAGCTAATGGTCACGGCCTCTCTGGGAAAGCTGAACAACGGATGATACCCATACTGCCACTCCAGTACCTGGGCCGCGTGTTGTACGCTGTGTATCTTGAGAGCGTTTCCAGCAGATAGAACAGGATCACATGTACATG
29+
>works well for k=21; part of genome10K.fasta
30+
CATCGATGCGAGACGCCTGTCGCGGGGAATTGTGGGGCGGACCACGCTCTGGCTAACGAGCTACCGTTTCCTTTAACCTGCCAGACGGTGACCAGGGCCGTTCGGCGTTGCATCGAGCGGTGTCGCTAGCGCAATGCGCAAGATTTTGACATTTACAAGGCAACATTGCAGCGTCCGATGGTCCGGTGGCCTCCAGATAGTGTCCAGTCGCTCTAACTGTATGGAGACCATAGGCATTTACCTTATTCTCATCGCCACGCCCCAAGATCTTTAGGACCCAGCATTCCTTTAACCACTAACATAACGCGTGTCATCTAGTTCAACAACC
31+
>remaining part
32+
TGTCATCTAGTTCAACAACCGTTATGCCGTCCGACTCTTGCGCTCGGATGTCCGCAATGGGTTATCCCTATGTTCCGGTAATCTCTCATCTACTAAGCGCCCTAAAGGTCGTATGGTTGGAGGGCGGTTACACACCCTTAAGTACCGAACGATAGAGCACCCGTCTAGGAGGGCGTGCAGGGTCTCCCGCTAGCTAATGGTCACGGCCTCTCTGGGAAAGCTGAACAACGGATGATACCCATACTGCCACTCCAGTACCTGGGCCGCGTGTTGTACGCTGTGTATCTTGAGAGCGTTTCCAGCAGATAGAACAGGATCACATGTACATG
33+
>contig that is split in two by the EC, containing the last kmer of the ec (CTAGTTCAACAACCAAAAAAA)
34+
GGTGAACAGCACATCTTTTCGTCCTGAGGCCATATTAATTCTACTCAGATTGTCTGTAACCGGAGCTTCGGGCGTATTTTTGCGTAAGACACTGCCTAAAGGGAACATATGTGTCCAGAATAGGGTTCAACGGTGTATGAGCAAA
35+
CTAGTTCAACAACCAAAAAAA
36+
TTGTGTGCAAGCTACTTCTAGACCTTATTAAGTGCCCAGGAATTCCTAGGAAGGCGCGCAGCTCAAGCAATCATACATGGCGGAATGCCTGTCCACCGGGGGTTCTACTGTACCACAGTGGCCTGGATAGCTAAGCAGGTCCTGGATTGGCATGTCATCCGGAGTGATAGGCACTGCTCACGACCAGCTTGCGGACAAACGGGGTGCCCGCGCCTGCGTCCGGTAGACGAGCGATGGATTTAGACCGTTCACTGAACCCTCTAATAGGACCTCTTGCCCATCCGAGGCTTAAGC
37+
>contig that is split in two by the EC, containing the last kmer of the ec (CTAGTTCAACAACCAAAAAAA)
38+
GGTGAACAGCACATCTTTTCGTCCTGAGGCCATATTAATTCTACTCAGATTGTCTGTAACCGGAGCTTCGGGCGTATTTTTGCGTAAGACACTGCCTAAAGGGAACATATGTGTCCAGAATAGGGTTCAACGGTGTATGAGCAAA
39+
CTAGTTCAACAACCAAAAAAA
40+
TTGTGTGCAAGCTACTTCTAGACCTTATTAAGTGCCCAGGAATTCCTAGGAAGGCGCGCAGCTCAAGCAATCATACATGGCGGAATGCCTGTCCACCGGGGGTTCTACTGTACCACAGTGGCCTGGATAGCTAAGCAGGTCCTGGATTGGCATGTCATCCGGAGTGATAGGCACTGCTCACGACCAGCTTGCGGACAAACGGGGTGCCCGCGCCTGCGTCCGGTAGACGAGCGATGGATTTAGACCGTTCACTGAACCCTCTAATAGGACCTCTTGCCCATCCGAGGCTTAAGC
41+
>works well for k=21; part of genome10K.fasta
42+
CATCGATGCGAGACGCCTGTCGCGGGGAATTGTGGGGCGGACCACGCTCTGGCTAACGAGCTACCGTTTCCTTTAACCTGCCAGACGGTGACCAGGGCCGTTCGGCGTTGCATCGAGCGGTGTCGCTAGCGCAATGCGCAAGATTTTGACATTTACAAGGCAACATTGCAGCGTCCGATGGTCCGGTGGCCTCCAGATAGTGTCCAGTCGCTCTAACTGTATGGAGACCATAGGCATTTACCTTATTCTCATCGCCACGCCCCAAGATCTTTAGGACCCAGCATTCCTTTAACCACTAACATAACGCGTGTCATCTAGTTCAACAACC
43+
>remaining part
44+
TGTCATCTAGTTCAACAACCGTTATGCCGTCCGACTCTTGCGCTCGGATGTCCGCAATGGGTTATCCCTATGTTCCGGTAATCTCTCATCTACTAAGCGCCCTAAAGGTCGTATGGTTGGAGGGCGGTTACACACCCTTAAGTACCGAACGATAGAGCACCCGTCTAGGAGGGCGTGCAGGGTCTCCCGCTAGCTAATGGTCACGGCCTCTCTGGGAAAGCTGAACAACGGATGATACCCATACTGCCACTCCAGTACCTGGGCCGCGTGTTGTACGCTGTGTATCTTGAGAGCGTTTCCAGCAGATAGAACAGGATCACATGTACATG
45+
>works well for k=21; part of genome10K.fasta
46+
CATCGATGCGAGACGCCTGTCGCGGGGAATTGTGGGGCGGACCACGCTCTGGCTAACGAGCTACCGTTTCCTTTAACCTGCCAGACGGTGACCAGGGCCGTTCGGCGTTGCATCGAGCGGTGTCGCTAGCGCAATGCGCAAGATTTTGACATTTACAAGGCAACATTGCAGCGTCCGATGGTCCGGTGGCCTCCAGATAGTGTCCAGTCGCTCTAACTGTATGGAGACCATAGGCATTTACCTTATTCTCATCGCCACGCCCCAAGATCTTTAGGACCCAGCATTCCTTTAACCACTAACATAACGCGTGTCATCTAGTTCAACAACC
47+
>remaining part
48+
TGTCATCTAGTTCAACAACCGTTATGCCGTCCGACTCTTGCGCTCGGATGTCCGCAATGGGTTATCCCTATGTTCCGGTAATCTCTCATCTACTAAGCGCCCTAAAGGTCGTATGGTTGGAGGGCGGTTACACACCCTTAAGTACCGAACGATAGAGCACCCGTCTAGGAGGGCGTGCAGGGTCTCCCGCTAGCTAATGGTCACGGCCTCTCTGGGAAAGCTGAACAACGGATGATACCCATACTGCCACTCCAGTACCTGGGCCGCGTGTTGTACGCTGTGTATCTTGAGAGCGTTTCCAGCAGATAGAACAGGATCACATGTACATG
49+

tools/odgi/build.xml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -23,8 +23,8 @@ $sort
2323
help="" />
2424
</inputs>
2525
<outputs>
26-
<data name="odgi_output" format="odgi" />
27-
<data name="gfa_output" format="gfa1">
26+
<data name="odgi_output" format="odgi" label="${tool.name} on ${on_string}: odgi" />
27+
<data name="gfa_output" format="gfa1" label="${tool.name} on ${on_string}: GFA">
2828
<filter>to_gfa</filter>
2929
</data>
3030
</outputs>

tools/odgi/vis.xml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -37,7 +37,7 @@ $path_per_row
3737
label="Show thin links of this relative width to connect path pieces" />
3838
</inputs>
3939
<outputs>
40-
<data name="output" format="png" />
40+
<data name="output" format="png" label="${tool.name} on ${on_string}" />
4141
</outputs>
4242
<tests>
4343
<test>

0 commit comments

Comments
 (0)