Skip to content

Commit 911bc48

Browse files
committed
Compleasm: use symlink instead of copying busco data
1 parent 273fabe commit 911bc48

24 files changed

+19008
-334
lines changed

tools/compleasm/compleasm.xml

+24-15
Original file line numberDiff line numberDiff line change
@@ -11,17 +11,17 @@
1111
</requirements>
1212
<version_command>compleasm --version</version_command>
1313
<command><![CDATA[
14-
15-
mkdir -p galaxy_db &&
16-
cp -r '${busco_database.fields.path}/lineages/${lineage_dataset}/' 'galaxy_db/' &&
14+
mkdir -p 'galaxy_db/' &&
15+
ln -s '${busco_database.fields.path}/lineages/${lineage_dataset}/' 'galaxy_db/${lineage_dataset}' &&
16+
touch 'galaxy_db/${lineage_dataset}.done' &&
1717
1818
compleasm run
1919
-a '$input'
2020
-o galaxy_output
2121
--mode $mode
2222
-L 'galaxy_db'
2323
-l '$lineage_dataset'
24-
-t "\${GALAXY_SLOTS:-1}"
24+
-t "\${GALAXY_SLOTS:-1}"
2525
2626
#if str($specified_contigs) != '':
2727
--specified_contigs '$specified_contigs'
@@ -43,7 +43,7 @@
4343
</sanitizer>
4444
<validator type="regex">[0-9a-zA-Z_ ]+</validator>
4545
</param>
46-
46+
4747
<param name="outputs" type="select" multiple="true" label="Which outputs should be generated">
4848
<option value="full_table_busco" selected="true">full busco table</option>
4949
<option value="full_table">full table</option>
@@ -72,26 +72,32 @@
7272
</data>
7373
<data name='translated_protein' format='fasta' label="${tool.name} on ${on_string}: Translated protein" from_work_dir="galaxy_output/*_odb10/translated_protein.fasta">
7474
<filter>outputs and 'translated_protein' in outputs</filter>
75-
</data>
75+
</data>
7676
</outputs>
7777

7878
<tests>
7979
<test expect_num_outputs="4">
8080
<param name="input" value="small_genome.fasta"/>
8181
<param name="mode" value="busco"/>
8282
<param name="outputs" value="full_table_busco,full_table,miniprot,translated_protein"/>
83-
<param name="busco_database" value="eukaryota_odb10"/>
84-
<param name="lineage_dataset" value="eukaryota_odb10"/>
83+
<param name="busco_database" value="entomoplasmatales_odb10"/>
84+
<param name="lineage_dataset" value="entomoplasmatales_odb10"/>
8585
<output name="full_table_busco">
8686
<assert_contents>
8787
<has_text text="Busco id"/>
88-
<has_text text="Missing"/>
88+
<has_text text="496at186328&#009;Missing"/>
89+
<has_text text="165at186328&#009;Complete"/>
90+
<has_text text="421at186328&#009;Complete"/>
91+
<has_text text="90at186328&#009;Complete"/>
8992
</assert_contents>
9093
</output>
9194
<output name="full_table">
9295
<assert_contents>
93-
<has_text text="Gene"/>
94-
<has_text text="Missing"/>
96+
<has_text text="Gene&#009;Status"/>
97+
<has_text text="496at186328&#009;Missing"/>
98+
<has_text text="165at186328&#009;Single"/>
99+
<has_text text="421at186328&#009;Single"/>
100+
<has_text text="90at186328&#009;Single"/>
95101
</assert_contents>
96102
</output>
97103
<output name="miniprot">
@@ -101,19 +107,22 @@
101107
</output>
102108
<output name="translated_protein">
103109
<assert_contents>
104-
<has_text text="GGWLIGNGGAGGSGAAGVNGGAGGNGGAGGNGGAGG"/>
105-
<has_text text="AAVFADRGAHVVLAVRNLEKGNAARARIMAARPGAHVTLQQLDLCSLDSVRAAADALRTAYPRIDVLINNAGVMW"/>
110+
<has_text text="EKDFYQELGVSSDASPEEIKRAYRKLARDLHPDANPGNPAA"/>
111+
<has_text text="AASITILEGLEAVRKRPGMYIGSTGERGLHHLIWEVVD"/>
106112
</assert_contents>
107113
</output>
114+
<assert_stdout>
115+
<has_text text="S:1.20%, 4"/>
116+
</assert_stdout>
108117
</test>
109118
</tests>
110119
<help><![CDATA[
111120
112-
compleasm_ assesses genome completeness based on genome assembly.
121+
compleasm_ assesses genome completeness based on genome assembly.
113122
114123
.. _compleasm: https://github.com/huangnengCSU/compleasm
115124
116-
]]>
125+
]]>
117126
</help>
118127
<expand macro="citation"/>
119128
</tool>

tools/compleasm/macros.xml

+2-2
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,10 @@
11
<macros>
22
<token name="@TOOL_VERSION@">0.2.6</token>
3-
<token name="@VERSION_SUFFIX@">1</token>
3+
<token name="@VERSION_SUFFIX@">2</token>
44

55
<xml name="citation">
66
<citations>
7-
<citation type="doi">10.1101/2023.06.03.543588</citation>
7+
<citation type="doi">10.1101/2023.06.03.543588</citation>
88
</citations>
99
</xml>
1010

tools/compleasm/test-data/busco_database.loc

+2-2
Original file line numberDiff line numberDiff line change
@@ -2,5 +2,5 @@
22
# - value
33
# - name
44
# - version
5-
# - /path/to/data
6-
eukaryota_odb10 eukaryota 5.4.6 ${__HERE__}/test-db/busco_downloads
5+
# - /path/to/data
6+
entomoplasmatales_odb10 entomoplasmatales 5.4.6 ${__HERE__}/test-db/busco_downloads

tools/compleasm/test-data/test-db/busco_downloads/information/lineages_list.2021-12-14.txt

-199
This file was deleted.

0 commit comments

Comments
 (0)