Skip to content

Commit f6d1167

Browse files
committed
udpate gtdbtk and make it run again
1 parent d86386f commit f6d1167

2 files changed

Lines changed: 39 additions & 10 deletions

File tree

tools/gtdbtk/gtdbtk_classify_wf.xml

Lines changed: 37 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -12,24 +12,35 @@
1212
1313
mkdir input_dir &&
1414
mkdir output_dir &&
15+
mkdir scratch_dir &&
16+
mkdir tmp_dir &&
1517
#for $i in $input:
1618
## gtdbtk uses the file extension to determine the input format.
17-
#set ext = "." + $i.ext
18-
#set input_identifier = re.sub('[^\w\-.]', '_', str($i.element_identifier)) + $ext
19+
#set ext = $i.ext
20+
#if $ext.endswith(".gz")
21+
#set ext = "gz"
22+
#end if
23+
#set input_identifier = re.sub('[^\w\-.]', '_', str($i.element_identifier)) + "." + $ext
1924
ln -s '${i}' input_dir/'${input_identifier}' &&
2025
#end for
2126
export GTDBTK_DATA_PATH=$gtdbtk_db.fields.path &&
2227
gtdbtk classify_wf
2328
--genome_dir input_dir
2429
--extension '$ext'
2530
--out_dir output_dir
31+
--prefix gtdbtk
2632
--cpus "\${GALAXY_SLOTS:-4}"
33+
--tmpdir tmp_dir
34+
$advanced.place_species
2735
--min_perc_aa $advanced.min_perc_aa
36+
$advanced.genes
37+
--pplacer_cpus "\${GALAXY_SLOTS:-4}"
2838
$advanced.force
39+
--scratch_dir scratch_dir
40+
$advanced.write_single_copy_genes
41+
--keep_intermediates
2942
--min_af $advanced.min_af
30-
$full_tree
31-
## Required unless mash_db is available:
32-
--skip_ani_screen
43+
$advanced.full_tree
3344
3445
#if str($advanced.output_process_log) == 'yes':
3546
&& cat output_dir/gtdbtk.warnings.log output_dir/gtdbtk.log > '$process_log'
@@ -44,16 +55,19 @@ $full_tree
4455
</options>
4556
</param>
4657
<section name="advanced" title="Advanced options">
58+
<param argument="--place_species" type="boolean" truevalue="--place_species" falsevalue="" checked="false" label="Place species in pplacer trees even if they are classified with skani?"/>
4759
<param argument="--min_perc_aa" type="integer" min="0" max="100" value="10" label="Exclude genomes that do not have at least this percentage of AA in the MSA" help="Inclusive bound"/>
60+
<param argument="--genes" type="boolean" truevalue="--genes" falsevalue="" checked="false" label="Input files contain predicted proteins as amino acids?" help="This skips gene calling, ANI screening, and ANI classification."/>
4861
<param argument="--force" type="boolean" truevalue="--force" falsevalue="" checked="false" label="Continue processing if an error occurs on a single genome?"/>
49-
<param argument="--min_af" type="float" min="0" max="1" value="0.65" label="Minimum alignment fraction to consider closest genome"/>
62+
<param argument="--write_single_copy_genes" type="boolean" truevalue="--write_single_copy_genes" falsevalue="" checked="false" label="Output unaligned single-copy marker genes?"/>
63+
<param argument="--min_af" type="float" min="0" max="1" value="0.5" label="Minimum alignment fraction to assign genome to a species cluster"/>
5064
<param argument="--full_tree" type="boolean" truevalue="--full_tree" falsevalue="" checked="false" label="Use the full tree" help="Use the unsplit bacterial tree for the classify step; this is the original GTDB-Tk approach (version &lt; 2) and requires more than 320 GB of RAM to load the reference tree (default: False)"/>
5165
<param name="output_process_log" type="boolean" truevalue="yes" falsevalue="no" checked="false" label="Output process log file?"/>
5266
</section>
5367
</inputs>
5468
<outputs>
5569
<data name="process_log" format="txt" label="${tool.name} on ${on_string} (process log)">
56-
<filter>advanced['output_process_log']</filter>
70+
<filter>advanced['output_process_log'] == 'yes'</filter>
5771
</data>
5872
<collection name="output_align" type="list" format="fasta.gz" label="${tool.name} on ${on_string} (align)">
5973
<discover_datasets pattern="(?P&lt;designation&gt;.+)\.fasta.gz" ext="fasta.gz" directory="output_dir/align"/>
@@ -130,6 +144,22 @@ $full_tree
130144
<test expect_failure="true">
131145
<param name="input" value="genome_1.fna.gz" ftype="fasta.gz"/>
132146
<param name="gtdbtk_db" value="gtdbtk214"/>
147+
<section name="advanced">
148+
<param name="place_species" value="true"/>
149+
<param name="genes" value="true"/>
150+
<param name="force" value="true"/>
151+
<param name="write_single_copy_genes" value="true"/>
152+
</section>
153+
<assert_command>
154+
<has_text text="--prefix gtdbtk"/>
155+
<has_text text="--place_species"/>
156+
<has_text text="--genes"/>
157+
<has_text text="--pplacer_cpus"/>
158+
<has_text text="--force"/>
159+
<has_text text="--write_single_copy_genes"/>
160+
<has_text text="--keep_intermediates"/>
161+
<has_text text="--skip_ani_screen" negate="true"/>
162+
</assert_command>
133163
<assert_stderr>
134164
<has_text text="Fatal error: Exit code 1"/>
135165
</assert_stderr>
@@ -162,4 +192,3 @@ Results can be impacted by a lack of marker genes or contamination.
162192
]]></help>
163193
<expand macro="citations"/>
164194
</tool>
165-

tools/gtdbtk/macros.xml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
<macros>
2-
<token name="@TOOL_VERSION@">2.7.1</token>
2+
<token name="@TOOL_VERSION@">2.7.2</token>
33
<token name="@VERSION_SUFFIX@">0</token>
4-
<token name="@PROFILE@">22.05</token>
4+
<token name="@PROFILE@">24.0</token>
55
<xml name="requirements">
66
<requirements>
77
<requirement type="package" version="@TOOL_VERSION@">gtdbtk</requirement>

0 commit comments

Comments
 (0)