Mercurial > repos > jpayne > seqsero2s
changeset 0:a9790ce778af draft default tip
planemo upload commit 233f498f942f9253a7e6e1656157e59d38549c44-dirty
| author | jpayne |
|---|---|
| date | Mon, 29 Sep 2025 20:04:28 +0000 |
| parents | |
| children | |
| files | job_conf.yml seqsero2S.xml test-data/.gitmodules tool-data/all_fasta.loc.sample |
| diffstat | 4 files changed, 247 insertions(+), 0 deletions(-) [+] |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/job_conf.yml Mon Sep 29 20:04:28 2025 +0000 @@ -0,0 +1,37 @@ +runners: + local: + load: galaxy.jobs.runners.local:LocalJobRunner + workers: 16 + +# handling: +# processes: +# handler0: + +execution: + default: local + environments: + local: + runner: local + docker_local: + runner: local + docker_enabled: true + # container: "auto" + docker_volumes: $defaults + # docker_set_user: null + docker_run_extra_arguments: "--entrypoint ''" + docker_set_user: root + +tools: +- id: seqsero_v2 + # handler: handler0 + environment: docker_local +- id: seqsero2s + # handler: handler0 + environment: docker_local + +limits: +- + # Amount of time a job can run (in any environment) before it + # will be terminated by Galaxy. + type: walltime + value: '01:00:00' \ No newline at end of file
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/seqsero2S.xml Mon Sep 29 20:04:28 2025 +0000 @@ -0,0 +1,197 @@ +<tool id="seqsero2s" name="SeqSero2S" version="1"> + <description>Simplified Salmonella serotype prediction</description> + <requirements> + <!-- <requirement type="package" version="@VERSION@">seqsero2s</requirement> --> + <container type="docker">quay.io/biocontainers/seqsero2s:1.1.3--pyhdfd78af_0</container> + </requirements> + <command detect_errors="exit_code"><![CDATA[ + mkdir ./output; + + #if $reads.reads_select == 'history' + #set $name = $reads.forward.name.split('.')[0].replace(' ','_') + #set $forward = $reads.forward + #set $reverse = $reads.reverse + #set $infile = $name + "_1.fastq " + $name + "_2.fastq" + #set $tval = 2 + #if $reverse.is_of_type('fastq.gz', 'fastqsanger.gz') + gunzip -c $reverse > reverse.fastq; + #set $reverse = './reverse.fastq' + gunzip -c $forward > forward.fastq; + #set $forward = './forward.fastq' + #end if + ln -s $forward ${name}_1.fastq; + ln -s $reverse ${name}_2.fastq; + #else if $reads.reads_select == 'collection' + #set $name = $reads.coll.name.replace(' ', '_') + #set $forward = $reads.coll.forward + #set $reverse = $reads.coll.reverse + #set $infile = $name + "_1.fastq " + $name + "_2.fastq" + #set $tval = 2 + #if $reverse.is_of_type('fastq.gz', 'fastqsanger.gz') + gunzip -c $reverse > reverse.fastq; + #set $reverse = './reverse.fastq' + gunzip -c $forward > forward.fastq; + #set $forward = './forward.fastq' + #end if + ln -s $forward ${name}_1.fastq; + ln -s $reverse ${name}_2.fastq; + #else + #set $name = $reads.assembly.name.replace(' ', '_') + #set $ga = $reads.assembly + #set $infile = $name + ".fasta" + ln -s $ga ${name}.fasta; + #set $tval = 4 + #set $mode='k' + #end if + echo $name ; + echo "-=-=-=-=-" ; + touch output/SeqSero_log.txt ; + /usr/local/bin/SeqSero2S.py --version ; + echo "-=-=-=-=-" ; + /usr/local/bin/SeqSero2S.py + -p \${GALAXY_SLOTS:-1} + -t $tval + -m $mode + -d ./output + #if $mode == 'a': + -b $maptype + #end if + -i $infile && + echo "-=-=-=-=-" && + cat output/SeqSero_log.txt && + echo "-=-=-=-=-" && + ls -lah ./output + ]]></command> + <inputs> + + <conditional name="reads"> + <param name="reads_select" type="select" label="Genome assembly,paired-end collection, or two datasets from your history"> + <option value="collection">Paired collection from your history</option> + <option value="history">Two FASTQ datasets from your history</option> + <option value="genome">Genome Assembly</option> + </param> + <when value="collection"> + <param label="Paired reads" name="coll" type="data_collection" format="fastq,fastqsanger,fastq.gz,fastqsanger.gz" collection_type="paired" /> + </when> + <when value="history"> + <param label="Forward reads" type="data" name="forward" format="fastq,fastqsanger,fastq.gz,fastqsanger.gz" /> + <param label="Reverse reads" type="data" name="reverse" format="fastq,fastqsanger,fastq.gz,fastqsanger.gz" /> + </when> + <when value="genome"> + <param label="Genome assembly" name="assembly" type="data" format="fasta"/> + </when> + </conditional> + + <!-- <param name="fastq1" type="data" format="fastq" label="FASTQ paired end read 1" /> + <param name="fastq2" type="data" format="fastq" label="FASTQ paired end read 2" /> --> + <!-- <param name="numofthr" type="select" label="Number of threads"> + <option value="1">1</option> + <option value="2">2</option> + <option value="3">3</option> + <option value="4">4</option> --> + <!-- </param> --> + + <param label="Analysis mode" type="select" name="mode"> + <option value="a">allele mode</option> + <option value="k">k-mer mode</option> + </param> + + <param name="maptype" type="select" label="Algorithms for BWA mapping"> + <option value="mem">mem</option> + <option value="sam">sam</option> + </param> + + + + </inputs> + <outputs> + <data format="tabular" label="SeqSero Results" name="results" from_work_dir="output/SeqSero_result.tsv" /> + </outputs> + <tests> + <!-- <test> + <param name="reads_select" value="history" /> + <param name="forward" value="forward.fastq.gz" ftype="fastqsanger.gz" /> + <param name="reverse" value="reverse.fastq.gz" ftype="fastqsanger.gz" /> + <output name="results" file="Seqsero_result.tsv" /> + </test> + <test> + <param name="reads_select" value="collection" /> + <param name="coll"> + <collection type="paired"> + <element name="forward" value="forward.fastq.gz" ftype="fastqsanger.gz" /> + <element name="reverse" value="reverse.fastq.gz" ftype="fastqsanger.gz" /> + </collection> + </param> + <output name="results" file="Seqsero_result.tsv" /> + </test> --> + <!-- <test> + <param name="mode" value="k" /> + <param name="reads_select" value="history" /> + <param name="forward" value="forward_25k.fastq.gz" ftype="fastqsanger" /> + <param name="reverse" value="reverse_25k.fastq.gz" ftype="fastqsanger" /> + <output name="results" file="Seqsero_result_25k.tsv" /> + </test> + <test> + <param name="mode" value="k" /> + <param name="reads_select" value="collection" /> + <param name="coll"> + <collection type="paired"> + <element name="forward" value="forward_25k.fastq.gz" ftype="fastqsanger.gz" /> + <element name="reverse" value="reverse_25k.fastq.gz" ftype="fastqsanger.gz" /> + </collection> + </param> + <output name="results" file="Seqsero_result_25k_coll.tsv" /> + </test> + <test> + <param name="mode" value="a" /> + <param name="reads_select" value="history" /> + <param name="forward" value="forward_250k.fastq.gz" ftype="fastqsanger" /> + <param name="reverse" value="reverse_250k.fastq.gz" ftype="fastqsanger" /> + <assert_stdout> + <has_text text="input genome cannot be identified as Salmonella" /> + </assert_stdout> + </test> --> + <!-- <test> + <param name="mode" value="a" /> + <param name="reads_select" value="collection" /> + <param name="coll"> + <collection type="paired"> + <element name="forward" value="forward_25k.fastq.gz" ftype="fastqsanger.gz" /> + <element name="reverse" value="reverse_25k.fastq.gz" ftype="fastqsanger.gz" /> + </collection> + </param> + <output name="results" file="Seqsero_result_allele.tsv" /> + </test> --> + <test> + <param name="mode" value="k" /> + <param name="reads_select" value="genome" /> + <param name="assembly" value="test/taxonomy/salmonella/contigs.fa" ftype="fasta" /> + <output name="results" file="test/taxonomy/salmonella/SeqSero_result/SeqSero_result.tsv" /> + </test> + </tests> + <help><![CDATA[ + +**Usage: SeqSero2.py** + +**Algorithms for BWA mapping** + +'mem' for mem, 'sam' for samse/sampe; default=mem; optional; for now SeqSero2 is only optimized for "mem" mode + + ]]></help> + <citations> + <citation type="bibtex"> + @misc{zhang_yin_jones_zhang_deathrage_dinsmore_fitzgeral_fields_deng_2015, + title={Salmonella serotype determination utilizing high-throughput genome sequencing data.}, + journal={J Clin Microbiol}, publisher={ASM}, + author={Zhang S, Yin Y, Jones MB, Zhang Z, Deatherage Kaiser BL, Dinsmore BA, Fitzgerald C, Fields PI, Deng X.}, + year={2015}, month={Max}, + url={http://http://jcm.asm.org/content/early/2015/03/05/JCM.00323-15}}, + }</citation> + <citation type="bibtex"> + @misc{cfsan_biostatistics_group_2017, + title={CFSAN Biostatistics Group fork of SeqSero2}, + url={https://github.com/CFSAN-Biostatistics/SeqSero2.git}}, + </citation> + </citations> + +</tool>
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/.gitmodules Mon Sep 29 20:04:28 2025 +0000 @@ -0,0 +1,3 @@ +[submodule "test/csp2"] + path = test/csp2 + url = https://github.com/CFSAN-Biostatistics/CSP2_TestData.git
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/tool-data/all_fasta.loc.sample Mon Sep 29 20:04:28 2025 +0000 @@ -0,0 +1,10 @@ +#This file lists the locations and dbkeys of all the fasta files +#under the "genome" directory (a directory that contains a directory +#for each build). The script extract_fasta.py will generate the file +#all_fasta.loc. This file has the format (white space characters are +#TAB characters): +# +#<unique_build_id> <dbkey> <display_name> <file_path> +# +#So, all_fasta.loc could look something like this: +#test1 test1 Test-Genome ./test-data/test1.fa \ No newline at end of file
