annotate cfsan_bettercallsal.xml @ 0:0a8dda29956e draft default tip

planemo upload
author galaxytrakr
date Thu, 28 May 2026 20:41:10 +0000
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
0a8dda29956e planemo upload
galaxytrakr
parents:
diff changeset
<tool id="hfp_bettercallsal_konda" name="bettercallsal" version="1.0.0+galaxy21">
<!-- Galaxy wrapper around the CPIPES bettercallsal Nextflow pipeline. -->
<description>An automated workflow to assign Salmonella serotype based on NCBI Pathogen Detection Project for Salmonella.</description>
<!-- Packages that must be resolvable on the job's PATH before the command runs. -->
<requirements>
    <requirement type="package" version="24.04.3">nextflow</requirement>
    <requirement type="package" version="1.5.8">micromamba</requirement>
    <requirement type="package">graphviz</requirement>
</requirements>
<version_command>nextflow -version</version_command>
<command detect_errors="exit_code"><![CDATA[
    ## Stage every input dataset inside ./cpipes-input under a FASTQ-style file name.
    input_path=\$(pwd)"/cpipes-input";
    mkdir -p "\${input_path}" || exit 1;
    #set $read_type = str($input_read_type_cond.input_read_type)
    #if $read_type in ("single_long", "long_long"):
        #for $unpaired in $input_read_type_cond.input:
            #set $read1 = str($unpaired.name)
            ## Append the datatype extension when the dataset name does not already carry one.
            #if not str($unpaired.name).endswith(('.fastq', '.fastq.gz')):
                #set $read1_ext = str($unpaired.ext).replace('fastqsanger', 'fastq')
                #set $read1 = str($unpaired.name) + '.' + $read1_ext
            #end if
            ln -sf '$unpaired' "\${input_path}/$read1";
        #end for
    #elif $read_type == "paired":
        #for $pair in $input_read_type_cond.input_pair:
            ## Turn the ":forward" / ":reverse" markers of the dataset names into "_forward" / "_reverse".
            #set $read_R1 = str($pair.forward.name).replace(':forward', '_forward')
            #set $read_R2 = str($pair.reverse.name).replace(':reverse', '_reverse')
            #set $read_R1_ext = str($pair.forward.ext).replace('fastqsanger', 'fastq')
            #set $read_R2_ext = str($pair.reverse.ext).replace('fastqsanger', 'fastq')
            #if not str($pair.forward.name).endswith(('.fastq', '.fastq.gz')):
                #set $read_R1 = $read_R1 + '.' + $read_R1_ext
            #end if
            #if not str($pair.reverse.name).endswith(('.fastq', '.fastq.gz')):
                #set $read_R2 = $read_R2 + '.' + $read_R2_ext
            #end if
            ln -sf '$pair.forward' "\${input_path}/$read_R1";
            ln -sf '$pair.reverse' "\${input_path}/$read_R2";
        #end for
    #end if

    ## Run the pipeline. Long reads use the bettercallsal_lr variant.
    '$__tool_directory__/1.0.0/cpipes'
        #if $read_type == "long_long":
            --pipeline bettercallsal_lr
        #else
            --pipeline bettercallsal
        #end if
        --input "\${input_path}"
        --output cpipes-output
        --fq_suffix '${input_read_type_cond.fq_suffix}'
        #if $read_type == "paired":
            --fq_single_end false --fq2_suffix '${input_read_type_cond.fq2_suffix}'
        #else
            --fq_single_end true
        #end if
        ## tuspy_n is optional: omit the flag instead of passing it without a value.
        #if str($tuspy_n).strip():
            --tuspy_n $tuspy_n
        #end if
        #if str($sourmash_cond.run) == "true":
            --sfhpy_fcv $sourmash_cond.sfhpy_fcv
        #end if
        ## The KMA identity threshold is only passed for non-relaxed short-read runs, and only when set.
        #if str($bcs_thresholds) != "relax" and $read_type != "long_long" and str($kma_id).strip():
            --kmaalign_ID $kma_id
        #end if
        --bcs_db_mode $bcs_db_mode
        --bcs_thresholds $bcs_thresholds
        --fq_filename_delim '${fq_filename_delim}'
        --fq_filename_delim_idx $fq_filename_delim_idx
        -profile kondagac || exit 1;

    ## Expose the MultiQC report to Galaxy, then drop the pipeline's output and work directories.
    #if $read_type == "long_long":
        mv './cpipes-output/bettercallsal_lr-multiqc/CPIPES-Report_multiqc_report.html' './multiqc_report.html' || exit 1;
    #else
        mv './cpipes-output/bettercallsal-multiqc/CPIPES-Report_multiqc_report.html' './multiqc_report.html' || exit 1;
    #end if
    rm -rf ./cpipes-output || exit 1;
    rm -rf ./work || exit 1;
]]></command>
<inputs>
    <!-- Read layout: selects which collection input is shown and which pipeline variant the command runs. -->
    <conditional name="input_read_type_cond">
        <param name="input_read_type" type="select" label="Select the read collection type">
            <option value="single_long" selected="true">Single-End short reads</option>
            <option value="paired">Paired-End short reads</option>
            <option value="long_long">Long reads</option>
        </param>
        <when value="single_long">
            <param name="input" type="data_collection" collection_type="list" format="fastq,fastq.gz"
                   label="Dataset list of unpaired short reads"/>
            <param name="fq_suffix" value=".fastq.gz" type="text" label="Suffix of the Single-End FASTQ"/>
        </when>
        <when value="long_long">
            <param name="input" type="data_collection" collection_type="list" format="fastq,fastq.gz"
                   label="Dataset list of long reads"/>
            <param name="fq_suffix" value=".fastq.gz" type="text" label="Suffix of the long read FASTQ"/>
        </when>
        <when value="paired">
            <param name="input_pair" type="data_collection" collection_type="list:paired" format="fastq,fastq.gz"
                   label="List of Dataset pairs"/>
            <param name="fq_suffix" value="_R1_001.fastq.gz" type="text" label="Suffix of the R1 FASTQ"
                   help="For any data sets downloaded from NCBI into Galaxy, change this to _forward.fastq.gz suffix."/>
            <param name="fq2_suffix" value="_R2_001.fastq.gz" type="text" label="Suffix of the R2 FASTQ"
                   help="For any data sets downloaded from NCBI into Galaxy, change this to _reverse.fastq.gz suffix."/>
        </when>
    </conditional>
    <param name="bcs_db_mode" type="select" label="Select the database mode with bettercallsal"
           help="Refer to `Database generation` section in our manuscript: https://doi.org/10.3389/fmicb.2023.1200983">
        <option value="snp" selected="true">per_snp_cluster</option>
        <option value="comp">per_computed_type</option>
    </param>
    <param name="tuspy_n" optional="true" value="10" type="integer"
           label="Enter the number of top unique serotypes to retain after initial MASH screen step"
           help="The default value of 10 is suitable for almost all scenarios."/>
    <param name="bcs_thresholds" type="select"
           label="Enter the type of base quality thresholds to be set with bettercallsal"
           help="The default value sets strictest thresholds that tend to filter out most of the false positive hits.">
        <option value="strict" selected="true">strict</option>
        <option value="relax">relax</option>
    </param>
    <!-- Numeric values are declared as float so Galaxy validates them before they reach the shell command. -->
    <param name="kma_id" optional="true" value="10.0" type="float" min="0" max="100"
           label="Enter the %ID threshold for KMA alignments of samples against genomes"
           help="The default value of 10% works well for enrichment samples tested within FDA. The 'relax' preset for base quality thresholds automatically sets this value to 5%."/>
    <conditional name="sourmash_cond">
        <param name="run" type="select" label="Run sourmash"
               help="Should sourmash be used for additional genome fraction filtering">
            <option value="true" selected="true">yes</option>
            <option value="false">no</option>
        </param>
        <when value="true">
            <param name="sfhpy_fcv" type="float" value="0.1" min="0" max="1"
                   label="Enter the minimum coverage match with sourmash before a serotype hit is considered for further processing"
                   help="The default value is set at 10% coverage threshold."/>
        </when>
        <when value="false">
            <!-- Placeholder only: the command does not read this value when sourmash is disabled. -->
            <param name="sfhpy_fcv" type="select"
                   label="Enter the minimum coverage match with sourmash before a serotype hit is considered for further processing"
                   help="THIS OPTION IS IGNORED IF SOURMASH TOOL IS NOT RUN.">
                <option value="NA" selected="true">N/A</option>
            </param>
        </when>
    </conditional>
    <param name="fq_filename_delim" type="text" value="_"
           label="File name delimiter by which samples are grouped together (--fq_filename_delim)"
           help="This is the delimiter by which samples are grouped together to display in the final MultiQC report. For example, if your input data sets are mango_replicate1.fastq.gz, mango_replicate2.fastq.gz, orange_replicate1_maryland.fastq.gz, orange_replicate2_maryland.fastq.gz, then to create 2 samples mango and orange, the value for --fq_filename_delim would be _ (underscore) and the value for --fq_filename_delim_idx would be 1, since you want to group by the first word (i.e. mango or orange) after splitting the filename based on _ (underscore)."/>
    <param name="fq_filename_delim_idx" type="integer" value="1"
           label="File name delimiter index (--fq_filename_delim_idx)"/>
    <!-- <param name="runtime_profile" type="select" label="Run time profile">
        <option value="kondagac" selected="true">conda</option>
        <option value="cingularitygac">singularity</option>
    </param> -->
</inputs>
<outputs>
    <!-- Single output: the report that the command moves to ./multiqc_report.html in the job directory. -->
    <data name="multiqc_report" format="html" label="bettercallsal: MultiQC Report on ${on_string}" from_work_dir="multiqc_report.html"/>
</outputs>
<tests>
    <!-- Test 01: long reads. The tool declares exactly one output (multiqc_report). -->
    <test expect_num_outputs="1">
        <!-- Select the long read branch explicitly; the default branch is single-end short reads. -->
        <conditional name="input_read_type_cond">
            <param name="input_read_type" value="long_long"/>
            <param name="input">
                <collection type="list">
                    <element name="FAL11127.fastq.gz" value="FAL11127.fastq.gz"/>
                    <element name="FAL11341.fastq.gz" value="FAL11341.fastq.gz"/>
                    <element name="FAL11342.fastq.gz" value="FAL11342.fastq.gz"/>
                </collection>
            </param>
            <param name="fq_suffix" value=".fastq.gz"/>
        </conditional>
        <output name="multiqc_report" file="multiqc_report.html" ftype="html" compare="sim_size"/>
        <!-- <output name="assembled_mags" file="FAL11127.assembly_filtered.contigs.fasta" ftype="fasta" compare="sim_size"/> -->
    </test>
</tests>
<help><![CDATA[

.. class:: infomark

**Purpose**

bettercallsal is an automated workflow to assign Salmonella serotype based on NCBI Pathogen Detection Project for Salmonella.
It uses MASH to reduce the search space followed by additional genome filtering with sourmash. It then performs genome based
alignment with kma followed by count generation using salmon. This workflow can be used to analyze shotgun metagenomics
datasets, quasi-metagenomic datasets (enriched for Salmonella) and target enriched datasets (enriched with molecular baits specific for Salmonella)
and is especially useful when a sample is a multi-serovar mixture.

It is written in Nextflow and is part of the modular data analysis pipelines (CFSAN PIPELINES or CPIPES for short) at CFSAN.


----

.. class:: infomark

**Testing and Validation**

The CPIPES - bettercallsal Nextflow pipeline has been wrapped to make it work in Galaxy. It takes a list of paired or unpaired short reads, or a list of long reads, as input
and generates a MultiQC report in the final step. The pipeline has been tested on 2x300 bp MiSeq and 2x150 bp NextSeq simulated reads and has been shown to call multiple
Salmonella serotypes with up to ~95% accuracy. The pipeline has also been tested on metagenomics data sets from Peach and Papaya outbreaks as discussed in
our publication (https://www.frontiersin.org/articles/10.3389/fmicb.2023.1200983/full). All the original testing and validation was
done on the command line on the CFSAN Raven2 HPC Cluster.


----

.. class:: infomark

**Outputs**

The main output file is:

::

    - MultiQC Report: Contains a brief summary report including any serotyping and AMR result tables.
      Please note that due to MultiQC customizations, the preview (eye icon) will not
      work within Galaxy for the MultiQC report. Please download the file by clicking
      on the floppy icon and view it in your browser on your local desktop/workstation.
      You can export the tables and plots from the downloaded MultiQC report.

]]></help>
<!-- Publication describing the bettercallsal workflow. -->
<citations>
    <citation type="bibtex">
        @article{bettercallsal,
        author = {Konganti, Kranti},
        year = {2023},
        month = {August},
        title = {bettercallsal: better calling of Salmonella serotypes from enrichment cultures using shotgun metagenomic profiling and its application in an outbreak setting},
        journal = {Frontiers in Microbiology},
        doi = {10.3389/fmicb.2023.1200983},
        url = {https://www.frontiersin.org/articles/10.3389/fmicb.2023.1200983/full}}
    </citation>
</citations>
</tool>