annotate hfp_centriflaken.xml @ 0:082e0091e813 draft default tip

planemo upload
author galaxytrakr
date Fri, 29 May 2026 13:27:47 +0000
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
1 <tool id="hfp_centriflaken_awsbatch" name="centriflaken" version="0.4.2+awsbatch">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
2 <description>An automated pipeline to generate a MAG of interest (E.coli or Salmonella) and perform serotyping.</description>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
3 <requirements>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
4 <container type="docker">quay.io/galaxytrakr/mulled-v2-ebd88135862aa647eeae73d4d8e6ea8ec81245cd:v5.0</container>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
5 </requirements>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
6 <version_command>nextflow -version</version_command>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
7 <command detect_errors="exit_code"><![CDATA[
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
8 export MAMBA_ROOT_PREFIX="/server/galaxy/data/nextflow-micromamba-cache";
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
9 export NXF_HOME=\$(pwd)"/.nextflow-home";
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
10 input_path=\$(pwd)"/cpipes-input";
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
11 mkdir -p "\${input_path}" || exit 1;
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
12 #import re
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
13 #if (str($input_read_type_cond.input_read_type) == "single_long"):
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
14 #for _, $unpaired in enumerate($input_read_type_cond.input):
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
15 #set read1 = str($unpaired.name)
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
16 #if not str($unpaired.name).endswith(('.fastq', '.fastq.gz')):
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
17 #set read1_ext = re.sub('fastqsanger', 'fastq', str($unpaired.ext))
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
18 #set read1 = str($unpaired.name) + str('.') + $read1_ext
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
19 #end if
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
20 ln -sf '$unpaired' "\${input_path}/$read1";
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
21 #end for
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
22 #elif (str($input_read_type_cond.input_read_type) == "paired"):
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
23 #for _, $pair in enumerate($input_read_type_cond.input_pair)
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
24 #set read_R1 = re.sub('\:forward', '_forward', str($pair.forward.name))
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
25 #set read_R2 = re.sub('\:reverse', '_reverse', str($pair.reverse.name))
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
26 #set read_R1_ext = re.sub('fastqsanger', 'fastq', str($pair.forward.ext))
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
27 #set read_R2_ext = re.sub('fastqsanger', 'fastq', str($pair.reverse.ext))
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
28 #if not str($pair.forward.name).endswith(('.fastq', '.fastq.gz')):
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
29 #set read_R1 = $read_R1 + str('.') + $read_R1_ext
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
30 #end if
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
31 #if not str($pair.reverse.name).endswith(('.fastq', '.fastq.gz')):
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
32 #set read_R2 = $read_R2 + str('.') + $read_R2_ext
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
33 #end if
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
34 ln -sf '$pair.forward' "\${input_path}/$read_R1";
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
35 ln -sf '$pair.reverse' "\${input_path}/$read_R2";
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
36 #end for
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
37 #end if
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
38 $__tool_directory__/0.4.2/cpipes
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
39 --pipeline $input_read_type_cond.pipeline_cond.pipeline
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
40 #if ($input_read_type_cond.pipeline_cond.pipeline == "centriflaken"):
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
41 --fq_single_end true
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
42 --flye_genome_size '${genome_size}'
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
43 #if ($input_read_type_cond.pipeline_cond.long_read_platform == "nanopore_corr"):
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
44 --flye_nano_corr true --flye_nano_raw false
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
45 #elif ($input_read_type_cond.pipeline_cond.long_read_platform == "nanopore_hq"):
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
46 --flye_nano_hq true --flye_nano_raw false
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
47 #elif ($input_read_type_cond.pipeline_cond.long_read_platform == "pacbio_raw"):
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
48 --flye_pacbio_raw true --flye_nano_raw false
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
49 #elif ($input_read_type_cond.pipeline_cond.long_read_platform == "pacbio_corr"):
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
50 --flye_pacbio_corr true --flye_nano_raw false
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
51 #elif ($input_read_type_cond.pipeline_cond.long_read_platform == "pacbio_hifi"):
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
52 --flye_pacbio_hifi true --flye_nano_raw false
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
53 #end if
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
54 #elif ($input_read_type_cond.pipeline_cond.pipeline == "centriflaken_hy"):
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
55 #if (str($input_read_type_cond.input_read_type) == "single_long"):
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
56 --fq_single_end true
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
57 #elif (str($input_read_type_cond.input_read_type) == "paired"):
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
58 --fq_single_end false --fq2_suffix '${input_read_type_cond.fq2_suffix}'
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
59 #end if
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
60 #end if
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
61 --input \${input_path}
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
62 --output cpipes-output
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
63 --fq_suffix '${input_read_type_cond.fq_suffix}'
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
64 #if ($fq_filter_by_len != ""):
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
65 --fq_filter_by_len $fq_filter_by_len
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
66 #end if
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
67 --fq_filename_delim '${fq_filename_delim}'
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
68 --fq_filename_delim_idx $fq_filename_delim_idx
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
69 --centrifuge_extract_bug '${centrifuge_extract_bug}'
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
70 #if (str($input_read_type_cond.pipeline_cond.rm_dup_seqs) == "true"):
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
71 --seqkit_rmdup_run true
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
72 #end if
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
73 -profile stdkondagac;
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
74 mv "./cpipes-output/${input_read_type_cond.pipeline_cond.pipeline}-multiqc/CPIPES-Report_multiqc_report.html" "./multiqc_report.html" || exit 1;
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
75 mv "./cpipes-output/${input_read_type_cond.pipeline_cond.pipeline}-results/kraken2_extract_contigs" "kraken2_extract_contigs" || exit 1;
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
76 ]]></command>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
77 <inputs>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
78 <conditional name="input_read_type_cond">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
79 <param name="input_read_type" type="select" label="Select the read collection type">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
80 <option value="single_long" selected="true">Unpaired reads (i.e. Single-End short reads or Long reads)</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
81 <option value="paired">Paired-End reads</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
82 </param>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
83 <when value="single_long">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
84 <param name="input" type="data_collection" collection_type="list" format="fastq,fastq.gz"
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
85 label="Dataset list of unpaired short reads or long reads" />
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
86 <conditional name="pipeline_cond">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
87 <param name="pipeline" type="select" label="CPIPES Workflow name"
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
88 help="centriflaken: for long reads (Nanopore or PacBio). centriflaken_hy: for unpaired short reads. Default: centriflaken">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
89 <option value="centriflaken" selected="true">centriflaken</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
90 <option value="centriflaken_hy">centriflaken_hy</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
91 </param>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
92 <when value="centriflaken">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
93 <param name="long_read_platform" type="select" label="Mention long read sequencing platform and type">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
94 <option value="nanopore_raw" selected="true">Nanopore raw reads, pre-Guppy5 (&lt;20% error)</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
95 <option value="nanopore_corr">Nanopore reads that were corrected with other methods (&lt;3% error)</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
96 <option value="nanopore_hq">Nanopore high-quality reads, Guppy5+ SUP or Q20 (5% error)</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
97 <option value="pacbio_raw">PacBio regular CLR reads (&lt;20% error)</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
98 <option value="pacbio_corr">PacBio reads that were corrected with other methods (&lt;3% error)</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
99 <option value="pacbio_hifi">PacBio HiFi reads (&lt;1% error)</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
100 </param>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
101 <param name="rm_dup_seqs" type="select" label="Remove duplicate sequences"
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
102 help="THIS OPTION IS IGNORED IF THE INPUT READS ARE LONG READS.">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
103 <option value="NA" selected="true">N/A</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
104 </param>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
105 </when>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
106 <when value="centriflaken_hy">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
107 <param name="long_read_platform" type="select" label="Mention long read sequencing platform and type"
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
108 help="THIS OPTION IS IGNORED IF THE INPUT READS ARE SHORT READS.">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
109 <option value="NA" selected="true">N/A</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
110 </param>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
111 <param name="rm_dup_seqs" type="select" label="Remove duplicate sequences"
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
112 help="Selecting yes will compare sequence content and remove identical sequences i.e. only the first occured sequence record will be saved.">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
113 <option value="true">yes</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
114 <option value="false" selected="true">no</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
115 </param>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
116 </when>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
117 </conditional>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
118 <param name="fq_suffix" value=".fastq.gz" type="text" label="Suffix of the Unpaired FASTQ"/>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
119 </when>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
120 <when value="paired">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
121 <param name="input_pair" type="data_collection" collection_type="list:paired" format="fastq,fastq.gz" label="List of Dataset pairs" />
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
122 <conditional name="pipeline_cond">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
123 <param name="pipeline" type="select" label="CPIPES Workflow name"
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
124 help="Auto selected centriflaken_hy workflow for paired-end short reads.">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
125 <option value="centriflaken_hy" selected="true">centriflaken_hy</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
126 </param>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
127 <when value="centriflaken_hy">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
128 <param name="long_read_platform" type="select" label="Mention long read sequencing platform and type"
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
129 help="THIS OPTION IS IGNORED IF THE INPUT READS ARE SHORT READS.">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
130 <option value="NA" selected="true">N/A</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
131 </param>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
132 <param name="rm_dup_seqs" type="select" label="Remove duplicate sequences"
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
133 help="Selecting yes will compare sequence content and remove identical sequences i.e. only the first occured sequence record will be saved.">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
134 <option value="true">yes</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
135 <option value="false" selected="true">no</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
136 </param>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
137 </when>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
138 </conditional>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
139 <param name="fq_suffix" value="_R1_001.fastq.gz" type="text" label="Suffix of the R1 FASTQ"/>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
140 <param name="fq2_suffix" value="_R2_001.fastq.gz" type="text" label="Suffix of the R2 FASTQ"/>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
141 </when>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
142 </conditional>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
143 <param name="fq_filter_by_len" optional="true" value="" type="integer" label="Enter minimum read length to retain before starting the analysis"
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
144 help="Keep this option empty to use default values. Default for centriflaken (long reads) is 4000 bp and for centriflaken_hy (short reads) is 75 bp."/>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
145 <param name="fq_filename_delim" type="text" value="_" label="File name delimitor by which samples are grouped together (--fq_filename_delim)"
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
146 help="This is the delimitor by which samples are grouped together to display in the final MultiQC report. For example, if your input data sets are mango_replicate1.fastq.gz, mango_replicate2.fastq.gz, orange_replicate1_maryland.fastq.gz, orange_replicate2_maryland.fastq.gz, then to create 2 samples mango and orange, the value for --fq_filename_delim would be _ (underscore) and the value for --fq_filename_delim_idx would be 1, since you want to group by the first word (i.e. mango or orange) after splitting the filename based on _ (underscore)."/>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
147 <param name="fq_filename_delim_idx" type="integer" value="1" label="File name delimitor index (--fq_filename_delim_idx)" />
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
148 <param name="centrifuge_extract_bug" type="text" value="Escherichia coli" label="Reads belonging to this taxa are extracted and a MAG is generated to allow for serotyping"/>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
149 <param name="genome_size" type="text" optional="true" value="5.5m" label="Estimated genome size" help="For example, 5m or 2.6g.">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
150 <validator type="regex" message="Genome size must be a float or integer, optionally followed by the a unit prefix (kmg)">^([0-9]*[.])?[0-9]+[kmg]?$</validator>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
151 </param>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
152 <!-- <param name="runtime_profile" type="select" label="Run time profile">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
153 <option value="kondagac" selected="true">conda</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
154 <option value="cingularitygac">singularity</option>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
155 </param> -->
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
156 </inputs>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
157 <outputs>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
158 <data name="multiqc_report" format="html" label="${input_read_type_cond.pipeline_cond.pipeline}: MultiQC Report on ${on_string}" from_work_dir="multiqc_report.html"/>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
159 <collection name="assembled_mags" type="list" label="${input_read_type_cond.pipeline_cond.pipeline}: Assembled MAGs on ${on_string}">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
160 <discover_datasets pattern="(?P&lt;name&gt;.*)\.assembly_filtered_contigs\.fasta" ext="fasta" directory="kraken2_extract_contigs"/>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
161 </collection>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
162 </outputs>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
163 <tests>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
164 <!--Test 01: long reads-->
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
165 <test expect_num_outputs="2">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
166 <param name="input">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
167 <collection type="list">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
168 <element name="FAL11127.fastq.gz" value="FAL11127.fastq.gz" />
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
169 <element name="FAL11341.fastq.gz" value="FAL11341.fastq.gz" />
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
170 <element name="FAL11342.fastq.gz" value="FAL11342.fastq.gz" />
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
171 </collection>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
172 </param>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
173 <param name="fq_suffix" value=".fastq.gz"/>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
174 <output name="multiqc_report" file="multiqc_report.html" ftype="html" compare="sim_size"/>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
175 <!-- <output name="assembled_mags" file="FAL11127.assembly_filtered.contigs.fasta" ftype="fasta" compare="sim_size"/> -->
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
176 </test>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
177 </tests>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
178 <help><![CDATA[
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
179
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
180 .. class:: infomark
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
181
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
182 **Purpose**
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
183
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
184 Centriflaken suite of automated data analysis pipelines are based on Nextflow DSL2 developed at CFSAN, FDA. These pipelines allow rapid
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
185 and effective construction of metagenomic assembled genomes (MAGs) to enable bacterial source-tracking. It is based on methods described in our
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
186 previous publication (Maguire *et al*, 2021. doi: https://doi.org/10.1371/journal.pone.0245172).
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
187
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
188 ----
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
189
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
190 .. class:: infomark
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
191
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
192 **Testing and Validation**
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
193
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
194 The CPIPES - Centriflaken Nextflow pipeline has been wrapped to make it work in Galaxy. It takes in either paired or unpaired short reads or long reads, generates MAGs and performs
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
195 in silico-based analysis (i.e., virulence gene finding). Additionally, AMR gene finding analysis is also included in Centriflaken and performed on MAGs
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
196 of interest. The final summary plots and tables can be downloaded from the provided MultiQC HTML report generated as part of the pipeline.
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
197 The Centriflaken pipeline was validated with data from our previously published method (Maguire *et al*, 2021. doi: https://doi.org/10.1371/journal.pone.0245172) and was able to replicate the detection
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
198 and classification of STECs for each sample. We tested the pipeline with Nanopore data obtained from 21 additional enriched samples from
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
199 irrigation water and was able to perform the entire precision metagenomics analysis in less than 5 hours for all of them. All the original testing and validation was
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
200 done on the command line on the CFSAN Raven2 HPC Cluster.
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
201
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
202
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
203 ----
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
204
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
205 .. class:: infomark
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
206
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
207 **Outputs**
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
208
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
209 The main output files are:
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
210
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
211 ::
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
212
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
213 - MultiQC Report: Contains a brief summary report including any serotyping and AMR result tables.
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
214 Please note that due to MultiQC customizations, the preview (eye icon) will not
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
215 work within Galaxy for the MultiQC report. Please download the file by clicking
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
216 on the floppy icon and view it in your browser on your local desktop/workstation.
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
217 - Final assembly: contains contigs and possibly scaffolds.
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
218
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
219 ]]></help>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
220 <citations>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
221 <citation type="bibtex">
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
222 @misc{gitlabCPIPES,
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
223 author = {Konganti, Kranti},
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
224 year = {2022},
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
225 title = {CPIPES - Centriflaken},
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
226 publisher = {GitLab},
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
227 journal = {GitLab repository},
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
228 url = {https://cfsan-git.fda.gov/Kranti.Konganti/cpipes}}
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
229 </citation>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
230 </citations>
082e0091e813 planemo upload
galaxytrakr
parents:
diff changeset
231 </tool>