annotate flye_cpu15mem59.xml @ 1:ab6ffc360b78 draft

planemo upload commit 449e45c59730743e250e8e09c1dfb4c6c3794ce3
author estrain
date Fri, 13 Mar 2026 11:36:25 +0000
parents e1e6ef58f334
children 7049afca140c
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
1 <tool id="flye" name="Flye" version="@TOOL_VERSION@+galaxy@SUFFIX_VERSION@" profile="20.01">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
2 <description>de novo assembler for single molecule sequencing reads</description>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
3 <macros>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
4 <import>macros.xml</import>
1
ab6ffc360b78 planemo upload commit 449e45c59730743e250e8e09c1dfb4c6c3794ce3
estrain
parents: 0
diff changeset
5
0
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
6 </macros>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
7 <expand macro="edam_ontology"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
8 <expand macro="xrefs"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
9 <expand macro="requirements" />
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
10 <version_command>flye --version</version_command>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
11 <command detect_errors="exit_code"><![CDATA[
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
12 #if $input.is_of_type('fastqsanger', 'fastq'):
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
13 #set ext = 'fastq'
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
14 #elif $input.is_of_type('fastqsanger.gz', 'fastq.gz'):
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
15 #set ext = 'fastq.gz'
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
16 #elif $input.is_of_type('fasta.gz'):
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
17 #set ext = 'fasta.gz'
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
18 #elif $input.is_of_type('fasta'):
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
19 #set ext = 'fasta'
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
20 #else:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
21 #set ext = 'dat'
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
22 #end if
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
23
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
24 ln -sf '$input' ./input_0.${ext} &&
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
25 flye $mode_conditional.mode ./input_0.${ext}
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
26 -o out_dir
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
27 -t \${GALAXY_SLOTS:-4}
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
28 -i $iterations
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
29 #if $mode_conditional.mode == '--pacbio-hifi' and $mode_conditional.hifi_error:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
30 --hifi-error $mode_conditional.hifi_error
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
31 #end if
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
32 #if $min_overlap:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
33 -m $min_overlap
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
34 #end if
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
35 #if $asm.asm_select == 'true':
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
36 --asm-coverage $asm.asm_coverage
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
37 -g '$asm.genome_size'
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
38 #end if
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
39 #if $meta:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
40 $meta
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
41 #end if
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
42 #if $scaffold:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
43 $scaffold
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
44 #end if
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
45 #if $no_alt_contigs:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
46 $no_alt_contigs
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
47 #end if
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
48 ]]></command>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
49 <inputs>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
50 <param name="input" type="data" format="fasta,fasta.gz,fastq,fastq.gz,fastqsanger.gz,fastqsanger" label="Read file" />
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
51 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
52 <param name="mode" type="select" label="Mode">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
53 <option value="--nano-raw">Nanopore raw (--nano-raw)</option>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
54 <option value="--nano-corr">Nanopore corrected (--nano-corr)</option>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
55 <option value="--nano-hq">Nanopore HQ (--nano-hq)</option>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
56 <option value="--pacbio-raw">PacBio raw (--pacbio-raw)</option>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
57 <option value="--pacbio-corr">PacBio corrected (--pacbio-corr)</option>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
58 <option value="--pacbio-hifi">PacBio HiFi (--pacbio-hifi)</option>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
59 </param>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
60 <when value="--nano-raw"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
61 <when value="--nano-corr"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
62 <when value="--nano-hq"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
63 <when value="--pacbio-raw"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
64 <when value="--pacbio-corr"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
65 <when value="--pacbio-hifi">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
66 <param argument="--hifi-error" type="float" min="0" max="1" optional="true" label="Expected HiFi reads error rate" help="Default: 0.01"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
67 </when>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
68 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
69 <param argument="--iterations" type="integer" value="1" label="Number of polishing iterations"
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
70 help="Polishing is performed as the final assembly stage. By default, Flye runs one polishing iteration. Additional iterations
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
71 might correct a small number of extra errors (due to improvements on how reads may align to the corrected assembly). If the
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
72 parameter is set to 0, the polishing is not performed"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
73 <param argument="--min-overlap" type="integer" min="1000" max="10000" optional="true" label="Minimum overlap between reads"
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
74 help="This sets a minimum overlap length for two reads to be considered overlapping. By default it is chosen
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
75 automatically based on the read length distribution (reads N90) and does not require manual setting. Typical
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
76 value is 3k-5k (and down to 1k for datasets with shorter read length). Intuitively, we want to set this
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
77 parameter as high as possible, so the repeat graph is less tangled. However, higher values might lead to assembly gaps.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
78 In some rare cases it makes sense to manually increase minimum overlap for assemblies of big genomes with long reads and high coverage." />
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
79 <param argument="--keep-haplotypes" type="boolean" truevalue="--keep-haplotypes" falsevalue="" checked="False" label="Keep haplotypes"
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
80 help="By default, Flye collapses graph structures caused by alternative haplotypes (bubbles, superbubbles, roundabouts) to produce longer
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
81 consensus contigs. This option retains the alternative paths on the graph, producing a less contiguous, but more detailed assembly."/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
82 <param argument="--scaffold" type="boolean" truevalue="--scaffold" falsevalue="" label="Enable scaffolding using graph"
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
83 help="Starting from the version 2.9 Flye does not perform scaffolding by default, which guarantees that all assembled sequences do not have any gaps" />
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
84 <param argument="--meta" type="boolean" truevalue="--meta" falsevalue="" checked="False" label="Perform metagenomic assembly"
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
85 help="It is designed for highly non-uniform coverage and is sensitive to underrepresented sequence at low coverage (as low as 2x).
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
86 In some examples of simple metagenomes, we observed that the normal mode assembled more contiguous bacterial
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
87 consensus sequence, while the metagenome mode was slightly more fragmented, but revealed strain mixtures"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
88 <conditional name="asm">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
89 <param name="asm_select" type="select" label="Reduced contig assembly coverage" help="Typically, assemblies of large genomes at high coverage require a large amount of RAM. For high coverage assemblies, you can reduce memory usage by using only a subset of longest reads for initial contig extension stage (which is often the memory bottleneck)">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
90 <option value="true">Enable reduced coverage for initial disjointig assembly</option>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
91 <option value="false" selected="true">Disable reduced coverage for initial disjointig assembly</option>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
92 </param>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
93 <when value="true">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
94 <param argument="--asm-coverage" type="integer" min="0" value="30"
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
95 label="Reduced coverage for initial disjointig assembly"
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
96 help="This parameter specifies the target coverage of the longest reads. For a typical assembly, 30x is enough to produce good
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
97 initial contigs. Regardless of this parameter, all reads will be used at the later pipeline stages."/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
98 <param argument="--genome-size" type="text" optional="true" label="Estimated genome size"
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
99 help="For example, 5m or 2.6g. No longer required as input. However, it must be used in conjunction with --asm-coverage option.">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
100 <validator type="regex" message="Genome size must be a float or integer, optionally followed by a unit prefix (kmg)">^([0-9]*[.])?[0-9]+[kmg]?$</validator>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
101 </param>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
102 </when>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
103 <when value="false" />
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
104 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
105 <param argument="--no-alt-contigs" type="boolean" truevalue="--no-alt-contigs" falsevalue="" checked="false" label="Remove all non-primary contigs from the assembly"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
106 <param name="generate_log" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Generate a log file"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
107 </inputs>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
108 <outputs>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
109 <data name="consensus" format="fasta" from_work_dir="out_dir/assembly.fasta" label="${tool.name} on ${on_string}: consensus"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
110 <data name="assembly_graph" format="graph_dot" from_work_dir="out_dir/assembly_graph.gv" label="${tool.name} on ${on_string}: assembly graph"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
111 <data name="assembly_gfa" format="gfa1" from_work_dir="out_dir/assembly_graph.gfa" label="${tool.name} on ${on_string}: graphical fragment assembly"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
112 <data name="assembly_info" format="tabular" from_work_dir="out_dir/assembly_info.txt" label="${tool.name} on ${on_string}: assembly info"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
113 <data name="flye_log" format="txt" from_work_dir="out_dir/flye.log" label="${tool.name} on ${on_string}: log">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
114 <filter>generate_log</filter>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
115 </data>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
116 </outputs>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
117 <tests>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
118 <!--Test 01: pacbio-raw-->
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
119 <test expect_num_outputs="5">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
120 <param name="inputs" ftype="fastq.gz" value="ecoli_01.fastq.gz,ecoli_02.fastq.gz,ecoli_03.fastq.gz,ecoli_04.fastq.gz,ecoli_05.fastq.gz,ecoli_06.fastq.gz,ecoli_07.fastq.gz"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
121 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
122 <param name="mode" value="--pacbio-raw"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
123 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
124 <param name="iterations" value="0"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
125 <param name="generate_log" value="true"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
126 <output name="assembly_info" file="result1_assembly_info.txt" ftype="tabular" compare="sim_size"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
127 <output name="assembly_graph" file="result1_assembly_graph.dot" ftype="graph_dot" compare="sim_size"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
128 <output name="assembly_gfa" file="result1_assembly_graph.gfa" ftype="gfa1" compare="diff" lines_diff="10"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
129 <output name="consensus" ftype="fasta">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
130 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
131 <has_line line=">contig_1"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
132 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
133 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
134 <output name="flye_log" file="result1.log" ftype="txt" compare="sim_size"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
135 </test>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
136 <!--Test 02: nano raw-->
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
137 <test expect_num_outputs="4">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
138 <param name="inputs" ftype="fasta.gz" value="nanopore.fasta.gz"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
139 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
140 <param name="mode" value="--nano-raw"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
141 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
142 <param name="iterations" value="0"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
143 <output name="assembly_info" ftype="tabular">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
144 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
145 <has_size value="95" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
146 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
147 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
148 <output name="assembly_graph" ftype="graph_dot">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
149 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
150 <has_size value="803" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
151 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
152 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
153 <output name="assembly_gfa" ftype="gfa1">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
154 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
155 <has_size value="35047" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
156 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
157 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
158 <output name="consensus" ftype="fasta">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
159 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
160 <has_size value="35573" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
161 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
162 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
163 </test>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
164 <!--Test 03: reduce coverage-->
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
165 <test expect_num_outputs="4">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
166 <param name="inputs" ftype="fastq.gz" value="ecoli_hifi_01.fastq.gz,ecoli_hifi_02.fastq.gz,ecoli_hifi_03.fastq.gz,ecoli_hifi_04.fastq.gz,ecoli_hifi_05.fastq.gz,ecoli_hifi_06.fastq.gz,ecoli_hifi_07.fastq.gz,ecoli_hifi_08.fastq.gz,ecoli_hifi_09.fastq.gz"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
167 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
168 <param name="mode" value="--nano-raw"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
169 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
170 <conditional name="asm">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
171 <param name="asm_select" value="true" />
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
172 <param name="asm_coverage" value="30"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
173 <param name="genome_size" value="3980000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
174 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
175 <output name="assembly_info" ftype="tabular">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
176 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
177 <has_size value="286" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
178 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
179 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
180 <output name="assembly_graph" ftype="graph_dot">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
181 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
182 <has_size value="1840" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
183 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
184 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
185 <output name="assembly_gfa" ftype="gfa1">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
186 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
187 <has_size value="420752" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
188 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
189 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
190 <output name="consensus" ftype="fasta">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
191 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
192 <has_size value="427580" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
193 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
194 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
195 </test>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
196 <!--Test 04: metagenomic mode-->
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
197 <test expect_num_outputs="4">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
198 <param name="inputs" ftype="fastq.gz" value="ecoli_01.fastq.gz,ecoli_02.fastq.gz,ecoli_03.fastq.gz,ecoli_04.fastq.gz,ecoli_05.fastq.gz,ecoli_06.fastq.gz,ecoli_07.fastq.gz"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
199 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
200 <param name="mode" value="--pacbio-raw"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
201 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
202 <param name="meta" value="true"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
203 <output name="assembly_info" ftype="tabular">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
204 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
205 <has_size value="95" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
206 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
207 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
208 <output name="assembly_graph" ftype="graph_dot">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
209 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
210 <has_size value="367" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
211 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
212 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
213 <output name="assembly_gfa" ftype="gfa1">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
214 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
215 <has_size value="418729" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
216 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
217 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
218 <output name="consensus" ftype="fasta">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
219 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
220 <has_size value="425667" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
221 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
222 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
223 </test>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
224 <!--Test 05: nanopore HQ mode-->
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
225 <test expect_num_outputs="4">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
226 <param name="inputs" ftype="fastq.gz" value="ecoli_hifi_01.fastq.gz,ecoli_hifi_02.fastq.gz,ecoli_hifi_03.fastq.gz,ecoli_hifi_04.fastq.gz,ecoli_hifi_05.fastq.gz,ecoli_hifi_06.fastq.gz,ecoli_hifi_07.fastq.gz,ecoli_hifi_08.fastq.gz,ecoli_hifi_09.fastq.gz"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
227 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
228 <param name="mode" value="--nano-hq"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
229 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
230 <param name="min_overlap" value="1000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
231 <output name="assembly_info" ftype="tabular">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
232 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
233 <has_size value="286" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
234 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
235 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
236 <output name="assembly_graph" ftype="graph_dot">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
237 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
238 <has_size value="1248" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
239 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
240 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
241 <output name="assembly_gfa" ftype="gfa1">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
242 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
243 <has_size value="419414" delta="1000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
244 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
245 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
246 <output name="consensus" ftype="fasta">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
247 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
248 <has_size value="426277" delta="1000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
249 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
250 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
251 </test>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
252 <!--Test 06: hifi error option-->
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
253 <test expect_num_outputs="4">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
254 <param name="inputs" ftype="fastq.gz" value="ecoli_hifi_01.fastq.gz,ecoli_hifi_02.fastq.gz,ecoli_hifi_03.fastq.gz,ecoli_hifi_04.fastq.gz,ecoli_hifi_05.fastq.gz,ecoli_hifi_06.fastq.gz,ecoli_hifi_07.fastq.gz,ecoli_hifi_08.fastq.gz,ecoli_hifi_09.fastq.gz"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
255 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
256 <param name="mode" value="--pacbio-hifi"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
257 <param name="hifi_error" value="0.21"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
258 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
259 <param name="min_overlap" value="1000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
260 <output name="assembly_info" ftype="tabular">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
261 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
262 <has_size value="286" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
263 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
264 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
265 <output name="assembly_graph" ftype="graph_dot">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
266 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
267 <has_size value="1248" delta="500"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
268 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
269 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
270 <output name="assembly_gfa" ftype="gfa1">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
271 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
272 <has_size value="420254" delta="2000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
273 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
274 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
275 <output name="consensus" ftype="fasta">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
276 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
277 <has_size value="427131" delta="2000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
278 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
279 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
280 </test>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
281 <!--Test 07: keep haplotypes-->
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
282 <test expect_num_outputs="4">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
283 <param name="inputs" ftype="fastq.gz" value="ecoli_hifi_01.fastq.gz,ecoli_hifi_02.fastq.gz,ecoli_hifi_03.fastq.gz,ecoli_hifi_04.fastq.gz,ecoli_hifi_05.fastq.gz,ecoli_hifi_06.fastq.gz,ecoli_hifi_07.fastq.gz,ecoli_hifi_08.fastq.gz,ecoli_hifi_09.fastq.gz"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
284 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
285 <param name="mode" value="--pacbio-corr"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
286 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
287 <param name="min_overlap" value="1000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
288 <param name="keep_haplotypes" value="true"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
289 <output name="assembly_info" ftype="tabular">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
290 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
291 <has_size value="286" delta="200"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
292 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
293 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
294 <output name="assembly_graph" ftype="graph_dot">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
295 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
296 <has_size value="1273" delta="500"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
297 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
298 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
299 <output name="assembly_gfa" ftype="gfa1">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
300 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
301 <has_size value="420254" delta="3000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
302 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
303 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
304 <output name="consensus" ftype="fasta">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
305 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
306 <has_size value="427131" delta="3000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
307 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
308 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
309 </test>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
310 <!--Test 08: scaffolding mode-->
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
311 <test expect_num_outputs="4">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
312 <param name="inputs" ftype="fastq.gz" value="ecoli_hifi_01.fastq.gz,ecoli_hifi_02.fastq.gz,ecoli_hifi_03.fastq.gz,ecoli_hifi_04.fastq.gz,ecoli_hifi_05.fastq.gz,ecoli_hifi_06.fastq.gz,ecoli_hifi_07.fastq.gz,ecoli_hifi_08.fastq.gz,ecoli_hifi_09.fastq.gz"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
313 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
314 <param name="mode" value="--nano-hq"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
315 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
316 <param name="min_overlap" value="1000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
317 <param name="scaffold" value="true"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
318 <output name="assembly_info" ftype="tabular">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
319 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
320 <has_size value="286" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
321 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
322 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
323 <output name="assembly_graph" ftype="graph_dot">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
324 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
325 <has_size value="1248" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
326 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
327 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
328 <output name="assembly_gfa" ftype="gfa1">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
329 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
330 <has_size value="419414" delta="2000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
331 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
332 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
333 <output name="consensus" ftype="fasta">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
334 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
335 <has_size value="426277" delta="2000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
336 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
337 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
338 </test>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
339 <!--Test 09: test no-alt-contigs parameter-->
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
340 <test expect_num_outputs="4">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
341 <param name="inputs" ftype="fasta.gz" value="nanopore.fasta.gz"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
342 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
343 <param name="mode" value="--nano-raw"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
344 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
345 <param name="iterations" value="0"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
346 <param name="no_alt_contigs" value="true"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
347 <output name="assembly_info" ftype="tabular">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
348 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
349 <has_size value="151" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
350 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
351 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
352 <output name="assembly_graph" ftype="graph_dot">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
353 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
354 <has_size value="217" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
355 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
356 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
357 <output name="assembly_gfa" ftype="gfa1">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
358 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
359 <has_size value="5110" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
360 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
361 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
362 <output name="consensus" ftype="fasta">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
363 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
364 <has_size value="5123" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
365 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
366 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
367 </test>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
368 </tests>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
369 <help><![CDATA[
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
370
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
371 **Purpose**
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
372
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
373 Flye is a de novo assembler for single molecule sequencing reads, such as those produced by PacBio and Oxford Nanopore Technologies.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
374 It is designed for a wide range of datasets, from small bacterial projects to large mammalian-scale assemblies. The package represents
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
375 a complete pipeline: it takes raw PacBio/ONT reads as input and outputs polished contigs. Flye also has a special mode for metagenome
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
376 assembly.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
377
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
378 ----
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
379
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
380 **Quick usage**
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
381
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
382 Input reads can be in FASTA or FASTQ format, uncompressed or compressed with gz. Currently, PacBio (raw, corrected, HiFi) and ONT reads
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
383 (raw, corrected) are supported. Expected error rates are <30% for raw, <3% for corrected, and <1% for HiFi. Note that Flye was primarily
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
384 developed to run on raw reads. You may specify multiple files with reads (separated by spaces). Mixing different read types is not yet supported. The *--meta*
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
385 option enables the mode for metagenome/uneven coverage assembly.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
386
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
387 Genome size estimate is no longer a required option. You need to provide an estimate if using the *--asm-coverage* option.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
388
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
389 To reduce memory consumption for large genome assemblies, you can use a subset of the longest reads for initial disjointig assembly by
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
390 specifying *--asm-coverage* and *--genome-size* options. Typically, 40x coverage is enough to produce good disjointigs.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
391
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
392 ----
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
393
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
394 **Outputs**
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
395
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
396 The main output files are:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
397
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
398 * Final assembly: contains contigs and possibly scaffolds (see below).
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
399 * Final repeat graph: note that the edge sequences might be different (shorter) than contig sequences, because contigs might include multiple graph edges.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
400 * Extra information about contigs (such as length or coverage).
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
401
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
402 Each contig is formed by a single unique graph edge. If possible, unique contigs are extended with the sequence from flanking unresolved repeats on the graph. Thus,
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
403 a contig fully contains the corresponding graph edge (with the same id), but might be longer than this edge. This is somewhat similar to the unitig-contig relation in
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
404 OLC assemblers. In a rare case when a repetitive graph edge is not covered by the set of "extended" contigs, it will also be output in the assembly file.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
405
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
406 Sometimes it is possible to further order contigs into scaffolds based on the repeat graph structure. These ordered contigs will be output as part of a scaffold in
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
407 the assembly file (with a scaffold prefix). Since it is hard to give a reliable estimate of the gap size, those gaps are represented with the default 100 Ns.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
408 The assembly_info.txt file (below) contains additional information about how scaffolds were formed.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
409
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
410 Extra information about contigs/scaffolds is output into the assembly_info.txt file. It is a tab-delimited table with the columns as follows:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
411
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
412 * Contig/scaffold id
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
413 * Length
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
414 * Coverage
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
415 * Is circular, (Y)es or (N)o
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
416 * Is repetitive, (Y)es or (N)o
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
417 * Multiplicity (based on coverage)
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
418 * Alternative group
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
419 * Graph path (graph path corresponding to this contig/scaffold).
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
420
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
421 Scaffold gaps are marked with `??` symbols, and the `*` symbol denotes a terminal graph node. Alternative contigs (representing alternative haplotypes) will have the same alt.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
422 group ID. Primary contigs are marked by `*`.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
423
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
424 ----
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
425
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
426 **Algorithm Description**
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
427
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
428 This is a brief description of the Flye algorithm. Please refer to the manuscript for more detailed information. The draft contig extension is organized as follows:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
429
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
430 * K-mer counting / erroneous k-mer pre-filtering
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
431 * Solid k-mer selection (k-mers with sufficient frequency, which are unlikely to be erroneous)
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
432 * Contig extension. The algorithm starts from a single read and extends it with a next overlapping read (overlaps are dynamically detected using the selected solid k-mers).
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
433
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
434 Note that we do not attempt to resolve repeats at this stage, thus the reconstructed contigs might contain misassemblies. Flye then aligns the reads on these draft
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
435 contigs using minimap2 and calls a consensus. Afterwards, Flye performs repeat analysis as follows:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
436
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
437 * Repeat graph is constructed from the (possibly misassembled) contigs
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
438 * In this graph all repeats longer than minimum overlap are collapsed
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
439 * The algorithm resolves repeats using the read information and graph structure
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
440 * The unbranching paths in the graph are output as contigs
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
441
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
442 If enabled, after resolving bridged repeats, the Trestle module attempts to resolve simple unbridged repeats (of multiplicity 2) using the heterogeneities between repeat copies.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
443 Finally, Flye performs polishing of the resulting assembly to correct the remaining errors:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
444
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
445 * Alignment of all reads to the current assembly using minimap2
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
446 * Partition the alignment into mini-alignments (bubbles)
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
447 * Error correction of each bubble using a maximum likelihood approach
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
448
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
449 The polishing steps could be repeated, which might slightly increase quality for some datasets.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
450
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
451
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
452 ]]></help>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
453 <expand macro="citations" />
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
454 </tool>