annotate flye_cpu15mem59.xml @ 0:e1e6ef58f334 draft

planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
author estrain
date Thu, 12 Mar 2026 20:06:54 +0000
parents
children ab6ffc360b78
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
1 <tool id="flye" name="Flye" version="@TOOL_VERSION@+galaxy@SUFFIX_VERSION@" profile="20.01">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
2 <description>de novo assembler for single molecule sequencing reads</description>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
3 <macros>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
4 <import>macros.xml</import>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
5 </macros>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
6 <expand macro="edam_ontology"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
7 <expand macro="xrefs"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
8 <expand macro="requirements" />
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
9 <version_command>flye --version</version_command>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
10 <command detect_errors="exit_code"><![CDATA[
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
11 #if $input.is_of_type('fastqsanger', 'fastq'):
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
12 #set ext = 'fastq'
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
13 #elif $input.is_of_type('fastqsanger.gz', 'fastq.gz'):
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
14 #set ext = 'fastq.gz'
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
15 #elif $input.is_of_type('fasta.gz'):
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
16 #set ext = 'fasta.gz'
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
17 #elif $input.is_of_type('fasta'):
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
18 #set ext = 'fasta'
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
19 #else:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
20 #set ext = 'dat'
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
21 #end if
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
22
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
23 ln -sf '$input' ./input_0.${ext} &&
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
24 flye $mode_conditional.mode ./input_0.${ext}
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
25 -o out_dir
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
26 -t \${GALAXY_SLOTS:-4}
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
27 -i $iterations
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
28 #if $mode_conditional.mode == '--pacbio-hifi' and $mode_conditional.hifi_error:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
29 --hifi-error $mode_conditional.hifi_error
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
30 #end if
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
31 #if $min_overlap:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
32 -m $min_overlap
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
33 #end if
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
34 #if $asm.asm_select == 'true':
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
35 --asm-coverage $asm.asm_coverage
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
36 -g '$asm.genome_size'
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
37 #end if
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
38 #if $meta:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
39 $meta
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
40 #end if
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
41 #if $scaffold:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
42 $scaffold
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
43 #end if
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
44 #if $no_alt_contigs:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
45 $no_alt_contigs
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
46 #end if
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
47 ]]></command>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
48 <inputs>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
49 <param name="input" type="data" format="fasta,fasta.gz,fastq,fastq.gz,fastqsanger.gz,fastqsanger" label="Read file" />
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
50 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
51 <param name="mode" type="select" label="Mode">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
52 <option value="--nano-raw">Nanopore raw (--nano-raw)</option>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
53 <option value="--nano-corr">Nanopore corrected (--nano-corr)</option>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
54 <option value="--nano-hq">Nanopore HQ (--nano-hq)</option>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
55 <option value="--pacbio-raw">PacBio raw (--pacbio-raw)</option>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
56 <option value="--pacbio-corr">PacBio corrected (--pacbio-corr)</option>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
57 <option value="--pacbio-hifi">PacBio HiFi (--pacbio-hifi)</option>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
58 </param>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
59 <when value="--nano-raw"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
60 <when value="--nano-corr"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
61 <when value="--nano-hq"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
62 <when value="--pacbio-raw"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
63 <when value="--pacbio-corr"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
64 <when value="--pacbio-hifi">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
65 <param argument="--hifi-error" type="float" min="0" max="1" optional="true" label="Expected HiFi reads error rate" help="Default: 0.01"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
66 </when>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
67 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
68 <param argument="--iterations" type="integer" value="1" label="Number of polishing iterations"
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
69 help="Polishing is performed as the final assembly stage. By default, Flye runs one polishing iteration. Additional iterations
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
70 might correct a small number of extra errors (due to improvements on how reads may align to the corrected assembly). If the
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
71 parameter is set to 0, the polishing is not performed"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
72 <param argument="--min-overlap" type="integer" min="1000" max="10000" optional="true" label="Minimum overlap between reads"
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
73 help="This sets a minimum overlap length for two reads to be considered overlapping. By default it is chosen
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
74 automatically based on the read length distribution (reads N90) and does not require manual setting. Typical
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
75 value is 3k-5k (and down to 1k for datasets with shorter read length). Intuitively, we want to set this
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
76 parameter as high as possible, so the repeat graph is less tangled. However, higher values might lead to assembly gaps.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
77 In some rare cases it makes sense to manually increase minimum overlap for assemblies of big genomes with long reads and high coverage." />
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
78 <param argument="--keep-haplotypes" type="boolean" truevalue="--keep-haplotypes" falsevalue="" checked="False" label="Keep haplotypes"
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
79 help="By default, Flye collapses graph structures caused by alternative haplotypes (bubbles, superbubbles, roundabouts) to produce longer
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
80 consensus contigs. This option retains the alternative paths on the graph, producing a less contiguous, but more detailed assembly."/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
81 <param argument="--scaffold" type="boolean" truevalue="--scaffold" falsevalue="" label="Enable scaffolding using graph"
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
82 help="Starting from the version 2.9 Flye does not perform scaffolding by default, which guarantees that all assembled sequences do not have any gaps" />
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
83 <param argument="--meta" type="boolean" truevalue="--meta" falsevalue="" checked="False" label="Perform metagenomic assembly"
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
84 help="It is designed for highly non-uniform coverage and is sensitive to underrepresented sequence at low coverage (as low as 2x).
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
85 In some examples of simple metagenomes, we observed that the normal mode assembled more contiguous bacterial
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
86 consensus sequence, while the metagenome mode was slightly more fragmented, but revealed strain mixtures"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
87 <conditional name="asm">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
88 <param name="asm_select" type="select" label="Reduced contig assembly coverage" help="Typically, assemblies of large genomes at high coverage require a large amount of RAM. For high coverage assemblies, you can reduce memory usage by using only a subset of longest reads for initial contig extension stage (which is often the memory bottleneck)">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
89 <option value="true">Enable reduced coverage for initial disjointing assembly</option>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
90 <option value="false" selected="true">Disable reduced coverage for initial disjointing assembly</option>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
91 </param>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
92 <when value="true">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
93 <param argument="--asm-coverage" type="integer" min="0" value="30"
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
94 label="Reduced coverage for initial disjointing assembly"
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
95 help="This parameter specifies the target coverage of the longest reads. For a typical assembly, 30x is enough to produce good
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
96 initial contigs. Regardless of this parameter, all reads will be used at the later pipeline stages."/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
97 <param argument="--genome-size" type="text" optional="true" label="Estimated genome size"
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
98 help="For example, 5m or 2.6g. No longer required as input. However, it must be used in conjunction with --asm-coverage option.">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
99 <validator type="regex" message="Genome size must be a float or integer, optionally followed by a unit prefix (kmg)">^([0-9]*[.])?[0-9]+[kmg]?$</validator>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
100 </param>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
101 </when>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
102 <when value="false" />
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
103 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
104 <param argument="--no-alt-contigs" type="boolean" truevalue="--no-alt-contigs" falsevalue="" checked="false" label="Remove all non-primary contigs from the assembly"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
105 <param name="generate_log" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Generate a log file"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
106 </inputs>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
107 <outputs>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
108 <data name="consensus" format="fasta" from_work_dir="out_dir/assembly.fasta" label="${tool.name} on ${on_string}: consensus"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
109 <data name="assembly_graph" format="graph_dot" from_work_dir="out_dir/assembly_graph.gv" label="${tool.name} on ${on_string}: assembly graph"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
110 <data name="assembly_gfa" format="gfa1" from_work_dir="out_dir/assembly_graph.gfa" label="${tool.name} on ${on_string}: graphical fragment assembly"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
111 <data name="assembly_info" format="tabular" from_work_dir="out_dir/assembly_info.txt" label="${tool.name} on ${on_string}: assembly info"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
112 <data name="flye_log" format="txt" from_work_dir="out_dir/flye.log" label="${tool.name} on ${on_string}: log">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
113 <filter>generate_log</filter>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
114 </data>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
115 </outputs>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
116 <tests>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
117 <!--Test 01: pacbio-raw-->
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
118 <test expect_num_outputs="5">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
119 <param name="inputs" ftype="fastq.gz" value="ecoli_01.fastq.gz,ecoli_02.fastq.gz,ecoli_03.fastq.gz,ecoli_04.fastq.gz,ecoli_05.fastq.gz,ecoli_06.fastq.gz,ecoli_07.fastq.gz"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
120 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
121 <param name="mode" value="--pacbio-raw"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
122 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
123 <param name="iterations" value="0"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
124 <param name="generate_log" value="true"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
125 <output name="assembly_info" file="result1_assembly_info.txt" ftype="tabular" compare="sim_size"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
126 <output name="assembly_graph" file="result1_assembly_graph.dot" ftype="graph_dot" compare="sim_size"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
127 <output name="assembly_gfa" file="result1_assembly_graph.gfa" ftype="gfa1" compare="diff" lines_diff="10"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
128 <output name="consensus" ftype="fasta">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
129 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
130 <has_line line=">contig_1"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
131 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
132 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
133 <output name="flye_log" file="result1.log" ftype="txt" compare="sim_size"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
134 </test>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
135 <!--Test 02: nano raw-->
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
136 <test expect_num_outputs="4">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
137 <param name="inputs" ftype="fasta.gz" value="nanopore.fasta.gz"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
138 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
139 <param name="mode" value="--nano-raw"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
140 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
141 <param name="iterations" value="0"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
142 <output name="assembly_info" ftype="tabular">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
143 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
144 <has_size value="95" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
145 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
146 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
147 <output name="assembly_graph" ftype="graph_dot">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
148 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
149 <has_size value="803" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
150 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
151 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
152 <output name="assembly_gfa" ftype="gfa1">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
153 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
154 <has_size value="35047" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
155 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
156 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
157 <output name="consensus" ftype="fasta">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
158 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
159 <has_size value="35573" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
160 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
161 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
162 </test>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
163 <!--Test 03: reduce coverage-->
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
164 <test expect_num_outputs="4">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
165 <param name="inputs" ftype="fastq.gz" value="ecoli_hifi_01.fastq.gz,ecoli_hifi_02.fastq.gz,ecoli_hifi_03.fastq.gz,ecoli_hifi_04.fastq.gz,ecoli_hifi_05.fastq.gz,ecoli_hifi_06.fastq.gz,ecoli_hifi_07.fastq.gz,ecoli_hifi_08.fastq.gz,ecoli_hifi_09.fastq.gz"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
166 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
167 <param name="mode" value="--nano-raw"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
168 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
169 <conditional name="asm">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
170 <param name="asm_select" value="true" />
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
171 <param name="asm_coverage" value="30"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
172 <param name="genome_size" value="3980000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
173 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
174 <output name="assembly_info" ftype="tabular">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
175 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
176 <has_size value="286" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
177 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
178 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
179 <output name="assembly_graph" ftype="graph_dot">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
180 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
181 <has_size value="1840" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
182 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
183 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
184 <output name="assembly_gfa" ftype="gfa1">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
185 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
186 <has_size value="420752" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
187 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
188 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
189 <output name="consensus" ftype="fasta">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
190 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
191 <has_size value="427580" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
192 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
193 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
194 </test>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
195 <!--Test 04: metagenomic mode-->
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
196 <test expect_num_outputs="4">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
197 <param name="inputs" ftype="fastq.gz" value="ecoli_01.fastq.gz,ecoli_02.fastq.gz,ecoli_03.fastq.gz,ecoli_04.fastq.gz,ecoli_05.fastq.gz,ecoli_06.fastq.gz,ecoli_07.fastq.gz"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
198 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
199 <param name="mode" value="--pacbio-raw"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
200 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
201 <param name="meta" value="true"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
202 <output name="assembly_info" ftype="tabular">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
203 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
204 <has_size value="95" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
205 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
206 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
207 <output name="assembly_graph" ftype="graph_dot">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
208 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
209 <has_size value="367" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
210 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
211 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
212 <output name="assembly_gfa" ftype="gfa1">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
213 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
214 <has_size value="418729" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
215 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
216 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
217 <output name="consensus" ftype="fasta">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
218 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
219 <has_size value="425667" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
220 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
221 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
222 </test>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
223 <!--Test 05: nanopore HQ mode-->
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
224 <test expect_num_outputs="4">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
225 <param name="inputs" ftype="fastq.gz" value="ecoli_hifi_01.fastq.gz,ecoli_hifi_02.fastq.gz,ecoli_hifi_03.fastq.gz,ecoli_hifi_04.fastq.gz,ecoli_hifi_05.fastq.gz,ecoli_hifi_06.fastq.gz,ecoli_hifi_07.fastq.gz,ecoli_hifi_08.fastq.gz,ecoli_hifi_09.fastq.gz"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
226 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
227 <param name="mode" value="--nano-hq"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
228 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
229 <param name="min_overlap" value="1000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
230 <output name="assembly_info" ftype="tabular">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
231 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
232 <has_size value="286" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
233 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
234 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
235 <output name="assembly_graph" ftype="graph_dot">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
236 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
237 <has_size value="1248" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
238 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
239 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
240 <output name="assembly_gfa" ftype="gfa1">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
241 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
242 <has_size value="419414" delta="1000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
243 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
244 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
245 <output name="consensus" ftype="fasta">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
246 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
247 <has_size value="426277" delta="1000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
248 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
249 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
250 </test>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
251 <!--Test 06: hifi error option-->
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
252 <test expect_num_outputs="4">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
253 <param name="inputs" ftype="fastq.gz" value="ecoli_hifi_01.fastq.gz,ecoli_hifi_02.fastq.gz,ecoli_hifi_03.fastq.gz,ecoli_hifi_04.fastq.gz,ecoli_hifi_05.fastq.gz,ecoli_hifi_06.fastq.gz,ecoli_hifi_07.fastq.gz,ecoli_hifi_08.fastq.gz,ecoli_hifi_09.fastq.gz"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
254 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
255 <param name="mode" value="--pacbio-hifi"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
256 <param name="hifi_error" value="0.21"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
257 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
258 <param name="min_overlap" value="1000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
259 <output name="assembly_info" ftype="tabular">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
260 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
261 <has_size value="286" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
262 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
263 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
264 <output name="assembly_graph" ftype="graph_dot">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
265 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
266 <has_size value="1248" delta="500"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
267 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
268 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
269 <output name="assembly_gfa" ftype="gfa1">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
270 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
271 <has_size value="420254" delta="2000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
272 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
273 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
274 <output name="consensus" ftype="fasta">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
275 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
276 <has_size value="427131" delta="2000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
277 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
278 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
279 </test>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
280 <!--Test 07: keep haplotypes-->
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
281 <test expect_num_outputs="4">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
282 <param name="inputs" ftype="fastq.gz" value="ecoli_hifi_01.fastq.gz,ecoli_hifi_02.fastq.gz,ecoli_hifi_03.fastq.gz,ecoli_hifi_04.fastq.gz,ecoli_hifi_05.fastq.gz,ecoli_hifi_06.fastq.gz,ecoli_hifi_07.fastq.gz,ecoli_hifi_08.fastq.gz,ecoli_hifi_09.fastq.gz"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
283 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
284 <param name="mode" value="--pacbio-corr"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
285 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
286 <param name="min_overlap" value="1000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
287 <param name="keep_haplotypes" value="true"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
288 <output name="assembly_info" ftype="tabular">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
289 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
290 <has_size value="286" delta="200"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
291 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
292 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
293 <output name="assembly_graph" ftype="graph_dot">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
294 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
295 <has_size value="1273" delta="500"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
296 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
297 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
298 <output name="assembly_gfa" ftype="gfa1">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
299 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
300 <has_size value="420254" delta="3000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
301 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
302 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
303 <output name="consensus" ftype="fasta">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
304 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
305 <has_size value="427131" delta="3000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
306 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
307 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
308 </test>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
309 <!--Test 08: scaffolding mode-->
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
310 <test expect_num_outputs="4">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
311 <param name="inputs" ftype="fastq.gz" value="ecoli_hifi_01.fastq.gz,ecoli_hifi_02.fastq.gz,ecoli_hifi_03.fastq.gz,ecoli_hifi_04.fastq.gz,ecoli_hifi_05.fastq.gz,ecoli_hifi_06.fastq.gz,ecoli_hifi_07.fastq.gz,ecoli_hifi_08.fastq.gz,ecoli_hifi_09.fastq.gz"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
312 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
313 <param name="mode" value="--nano-hq"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
314 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
315 <param name="min_overlap" value="1000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
316 <param name="scaffold" value="true"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
317 <output name="assembly_info" ftype="tabular">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
318 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
319 <has_size value="286" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
320 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
321 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
322 <output name="assembly_graph" ftype="graph_dot">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
323 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
324 <has_size value="1248" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
325 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
326 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
327 <output name="assembly_gfa" ftype="gfa1">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
328 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
329 <has_size value="419414" delta="2000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
330 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
331 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
332 <output name="consensus" ftype="fasta">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
333 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
334 <has_size value="426277" delta="2000"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
335 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
336 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
337 </test>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
338 <!--Test 09: test no-alt-contigs parameter-->
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
339 <test expect_num_outputs="4">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
340 <param name="inputs" ftype="fasta.gz" value="nanopore.fasta.gz"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
341 <conditional name="mode_conditional">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
342 <param name="mode" value="--nano-raw"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
343 </conditional>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
344 <param name="iterations" value="0"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
345 <param name="no_alt_contigs" value="true"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
346 <output name="assembly_info" ftype="tabular">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
347 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
348 <has_size value="151" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
349 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
350 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
351 <output name="assembly_graph" ftype="graph_dot">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
352 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
353 <has_size value="217" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
354 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
355 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
356 <output name="assembly_gfa" ftype="gfa1">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
357 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
358 <has_size value="5110" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
359 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
360 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
361 <output name="consensus" ftype="fasta">
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
362 <assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
363 <has_size value="5123" delta="100"/>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
364 </assert_contents>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
365 </output>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
366 </test>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
367 </tests>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
368 <help><![CDATA[
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
369
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
370 **Purpose**
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
371
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
372 Flye is a de novo assembler for single molecule sequencing reads, such as those produced by PacBio and Oxford Nanopore Technologies.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
373 It is designed for a wide range of datasets, from small bacterial projects to large mammalian-scale assemblies. The package represents
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
374 a complete pipeline: it takes raw PacBio/ONT reads as input and outputs polished contigs. Flye also has a special mode for metagenome
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
375 assembly.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
376
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
377 ----
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
378
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
379 **Quick usage**
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
380
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
381 Input reads can be in FASTA or FASTQ format, uncompressed or compressed with gz. Currently, PacBio (raw, corrected, HiFi) and ONT reads
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
382 (raw, corrected) are supported. Expected error rates are <30% for raw, <3% for corrected, and <1% for HiFi. Note that Flye was primarily
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
383 developed to run on raw reads. You may specify multiple files with reads (separated by spaces). Mixing different read types is not yet supported. The *--meta*
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
384 option enables the mode for metagenome/uneven coverage assembly.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
385
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
386 Genome size estimate is no longer a required option. You need to provide an estimate if using the *--asm-coverage* option.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
387
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
388 To reduce memory consumption for large genome assemblies, you can use a subset of the longest reads for initial disjointig assembly by
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
389 specifying *--asm-coverage* and *--genome-size* options. Typically, 40x coverage is enough to produce good disjointigs.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
390
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
391 ----
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
392
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
393 **Outputs**
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
394
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
395 The main output files are:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
396
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
397 * Final assembly: contains contigs and possibly scaffolds (see below).
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
398 * Final repeat graph: note that the edge sequences might be different (shorter) than contig sequences, because contigs might include multiple graph edges.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
399 * Extra information about contigs (such as length or coverage).
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
400
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
401 Each contig is formed by a single unique graph edge. If possible, unique contigs are extended with the sequence from flanking unresolved repeats on the graph. Thus,
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
402 a contig fully contains the corresponding graph edge (with the same id), but might be longer than this edge. This is somewhat similar to unitig-contig relation in
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
403 OLC assemblers. In a rare case when a repetitive graph edge is not covered by the set of "extended" contigs, it will also be output in the assembly file.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
404
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
405 Sometimes it is possible to further order contigs into scaffolds based on the repeat graph structure. These ordered contigs will be output as part of a scaffold in
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
406 the assembly file (with a scaffold prefix). Since it is hard to give a reliable estimate of the gap size, those gaps are represented with the default 100 Ns.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
407 The assembly_info.txt file (below) contains additional information about how scaffolds were formed.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
408
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
409 Extra information about contigs/scaffolds is output into the assembly_info.txt file. It is a tab-delimited table with the columns as follows:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
410
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
411 * Contig/scaffold id
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
412 * Length
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
413 * Coverage
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
414 * Is circular, (Y)es or (N)o
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
415 * Is repetitive, (Y)es or (N)o
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
416 * Multiplicity (based on coverage)
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
417 * Alternative group
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
418 * Graph path (graph path corresponding to this contig/scaffold).
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
419
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
420 Scaffold gaps are marked with `??` symbols, and the `*` symbol denotes a terminal graph node. Alternative contigs (representing alternative haplotypes) will have the same alternative
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
421 group ID. Primary contigs are marked by `*`.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
422
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
423 ----
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
424
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
425 **Algorithm Description**
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
426
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
427 This is a brief description of the Flye algorithm. Please refer to the manuscript for more detailed information. The draft contig extension is organized as follows:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
428
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
429 * K-mer counting / erroneous k-mer pre-filtering
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
430 * Solid k-mer selection (k-mers with sufficient frequency, which are unlikely to be erroneous)
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
431 * Contig extension. The algorithm starts from a single read and extends it with the next overlapping read (overlaps are dynamically detected using the selected solid k-mers).
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
432
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
433 Note that we do not attempt to resolve repeats at this stage, thus the reconstructed contigs might contain misassemblies. Flye then aligns the reads on these draft
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
434 contigs using minimap2 and calls a consensus. Afterwards, Flye performs repeat analysis as follows:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
435
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
436 * Repeat graph is constructed from the (possibly misassembled) contigs
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
437 * In this graph all repeats longer than minimum overlap are collapsed
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
438 * The algorithm resolves repeats using the read information and graph structure
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
439 * The unbranching paths in the graph are output as contigs
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
440
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
441 If enabled, after resolving bridged repeats, the Trestle module attempts to resolve simple unbridged repeats (of multiplicity 2) using the heterogeneities between repeat copies.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
442 Finally, Flye performs polishing of the resulting assembly to correct the remaining errors:
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
443
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
444 * Alignment of all reads to the current assembly using minimap2
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
445 * Partition the alignment into mini-alignments (bubbles)
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
446 * Error correction of each bubble using a maximum likelihood approach
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
447
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
448 The polishing steps could be repeated, which might slightly increase quality for some datasets.
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
449
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
450
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
451 ]]></help>
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
452 <expand macro="citations" />
e1e6ef58f334 planemo upload commit bdb45cf3a98e21f5002866b6789a1457f521bf5d
estrain
parents:
diff changeset
453 </tool>