kkonganti@1
|
1 // Help text for mash sketch within CPIPES.
|
kkonganti@1
|
2
|
kkonganti@1
|
3 def mashsketchHelp(params) {
|
kkonganti@1
|
4
|
kkonganti@1
|
5 Map tool = [:]
|
kkonganti@1
|
6 Map toolspecs = [:]
|
kkonganti@1
|
7 tool.text = [:]
|
kkonganti@1
|
8 tool.helpparams = [:]
|
kkonganti@1
|
9
|
kkonganti@1
|
10 toolspecs = [
|
kkonganti@1
|
11 'mashsketch_run': [
|
kkonganti@1
|
12 clihelp: 'Run `mash screen` tool. Default: ' +
|
kkonganti@1
|
13 (params.mashsketch_run ?: false),
|
kkonganti@1
|
14 cliflag: null,
|
kkonganti@1
|
15 clivalue: null
|
kkonganti@1
|
16 ],
|
kkonganti@1
|
17 'mashsketch_l': [
|
kkonganti@1
|
18 clihelp: 'List input. Lines in each <input> specify paths to sequence files, ' +
|
kkonganti@1
|
19 'one per line. ' +
|
kkonganti@1
|
20 "Default: ${params.mashsketch_l}",
|
kkonganti@1
|
21 cliflag: '-l',
|
kkonganti@1
|
22 clivalue: (params.mashsketch_l ? ' ' : '')
|
kkonganti@1
|
23 ],
|
kkonganti@1
|
24 'mashsketch_I': [
|
kkonganti@1
|
25 clihelp: '<path> ID field for sketch of reads (instead of first sequence ID). ' +
|
kkonganti@1
|
26 "Default: ${params.mashsketch_I}",
|
kkonganti@1
|
27 cliflag: '-I',
|
kkonganti@1
|
28 clivalue: (params.mashsketch_I ?: '')
|
kkonganti@1
|
29 ],
|
kkonganti@1
|
30 'mashsketch_C': [
|
kkonganti@1
|
31 clihelp: '<path> Comment for a sketch of reads (instead of first sequence comment). ' +
|
kkonganti@1
|
32 "Default: ${params.mashsketch_C}",
|
kkonganti@1
|
33 cliflag: '-C',
|
kkonganti@1
|
34 clivalue: (params.mashsketch_C ?: '')
|
kkonganti@1
|
35 ],
|
kkonganti@1
|
36 'mashsketch_k': [
|
kkonganti@1
|
37 clihelp: '<int> K-mer size. Hashes will be based on strings of this many ' +
|
kkonganti@1
|
38 'nucleotides. Canonical nucleotides are used by default (see ' +
|
kkonganti@1
|
39 'Alphabet options below). (1-32) ' +
|
kkonganti@1
|
40 "Default: ${params.mashsketch_k}",
|
kkonganti@1
|
41 cliflag: '-k',
|
kkonganti@1
|
42 clivalue: (params.mashsketch_k ?: '')
|
kkonganti@1
|
43 ],
|
kkonganti@1
|
44 'mashsketch_s': [
|
kkonganti@1
|
45 clihelp: '<int> Sketch size. Each sketch will have at most this many non-redundant ' +
|
kkonganti@1
|
46 'min-hashes. ' +
|
kkonganti@1
|
47 "Default: ${params.mashsketch_s}",
|
kkonganti@1
|
48 cliflag: '-s',
|
kkonganti@1
|
49 clivalue: (params.mashsketch_s ?: '')
|
kkonganti@1
|
50 ],
|
kkonganti@1
|
51 'mashsketch_i': [
|
kkonganti@1
|
52 clihelp: 'Sketch individual sequences, rather than whole files, e.g. for ' +
|
kkonganti@1
|
53 'multi-fastas of single-chromosome genomes or pair-wise gene ' +
|
kkonganti@1
|
54 'comparisons. ' +
|
kkonganti@1
|
55 "Default: ${params.mashsketch_i}",
|
kkonganti@1
|
56 cliflag: '-i',
|
kkonganti@1
|
57 clivalue: (params.mashsketch_i ? ' ' : '')
|
kkonganti@1
|
58 ],
|
kkonganti@1
|
59 'mashsketch_S': [
|
kkonganti@1
|
60 clihelp: '<int> Seed to provide to the hash function. (0-4294967296) [42] ' +
|
kkonganti@1
|
61 "Default: ${params.mashsketch_S}",
|
kkonganti@1
|
62 cliflag: '-S',
|
kkonganti@1
|
63 clivalue: (params.mashsketch_S ?: '')
|
kkonganti@1
|
64 ],
|
kkonganti@1
|
65
|
kkonganti@1
|
66 'mashsketch_w': [
|
kkonganti@1
|
67 clihelp: '<num> Probability threshold for warning about low k-mer size. (0-1) ' +
|
kkonganti@1
|
68 "Default: ${params.mashsketch_w}",
|
kkonganti@1
|
69 cliflag: '-w',
|
kkonganti@1
|
70 clivalue: (params.mashsketch_w ?: '')
|
kkonganti@1
|
71 ],
|
kkonganti@1
|
72 'mashsketch_r': [
|
kkonganti@1
|
73 clihelp: 'Input is a read set. See Reads options below. Incompatible with ' +
|
kkonganti@1
|
74 '--mashsketch_i. ' +
|
kkonganti@1
|
75 "Default: ${params.mashsketch_r}",
|
kkonganti@1
|
76 cliflag: '-r',
|
kkonganti@1
|
77 clivalue: (params.mashsketch_r ? ' ' : '')
|
kkonganti@1
|
78 ],
|
kkonganti@1
|
79 'mashsketch_b': [
|
kkonganti@1
|
80 clihelp: '<size> Use a Bloom filter of this size (raw bytes or with K/M/G/T) to ' +
|
kkonganti@1
|
81 'filter out unique k-mers. This is useful if exact filtering with ' +
|
kkonganti@1
|
82 '--mashsketch_m uses too much memory. However, some unique k-mers may pass ' +
|
kkonganti@1
|
83 'erroneously, and copies cannot be counted beyond 2. Implies --mashsketch_r. ' +
|
kkonganti@1
|
84 "Default: ${params.mashsketch_b}",
|
kkonganti@1
|
85 cliflag: '-b',
|
kkonganti@1
|
86 clivalue: (params.mashsketch_b ?: '')
|
kkonganti@1
|
87 ],
|
kkonganti@1
|
88 'mashsketch_m': [
|
kkonganti@1
|
89 clihelp: '<int> Minimum copies of each k-mer required to pass noise filter for ' +
|
kkonganti@1
|
90 'reads. Implies --mashsketch_r. ' +
|
kkonganti@1
|
91 "Default: ${params.mashsketch_r}",
|
kkonganti@1
|
92 cliflag: '-m',
|
kkonganti@1
|
93 clivalue: (params.mashsketch_m ?: '')
|
kkonganti@1
|
94 ],
|
kkonganti@1
|
95 'mashsketch_c': [
|
kkonganti@1
|
96 clihelp: '<num> Target coverage. Sketching will conclude if this coverage is ' +
|
kkonganti@1
|
97 'reached before the end of the input file (estimated by average ' +
|
kkonganti@1
|
98 'k-mer multiplicity). Implies --mashsketch_r. ' +
|
kkonganti@1
|
99 "Default: ${params.mashsketch_c}",
|
kkonganti@1
|
100 cliflag: '-c',
|
kkonganti@1
|
101 clivalue: (params.mashsketch_c ?: '')
|
kkonganti@1
|
102 ],
|
kkonganti@1
|
103 'mashsketch_g': [
|
kkonganti@1
|
104 clihelp: '<size> Genome size (raw bases or with K/M/G/T). If specified, will be used ' +
|
kkonganti@1
|
105 'for p-value calculation instead of an estimated size from k-mer ' +
|
kkonganti@1
|
106 'content. Implies --mashsketch_r. ' +
|
kkonganti@1
|
107 "Default: ${params.mashsketch_g}",
|
kkonganti@1
|
108 cliflag: '-g',
|
kkonganti@1
|
109 clivalue: (params.mashsketch_g ?: '')
|
kkonganti@1
|
110 ],
|
kkonganti@1
|
111 'mashsketch_n': [
|
kkonganti@1
|
112 clihelp: 'Preserve strand (by default, strand is ignored by using canonical ' +
|
kkonganti@1
|
113 'DNA k-mers, which are alphabetical minima of forward-reverse ' +
|
kkonganti@1
|
114 'pairs). Implied if an alphabet is specified with --mashsketch_a ' +
|
kkonganti@1
|
115 'or --mashsketch_z. ' +
|
kkonganti@1
|
116 "Default: ${params.mashsketch_n}",
|
kkonganti@1
|
117 cliflag: '-n',
|
kkonganti@1
|
118 clivalue: (params.mashsketch_n ? ' ' : '')
|
kkonganti@1
|
119 ],
|
kkonganti@1
|
120 'mashsketch_a': [
|
kkonganti@1
|
121 clihelp: 'Use amino acid alphabet (A-Z, except BJOUXZ). Implies ' +
|
kkonganti@1
|
122 '--mashsketch_n --mashsketch_k 9. ' +
|
kkonganti@1
|
123 "Default: ${params.mashsketch_a}",
|
kkonganti@1
|
124 cliflag: '-a',
|
kkonganti@1
|
125 clivalue: (params.mashsketch_a ? ' ' : '')
|
kkonganti@1
|
126 ],
|
kkonganti@1
|
127 'mashsketch_z': [
|
kkonganti@1
|
128 clihelp: '<text> Alphabet to base hashes on (case ignored by default; ' +
|
kkonganti@1
|
129 'see --mashsketch_Z). K-mers with other characters will be ' +
|
kkonganti@1
|
130 'ignored. Implies --mashsketch_n. ' +
|
kkonganti@1
|
131 "Default: ${params.mashsketch_z}",
|
kkonganti@1
|
132 cliflag: '-z',
|
kkonganti@1
|
133 clivalue: (params.mashsketch_z ?: '')
|
kkonganti@1
|
134 ],
|
kkonganti@1
|
135 'mashsketch_Z': [
|
kkonganti@1
|
136 clihelp: 'Preserve case in k-mers and alphabet (case is ignored by default). ' +
|
kkonganti@1
|
137 'Sequence letters whose case is not in the current alphabet will be ' +
|
kkonganti@1
|
138 'skipped when sketching. ' +
|
kkonganti@1
|
139 "Default: ${params.mashsketch_Z}",
|
kkonganti@1
|
140 cliflag: '-Z',
|
kkonganti@1
|
141 clivalue: (params.mashsketch_Z ?: '')
|
kkonganti@1
|
142 ]
|
kkonganti@1
|
143 ]
|
kkonganti@1
|
144
|
kkonganti@1
|
145 toolspecs.each {
|
kkonganti@1
|
146 k, v -> tool.text['--' + k] = "${v.clihelp}"
|
kkonganti@1
|
147 tool.helpparams[k] = [ cliflag: "${v.cliflag}", clivalue: v.clivalue ]
|
kkonganti@1
|
148 }
|
kkonganti@1
|
149
|
kkonganti@1
|
150 return tool
|
kkonganti@1
|
151 } |