annotate 0.1.0/lib/help/mashsketch.nf @ 6:a3c1cba6f773

"planemo upload"
author kkonganti
date Mon, 27 Nov 2023 19:52:20 -0500
parents c8597e9e1a97
children
rev   line source
// Help text for mash sketch within CPIPES.

/**
 * Build the help text and command-line mapping for the `mash sketch` options.
 *
 * Each option is described by three fields:
 *   clihelp  - text shown to the user, ending with the currently configured default
 *   cliflag  - the flag associated with the option (null when there is none)
 *   clivalue - the value paired with the flag; bare switches use ' ' when
 *              enabled and '' when disabled, valued options use the parameter
 *              value or '' when it is unset
 *
 * @param params Map-like object holding the `mashsketch_*` parameters.
 * @return Map with two entries:
 *         `text`       - '--<option>' mapped to its help text
 *         `helpparams` - '<option>' mapped to [cliflag: ..., clivalue: ...]
 */
def mashsketchHelp(params) {

    Map tool = [:]
    tool.text = [:]
    tool.helpparams = [:]

    Map toolspecs = [
        'mashsketch_run': [
            // This help belongs to `mash sketch` (text previously said `mash screen`).
            clihelp: 'Run `mash sketch` tool. Default: ' +
                (params.mashsketch_run ?: false),
            cliflag: null,
            clivalue: null
        ],
        'mashsketch_l': [
            clihelp: 'List input. Lines in each <input> specify paths to sequence files, ' +
                'one per line. ' +
                "Default: ${params.mashsketch_l}",
            cliflag: '-l',
            clivalue: (params.mashsketch_l ? ' ' : '')
        ],
        'mashsketch_I': [
            clihelp: '<path> ID field for sketch of reads (instead of first sequence ID). ' +
                "Default: ${params.mashsketch_I}",
            cliflag: '-I',
            clivalue: (params.mashsketch_I ?: '')
        ],
        'mashsketch_C': [
            clihelp: '<path> Comment for a sketch of reads (instead of first sequence comment). ' +
                "Default: ${params.mashsketch_C}",
            cliflag: '-C',
            clivalue: (params.mashsketch_C ?: '')
        ],
        'mashsketch_k': [
            clihelp: '<int> K-mer size. Hashes will be based on strings of this many ' +
                'nucleotides. Canonical nucleotides are used by default (see ' +
                'Alphabet options below). (1-32) ' +
                "Default: ${params.mashsketch_k}",
            cliflag: '-k',
            clivalue: (params.mashsketch_k ?: '')
        ],
        'mashsketch_s': [
            clihelp: '<int> Sketch size. Each sketch will have at most this many non-redundant ' +
                'min-hashes. ' +
                "Default: ${params.mashsketch_s}",
            cliflag: '-s',
            clivalue: (params.mashsketch_s ?: '')
        ],
        'mashsketch_i': [
            clihelp: 'Sketch individual sequences, rather than whole files, e.g. for ' +
                'multi-fastas of single-chromosome genomes or pair-wise gene ' +
                'comparisons. ' +
                "Default: ${params.mashsketch_i}",
            cliflag: '-i',
            clivalue: (params.mashsketch_i ? ' ' : '')
        ],
        'mashsketch_S': [
            clihelp: '<int> Seed to provide to the hash function. (0-4294967296) [42] ' +
                "Default: ${params.mashsketch_S}",
            cliflag: '-S',
            clivalue: (params.mashsketch_S ?: '')
        ],

        'mashsketch_w': [
            clihelp: '<num> Probability threshold for warning about low k-mer size. (0-1) ' +
                "Default: ${params.mashsketch_w}",
            cliflag: '-w',
            clivalue: (params.mashsketch_w ?: '')
        ],
        'mashsketch_r': [
            clihelp: 'Input is a read set. See Reads options below. Incompatible with ' +
                '--mashsketch_i. ' +
                "Default: ${params.mashsketch_r}",
            cliflag: '-r',
            clivalue: (params.mashsketch_r ? ' ' : '')
        ],
        'mashsketch_b': [
            clihelp: '<size> Use a Bloom filter of this size (raw bytes or with K/M/G/T) to ' +
                'filter out unique k-mers. This is useful if exact filtering with ' +
                '--mashsketch_m uses too much memory. However, some unique k-mers may pass ' +
                'erroneously, and copies cannot be counted beyond 2. Implies --mashsketch_r. ' +
                "Default: ${params.mashsketch_b}",
            cliflag: '-b',
            clivalue: (params.mashsketch_b ?: '')
        ],
        'mashsketch_m': [
            // Report this option's own default (previously printed mashsketch_r).
            clihelp: '<int> Minimum copies of each k-mer required to pass noise filter for ' +
                'reads. Implies --mashsketch_r. ' +
                "Default: ${params.mashsketch_m}",
            cliflag: '-m',
            clivalue: (params.mashsketch_m ?: '')
        ],
        'mashsketch_c': [
            clihelp: '<num> Target coverage. Sketching will conclude if this coverage is ' +
                'reached before the end of the input file (estimated by average ' +
                'k-mer multiplicity). Implies --mashsketch_r. ' +
                "Default: ${params.mashsketch_c}",
            cliflag: '-c',
            clivalue: (params.mashsketch_c ?: '')
        ],
        'mashsketch_g': [
            clihelp: '<size> Genome size (raw bases or with K/M/G/T). If specified, will be used ' +
                'for p-value calculation instead of an estimated size from k-mer ' +
                'content. Implies --mashsketch_r. ' +
                "Default: ${params.mashsketch_g}",
            cliflag: '-g',
            clivalue: (params.mashsketch_g ?: '')
        ],
        'mashsketch_n': [
            clihelp: 'Preserve strand (by default, strand is ignored by using canonical ' +
                'DNA k-mers, which are alphabetical minima of forward-reverse ' +
                'pairs). Implied if an alphabet is specified with --mashsketch_a ' +
                'or --mashsketch_z. ' +
                "Default: ${params.mashsketch_n}",
            cliflag: '-n',
            clivalue: (params.mashsketch_n ? ' ' : '')
        ],
        'mashsketch_a': [
            clihelp: 'Use amino acid alphabet (A-Z, except BJOUXZ). Implies ' +
                '--mashsketch_n --mashsketch_k 9. ' +
                "Default: ${params.mashsketch_a}",
            cliflag: '-a',
            clivalue: (params.mashsketch_a ? ' ' : '')
        ],
        'mashsketch_z': [
            clihelp: '<text> Alphabet to base hashes on (case ignored by default; ' +
                'see --mashsketch_Z). K-mers with other characters will be ' +
                'ignored. Implies --mashsketch_n. ' +
                "Default: ${params.mashsketch_z}",
            cliflag: '-z',
            clivalue: (params.mashsketch_z ?: '')
        ],
        'mashsketch_Z': [
            // -Z is a bare switch, so it follows the same ' ' / '' convention as
            // the other switches instead of passing the boolean through.
            clihelp: 'Preserve case in k-mers and alphabet (case is ignored by default). ' +
                'Sequence letters whose case is not in the current alphabet will be ' +
                'skipped when sketching. ' +
                "Default: ${params.mashsketch_Z}",
            cliflag: '-Z',
            clivalue: (params.mashsketch_Z ? ' ' : '')
        ]
    ]

    // Split each spec into the user-facing help text and the flag/value pair.
    // cliflag is interpolated into a string, so a null flag becomes "null".
    toolspecs.each { k, v ->
        tool.text['--' + k] = "${v.clihelp}"
        tool.helpparams[k] = [ cliflag: "${v.cliflag}", clivalue: v.clivalue ]
    }

    return tool
}