diff 0.5.0/lib/help/mashsketch.nf @ 1:365849f031fd

"planemo upload"
author kkonganti
date Mon, 05 Jun 2023 18:48:51 -0400
parents
children
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/0.5.0/lib/help/mashsketch.nf	Mon Jun 05 18:48:51 2023 -0400
@@ -0,0 +1,151 @@
+// Help text for mash sketch within CPIPES.
+
+def mashsketchHelp(params) {
+
+    Map tool = [:]
+    Map toolspecs = [:]
+    tool.text = [:]
+    tool.helpparams = [:]
+
+    toolspecs = [
+        'mashsketch_run': [
+            clihelp: 'Run `mash screen` tool. Default: ' +
+                (params.mashsketch_run ?: false),
+            cliflag: null,
+            clivalue: null
+        ],
+        'mashsketch_l': [
+            clihelp: 'List input. Lines in each <input> specify paths to sequence files, ' +
+                'one per line. ' +
+                "Default: ${params.mashsketch_l}",
+            cliflag: '-l',
+            clivalue: (params.mashsketch_l ? ' ' : '')
+        ],
+        'mashsketch_I': [
+            clihelp: '<path>  ID field for sketch of reads (instead of first sequence ID). ' +
+                "Default: ${params.mashsketch_I}",
+            cliflag: '-I',
+            clivalue: (params.mashsketch_I ?: '')
+        ],
+        'mashsketch_C': [
+            clihelp: '<path>  Comment for a sketch of reads (instead of first sequence comment). ' +
+                "Default: ${params.mashsketch_C}",
+            cliflag: '-C',
+            clivalue: (params.mashsketch_C ?: '')
+        ],
+        'mashsketch_k': [
+            clihelp: '<int>   K-mer size. Hashes will be based on strings of this many ' +
+                'nucleotides. Canonical nucleotides are used by default (see ' +
+                'Alphabet options below). (1-32) ' +
+                "Default: ${params.mashsketch_k}",
+            cliflag: '-k',
+            clivalue: (params.mashsketch_k ?: '')
+        ],
+        'mashsketch_s': [
+            clihelp: '<int>   Sketch size. Each sketch will have at most this many non-redundant ' +
+                'min-hashes. ' +
+                "Default: ${params.mashsketch_s}",
+            cliflag: '-s',
+            clivalue: (params.mashsketch_s ?: '')
+        ],
+        'mashsketch_i': [
+            clihelp: 'Sketch individual sequences, rather than whole files, e.g. for ' +
+                'multi-fastas of single-chromosome genomes or pair-wise gene ' +
+                'comparisons. ' +
+                "Default: ${params.mashsketch_i}",
+            cliflag: '-i',
+            clivalue: (params.mashsketch_i ? ' ' : '')
+        ],
+        'mashsketch_S': [
+            clihelp: '<int>   Seed to provide to the hash function. (0-4294967296) [42] ' +
+                "Default: ${params.mashsketch_S}",
+            cliflag: '-S',
+            clivalue: (params.mashsketch_S ?: '')
+        ],
+
+        'mashsketch_w': [
+            clihelp: '<num>   Probability threshold for warning about low k-mer size. (0-1) ' +
+                "Default: ${params.mashsketch_w}",
+            cliflag: '-w',
+            clivalue: (params.mashsketch_w ?: '')
+        ],
+        'mashsketch_r': [
+            clihelp: 'Input is a read set. See Reads options below. Incompatible with ' +
+                '--mashsketch_i. ' +
+                "Default: ${params.mashsketch_r}",
+            cliflag: '-r',
+            clivalue: (params.mashsketch_r ? ' ' : '')
+        ],
+        'mashsketch_b': [
+            clihelp: '<size>  Use a Bloom filter of this size (raw bytes or with K/M/G/T) to ' +
+                'filter out unique k-mers. This is useful if exact filtering with ' +
+                '--mashsketch_m uses too much memory. However, some unique k-mers may pass ' +
+                'erroneously, and copies cannot be counted beyond 2. Implies --mashsketch_r. ' +
+                "Default: ${params.mashsketch_b}",
+            cliflag: '-b',
+            clivalue: (params.mashsketch_b ?: '')
+        ],
+        'mashsketch_m': [
+            clihelp: '<int>   Minimum copies of each k-mer required to pass noise filter for ' +
+                'reads. Implies --mashsketch_r. ' +
+                "Default: ${params.mashsketch_r}",
+            cliflag: '-m',
+            clivalue: (params.mashsketch_m ?: '')
+        ],
+        'mashsketch_c': [
+            clihelp: '<num>   Target coverage. Sketching will conclude if this coverage is ' +
+                'reached before the end of the input file (estimated by average ' +
+                'k-mer multiplicity). Implies --mashsketch_r. ' +
+                "Default: ${params.mashsketch_c}",
+            cliflag: '-c',
+            clivalue: (params.mashsketch_c ?: '')
+        ],
+        'mashsketch_g': [
+            clihelp: '<size>  Genome size (raw bases or with K/M/G/T). If specified, will be used ' +
+                'for p-value calculation instead of an estimated size from k-mer ' +
+                'content. Implies --mashsketch_r. ' +
+                "Default: ${params.mashsketch_g}",
+            cliflag: '-g',
+            clivalue: (params.mashsketch_g ?: '')
+        ],
+        'mashsketch_n': [
+            clihelp: 'Preserve strand (by default, strand is ignored by using canonical ' +
+                'DNA k-mers, which are alphabetical minima of forward-reverse ' +
+                'pairs). Implied if an alphabet is specified with --mashsketch_a ' +
+                'or --mashsketch_z. ' +
+                "Default: ${params.mashsketch_n}",
+            cliflag: '-n',
+            clivalue: (params.mashsketch_n ? ' ' : '')
+        ],
+        'mashsketch_a': [
+            clihelp: 'Use amino acid alphabet (A-Z, except BJOUXZ). Implies ' +
+                '--mashsketch_n --mashsketch_k 9. ' +
+                "Default: ${params.mashsketch_a}",
+            cliflag: '-a',
+            clivalue: (params.mashsketch_a ? ' ' : '')
+        ],
+        'mashsketch_z': [
+            clihelp: '<text>  Alphabet to base hashes on (case ignored by default; ' +
+                'see --mashsketch_Z). K-mers with other characters will be ' +
+                'ignored. Implies --mashsketch_n. ' +
+                "Default: ${params.mashsketch_z}",
+            cliflag: '-z',
+            clivalue: (params.mashsketch_z ?: '')
+        ],
+        'mashsketch_Z': [
+            clihelp: 'Preserve case in k-mers and alphabet (case is ignored by default). ' +
+                'Sequence letters whose case is not in the current alphabet will be ' +
+                'skipped when sketching. ' +
+                "Default: ${params.mashsketch_Z}",
+            cliflag: '-Z',
+            clivalue: (params.mashsketch_Z ?: '')
+        ]
+    ]
+
+    toolspecs.each {
+        k, v -> tool.text['--' + k] = "${v.clihelp}"
+        tool.helpparams[k] = [ cliflag: "${v.cliflag}", clivalue: v.clivalue ]
+    }
+
+    return tool
+}
\ No newline at end of file