Mercurial > repos > rliterman > csp2
diff CSP2/nextflow.config @ 0:01431fa12065
"planemo upload"
author | rliterman |
---|---|
date | Mon, 02 Dec 2024 10:40:55 -0500 |
parents | |
children | 0d775868ee62 |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/CSP2/nextflow.config Mon Dec 02 10:40:55 2024 -0500 @@ -0,0 +1,102 @@ +/* +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + CSP2 Nextflow config file +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + Default config options for all compute environments +---------------------------------------------------------------------------------------- +*/ + +// Enable conda +conda.enabled = true + +// Import profile settings +includeConfig "conf/profiles.config" + +// Global default params +params { + + // Setting output directory + + // Set name for output folder/file prefixes + out = "CSP2_${new java.util.Date().getTime()}" + + // Set output parent directory [Default: CWD; Set this to have all output go to the same parent folder, with unique IDs set by --out] + outroot = "" + + // CSP2 can run in the following run-modes: + + // assemble: Assemble read data (--reads/--ref_reads) into FASTA via SKESA (ignores --fasta/--ref_fasta/--snpdiffs) + // align: Given query data (--reads/--fasta) and reference data (--ref_reads/--ref_fasta), run MUMmer alignment analysis for each query/ref combination (ignores --snpdiffs) + // screen: Given query data (--reads/--fasta) and reference data (--ref_reads/--ref_fasta) and/or MUMmer output (.snpdiffs), create a report for raw SNP distances between each query and reference assembly + // snp: Given query data (--reads/--fasta) and reference data (--ref_reads/--ref_fasta) and/or MUMmer output (.snpdiffs), generate alignments and pairwise distances for all queries based on each reference dataset + + runmode = "" + + // Location for isolate sequence data + reads = "" + fasta = "" + + // Location for reference sequence data + ref_reads = "" + ref_fasta = "" + + // IDs for reference sequences (Comma-separated list) + ref_id = "" + + // Location for snpdiffs files + snpdiffs = "" + + // Read read_info + readext = "fastq.gz" + forward = "_1.fastq.gz" + reverse = "_2.fastq.gz" + + ref_readext = "fastq.gz" + ref_forward = "_1.fastq.gz" + ref_reverse = "_2.fastq.gz" + + // Analytical variables + + // Only consider queries if the reference genome is covered by at least <min_cov>% [Default: 85] + min_cov = 85 + + // Only consider SNPs from contig alignments longer than <min_len> bp [Default: 500] + min_len = 500 + + // Only consider SNPs from contig alignments with <min_iden>% identity [Default: 99] + min_iden = 99 + + // Remove SNPs that occur within <ref_edge>bp from the end of the reference contig [Default: 150] + ref_edge = 150 + + // Remove SNPs that occur within <query_edge>bp from the end of the query contig [Default: 150] + query_edge = 150 + + // SNP density filters: Given density windows provided by dwin, purge windows where more than the allowable window SNPs (wsnps) are found + // Default: 3 max per 1000bp, 2 max per 125bp, 1 max per 15bp, filtered from biggest window to smallest + // Set --dwin 0 to disable density filtering + dwin = "1000,125,15" + wsnps = "3,2,1" + + // If running refchooser in snp mode, compare queries to the top X references [Default: 1] + n_ref = 1 + + // If the assembly file contains the string <trim_name>, remove it from the sample name (e.g. '_contigs_skesa') + trim_name = '""' + + // If running SNP pipeline, set the maximum percent of isolates with missing data allowed in the final alignment/distances [Default: 50] + max_missing = 50 + + // Alternate directory for pybedtools tmp files [Default: "" (system default)] + tmp_dir = "" + + // Set IDs for isolates to exclude from analysis (Comma-separated list) + exclude = "" + + // By default, do not perform edge-filtered SNP rescuing + rescue = "norescue" + + // Help function + help = "nohelp" + h = "nohelp" +} \ No newline at end of file