Mercurial > repos > rliterman > csp2

/*
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    CSP2 Nextflow config file
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    Default config options for all compute environments
----------------------------------------------------------------------------------------
*/

// Enable conda
conda.enabled = true

// Import profile settings
includeConfig "conf/profiles.config"

// CPU/memory settings
process {
    withLabel: 'mummerMem' {
        task_name = 'CSP2-MUMmer'
        cpus = 1
        // memory = '4 GB'
    }
    withLabel: 'skesaMem' {
        task_name = 'CSP2-SKESA'
        // memory = '12 GB'
    }
}

// Global default params
params {

    // Setting output directory

    // Set name for output folder/file prefixes
    out = "CSP2_${new java.util.Date().getTime()}"

    // Set output parent directory [Default: CWD; Set this to have all output go to the same parent folder, with unique IDs set by --out]
    outroot = ""

    // CSP2 can run in the following run-modes:

    // assemble: Assemble read data (--reads/--ref_reads) into FASTA via SKESA (ignores --fasta/--ref_fasta/--snpdiffs)
    // align: Given query data (--reads/--fasta) and reference data (--ref_reads/--ref_fasta), run MUMmer alignment analysis for each query/ref combination (ignores --snpdiffs)
    // screen: Given query data (--reads/--fasta) and reference data (--ref_reads/--ref_fasta) and/or MUMmer output (.snpdiffs), create a report for raw SNP distances between each query and reference assembly
    // snp: Given query data (--reads/--fasta) and reference data (--ref_reads/--ref_fasta) and/or MUMmer output (.snpdiffs), generate alignments and pairwise distances for all queries based on each reference dataset

    runmode = ""

    // Location for isolate sequence data
    reads = ""
    fasta = ""

    // Location for reference sequence data
    ref_reads = ""
    ref_fasta = ""

    // IDs for reference sequences (Comma-separated list)
    ref_id = ""

    // Location for snpdiffs files
    snpdiffs = ""

    // Read read_info
    readext = "fastq.gz"
    forward = "_1.fastq.gz"
    reverse = "_2.fastq.gz"

    ref_readext = "fastq.gz"
    ref_forward = "_1.fastq.gz"
    ref_reverse = "_2.fastq.gz"

    // Analytical variables

    // Only consider queries if the reference genome is covered by at least <min_cov>% [Default: 85]
    min_cov = 85

    // Only consider SNPs from contig alignments longer than <min_len> bp [Default: 500]
    min_len = 500

    // Only consider SNPs from contig alignments with <min_iden>% identity [Default: 99]
    min_iden = 99

    // Remove SNPs that occur within <ref_edge>bp from the end of the reference contig [Default: 150]
    ref_edge = 150

    // Remove SNPs that occur within <query_edge>bp from the end of the query contig [Default: 150]
    query_edge = 150

    // SNP density filters: Given density windows provided by dwin, purge windows where more than the allowable window SNPs (wsnps) are found
    // Default: 3 max per 1000bp, 2 max per 125bp, 1 max per 15bp, filtered from biggest window to smallest
    // Set --dwin 0 to disable density filtering
    dwin = "1000,125,15"
    wsnps = "3,2,1"

    // If running refchooser in snp mode, compare queries to the top X references [Default: 1]
    n_ref = 1

    // If the assembly file contains the string <trim_name>, remove it from the sample name (e.g. '_contigs_skesa')
    trim_name = '""'

    // If running SNP pipeline, set the maximum percent of isolates with missing data allowed in the final alignment/distances [Default: 50]
    max_missing = 50

    // Alternate directory for pybedtools tmp files [Default: "" (system default)]
    tmp_dir = ""

    // Set IDs for isolates to exclude from analysis (Comma-separated list)
    exclude = ""

    // By default, do not perform edge-filtered SNP rescuing
    rescue = "norescue"

    // Help function
    help = "nohelp"
    h = "nohelp"
}
author	rliterman
date	Thu, 19 Dec 2024 13:02:58 -0500
parents	bbbf36187d87
children