Mercurial > repos > rliterman > csp2
comparison CSP2/CSP2_env/env-d9b9114564458d9d-741b3de822f2aaca6c6caa4325c4afce/opt/bbmap-39.01-1/splitnextera.sh @ 69:33d812a61356
planemo upload commit 2e9511a184a1ca667c7be0c6321a36dc4e3d116d
author | jpayne |
---|---|
date | Tue, 18 Mar 2025 17:55:14 -0400 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
67:0e9998148a16 | 69:33d812a61356 |
---|---|
1 #!/bin/bash | |
2 | |
3 usage(){ | |
4 echo " | |
5 Written by Brian Bushnell | |
6 Last modified March 6, 2015 | |
7 | |
8 Description: Splits Nextera LMP libraries into subsets based on linker orientation: | |
9 LMP, fragment, unknown, and singleton. | |
10 Please read bbmap/docs/guides/SplitNexteraGuide.txt for more information. | |
11 | |
12 Usage: splitnextera.sh in=<file> out=<file> outf=<file> outu=<file> outs=<file> | |
13 | |
14 For pairs in two files, use in1, in2, out1, out2, etc. | |
15 | |
16 *** Note *** | |
17 For maximal speed, the linkers can be replaced with a constant symbol before running splitnextera. | |
18 | |
19 In other words, you can either do this (which is slightly faster): | |
20 bbduk.sh in=reads.fq out=replaced.fq ktmask=J k=19 hdist=1 mink=11 hdist2=0 literal=CTGTCTCTTATACACATCTAGATGTGTATAAGAGACAG | |
21 splitnextera.sh in=replaced.fq out=longmate.fq outf=frag.fq outu=unknown.fq outs=singleton.fq | |
22 | |
23 Or this: | |
24 splitnextera.sh in=reads.fq out=longmate.fq outf=frag.fq outu=unknown.fq outs=singleton.fq mask=t | |
25 | |
26 | |
27 I/O parameters: | |
28 in=<file> Input reads. Set to 'stdin.fq' to read from stdin. | |
29 out=<file> Output for pairs with LMP orientation. | |
30 outf=<file> Output for pairs with fragment orientation. | |
31 outu=<file> Pairs with unknown orientation. | |
32 outs=<file> Singleton output. | |
33 ow=f (overwrite) Overwrites files that already exist. | |
34 app=f (append) Append to files that already exist. | |
35 zl=4 (ziplevel) Set compression level, 1 (low) to 9 (max). | |
36 int=f (interleaved) Determines whether INPUT file is considered interleaved. | |
37 qin=auto ASCII offset for input quality. May be 33 (Sanger), 64 (Illumina), or auto. | |
38 qout=auto ASCII offset for output quality. May be 33 (Sanger), 64 (Illumina), or auto (same as input). | |
39 | |
40 Processing Parameters: | |
41 mask=f Set to true if you have not already converted junctions to a symbol; the conversion will then be done automatically. | |
42 junction=J Look for this symbol to designate the junction bases. | |
43 innerlmp=f Generate long mate pairs from the inner pair also, when the junction is found in both reads. | |
44 rename=t Rename read 2 of output when using single-ended input. | |
45 minlength=40 (ml) Do not output reads shorter than this. | |
46 merge=f Attempt to merge overlapping reads before looking for junctions. | |
47 testmerge=0.0 If nonzero, only merge reads if at least this fraction of input reads are mergeable. | |
48 | |
49 Sampling parameters: | |
50 | |
51 reads=-1 Set to a positive number to only process this many INPUT reads (or pairs), then quit. | |
52 samplerate=1 Randomly output only this fraction of reads; 1 means sampling is disabled. | |
53 sampleseed=-1 Set to a positive number to use that prng seed for sampling (allowing deterministic sampling). | |
54 | |
55 Java Parameters: | |
56 -Xmx This will set Java's memory usage, overriding autodetection. | |
57 -Xmx20g will specify 20 gigs of RAM, and -Xmx200m will specify 200 megs. | |
58 The max is typically 85% of physical memory. | |
59 -eoom This flag will cause the process to exit if an out-of-memory | |
60 exception occurs. Requires Java 8u92+. | |
61 -da Disable assertions. | |
62 | |
63 Please contact Brian Bushnell at bbushnell@lbl.gov if you encounter any problems. | |
64 " | |
65 } | |
66 | |
67 #This block allows symlinked shellscripts to correctly set classpath. | |
68 pushd . > /dev/null | |
69 DIR="${BASH_SOURCE[0]}" | |
70 while [ -h "$DIR" ]; do | |
71 cd "$(dirname "$DIR")" | |
72 DIR="$(readlink "$(basename "$DIR")")" | |
73 done | |
74 cd "$(dirname "$DIR")" | |
75 DIR="$(pwd)/" | |
76 popd > /dev/null | |
77 | |
78 #DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )" && pwd )/" | |
79 CP="$DIR""current/" | |
80 | |
81 z="-Xmx200m" | |
82 set=0 | |
83 | |
84 if [ -z "$1" ] || [[ $1 == -h ]] || [[ $1 == --help ]]; then | |
85 usage | |
86 exit | |
87 fi | |
88 | |
89 calcXmx () { | |
90 source "$DIR""/calcmem.sh" | |
91 setEnvironment | |
92 parseXmx "$@" | |
93 } | |
94 calcXmx "$@" | |
95 | |
96 function splitnextera() { | |
97 local CMD="java $EA $EOOM $z -cp $CP jgi.SplitNexteraLMP $@" | |
98 echo $CMD >&2 | |
99 eval $CMD | |
100 } | |
101 | |
102 splitnextera "$@" |