jpayne@69
|
1 #!/bin/bash
|
jpayne@69
|
2
|
jpayne@69
|
# Print the help text for this launcher on stdout.
# Takes no arguments. The text is emitted verbatim (quoted here-doc, so no
# expansion happens), framed by one blank line before and one after.
usage() {
cat <<'USAGE_TEXT'

Written by Shijie Yao
Last modified May 31, 2018

Description: DNA Tetramer analysis.
DNA tetramers are counted for each sub-sequence of window size in the sequence.
The window slides along the sequence by the step length.
Sub-sequence shorter than the window size is ignored. Tetramers containing N are ignored.

Usage: TetramerFreq.sh in=<input file> out=<output file> step=500 window=2000

Input may be fasta or fastq, compressed or uncompressed.

Standard parameters:
in=<file> DNA sequence input file
out=<file> Output file name
step/s=INT Step size (default 500)
window/w=INT Window size (default 2kb); <=0 turns windowing off (e.g. short reads)
short=T/F Print lines for sequences shorter than window (default F)
k=INT Kmer length (default 4)

Java Parameters:
-Xmx This will set Java's memory usage, overriding autodetection.
-Xmx20g will specify 20 gigs of RAM, and -Xmx200m will
specify 200 megs. The max is typically 85% of physical memory.
-eoom This flag will cause the process to exit if an out-of-memory
exception occurs. Requires Java 8u92+.
-da Disable assertions.

Please contact Brian Bushnell at bbushnell@lbl.gov if you encounter any problems.

USAGE_TEXT
}
|
jpayne@69
|
36
|
jpayne@69
|
# Locate the directory that really contains this script, following any chain
# of symlinks, so that the classpath is right even when the script is started
# through a symlink.
pushd . >/dev/null   # remember the caller's working directory
DIR="${BASH_SOURCE[0]}"
until [[ ! -L "$DIR" ]]; do
  # A relative link target is relative to the link's own directory, so step
  # into that directory before reading the link.
  cd "$(dirname "$DIR")"
  DIR="$(readlink "$(basename "$DIR")")"
done
cd "$(dirname "$DIR")"
DIR="$(pwd)/"        # absolute path, always with a trailing slash
popd >/dev/null      # return to the caller's working directory

# Simpler alternative that does not follow symlinks (kept for reference):
#DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )" && pwd )/"

# Java classpath: the "current/" directory next to this script.
CP="${DIR}current/"
|
jpayne@69
|
50
|
jpayne@69
|
# Default JVM heap flags; calcXmx may overwrite them later.
z="-Xmx4g"    # maximum heap
z2="-Xms4g"   # initial heap
set=0         # compared against 1 in calcXmx; presumably set by parseXmx in calcmem.sh when -Xmx is given -- confirm there

# With no first argument, or an explicit help flag, print the help and stop.
case "$1" in
  '' | -h | --help)
    usage
    exit
    ;;
esac
|
jpayne@69
|
59
|
jpayne@69
|
# Choose the JVM heap flags and store them in the globals z (-Xmx) and z2 (-Xms).
# Arguments: the script's command-line arguments, forwarded to parseXmx.
# Globals:   DIR (read), set (read), RAM (read after freeRam), z and z2 (written).
# Relies on calcmem.sh, sourced from $DIR, for setEnvironment, parseXmx and
# freeRam; their exact behaviour is not visible in this file.
calcXmx () {
  . "${DIR}/calcmem.sh"
  setEnvironment
  parseXmx "$@"
  # set == 1 means the heap flags are already final (presumably because the
  # user passed -Xmx -- confirm in calcmem.sh), so autodetection is skipped.
  if [[ $set != 1 ]]; then
    # NOTE(review): arguments look like "default 4000m, use 84% of free RAM" --
    # confirm against freeRam in calcmem.sh.
    freeRam 4000m 84
    z="-Xmx${RAM}m"
    z2="-Xms${RAM}m"
  fi
}
|
jpayne@69
|
71 calcXmx "$@"
|
jpayne@69
|
72
|
jpayne@69
|
# Run jgi.TetramerFrequencies in a JVM, forwarding every argument unchanged.
# Arguments: the script's command-line arguments (in=..., out=..., etc.).
# Globals:   EA, EOOM (read; JVM flags, presumably set by calcmem.sh -- not
#            visible in this file), z (read; -Xmx flag), CP (read; classpath).
# Outputs:   the command line on stderr, then whatever the Java program prints.
# Returns:   the exit status of java.
tetramerfreq () {
  # Build the command as an argv array and execute it directly. Flattening it
  # into a string and eval-ing it would re-split and re-interpret arguments,
  # breaking paths with spaces and letting shell metacharacters run as code.
  local -a cmd
  # EA and EOOM are left unquoted on purpose: each may be empty or hold
  # several flags, so they must word-split. z is dropped if empty.
  # shellcheck disable=SC2086
  cmd=(java $EA $EOOM ${z:+"$z"} -cp "$CP" jgi.TetramerFrequencies "$@")
  printf '%s\n' "${cmd[*]}" >&2
  "${cmd[@]}"
}
|
jpayne@69
|
78
|
jpayne@69
|
79 tetramerfreq "$@"
|