jpayne@69
|
1 #!/bin/bash
|
jpayne@69
|
2
|
jpayne@69
|
# Print the help text for this wrapper on standard output.
# Takes no arguments. The text is emitted verbatim (the heredoc delimiter is
# quoted, so nothing inside it is expanded) and is framed by one blank line
# before and one blank line after.
usage() {
  cat <<'USAGE_TEXT'

Written by Brian Bushnell
Last modified July 31, 2015

Description: Reduces Silva entries down to one entry per taxa (the first).
This is accomplished by splitting the semicolon-delimited name on semicolons,
and assuming everything is in the form of:
kingdom;phylum;class;order;family;genus;species
...so it's not very reliable.

Usage: reducesilva.sh in=<file> out=<file> column=<1>

Parameters:
column The taxonomic level. 0=species, 1=genus, etc.
ow=f (overwrite) Overwrites files that already exist.
zl=4 (ziplevel) Set compression level, 1 (low) to 9 (max).
fastawrap=70 Length of lines in fasta output.

Sampling parameters:
reads=-1 Set to a positive number to only process this many INPUT sequences, then quit.

Java Parameters:
-Xmx This will set Java's memory usage, overriding autodetection.
-Xmx20g will specify 20 gigs of RAM, and -Xmx200m will specify 200 megs.
The max is typically 85% of physical memory.
-eoom This flag will cause the process to exit if an out-of-memory
exception occurs. Requires Java 8u92+.
-da Disable assertions.

Please contact Brian Bushnell at bbushnell@lbl.gov if you encounter any problems.

USAGE_TEXT
}
|
jpayne@69
|
36
|
jpayne@69
|
# Locate the directory that really contains this script so the classpath is
# correct even when the script is started through one or more symlinks.
#
# Sets:
#   DIR - absolute path of that directory, with a trailing slash
#   CP  - Java classpath: the "current/" directory beneath DIR
#
# The resolution runs inside a command substitution (a subshell), so the
# caller's working directory is never changed. If any directory on the way
# cannot be entered, the script aborts instead of carrying on with a DIR that
# silently points somewhere else.
DIR="$(
  # A set CDPATH can make 'cd' with a relative path land in an unrelated
  # directory and print its name; neutralise it for this subshell only.
  unset CDPATH
  src="${BASH_SOURCE[0]}"
  while [ -h "$src" ]; do
    # Enter the link's own directory first: the link target read below may be
    # expressed relative to it.
    cd -- "$(dirname -- "$src")" || exit 1
    src="$(readlink -- "$(basename -- "$src")")"
  done
  cd -- "$(dirname -- "$src")" && pwd
)/" || {
  echo "Unable to resolve the directory of ${BASH_SOURCE[0]}" >&2
  exit 1
}

# Simpler alternative that does not follow symlinks, kept for reference:
#DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )" && pwd )/"
CP="${DIR}current/"
|
jpayne@69
|
50
|
jpayne@69
|
# Defaults used further down the script.
# z is the JVM heap flag that ends up on the java command line.
# NOTE(review): 'set' is not read anywhere in this file; presumably it is
# consumed by the helpers in calcmem.sh - confirm there.
z="-Xmx1g"
set=0

# With no first argument (or an empty one), or when help is requested
# explicitly, print the help text and stop. A bare 'exit' reuses the status
# of the preceding command, i.e. of usage.
case "$1" in
  '' | -h | --help)
    usage
    exit
    ;;
esac
|
jpayne@69
|
58
|
jpayne@69
|
# Load the memory helper library that sits next to this script and hand it
# the command line.
# Arguments: the script's own arguments, forwarded unchanged to parseXmx.
# setEnvironment and parseXmx are not defined in this file; they are expected
# to be provided by the sourced calcmem.sh.
# DIR already ends in a slash, so the path contains a doubled slash, exactly
# as before; that is harmless.
calcXmx() {
  . "${DIR}/calcmem.sh"
  setEnvironment
  parseXmx "$@"
}

calcXmx "$@"
|
jpayne@69
|
65
|
jpayne@69
|
# Launch driver.ReduceSilva in a JVM with the configured flags.
# Globals read: EA, EOOM, z (JVM flags) and CP (classpath).
#   NOTE(review): EA and EOOM are not assigned in this file; presumably they
#   are set by the helpers sourced from calcmem.sh - confirm there.
# Arguments: the program arguments, passed to Java exactly as received.
# Outputs:   the command line being run, on stderr.
# Returns:   the exit status of java.
#
# The command is held as an argv array and executed directly rather than
# being flattened into a string and run through eval. That keeps arguments
# and install paths containing spaces intact, and stops shell metacharacters
# inside arguments from being evaluated a second time.
# NOTE(review): callers who embedded literal quotes in an argument to get
# through the old eval (e.g. 'in="a b"') should now pass plain "in=a b".
function reducesilva() {
  # EA, EOOM and z are deliberately left unquoted: each may be empty or carry
  # several space-separated flags, and an empty one must vanish instead of
  # becoming an empty argument.
  local -a cmd=(java $EA $EOOM $z -cp "$CP" driver.ReduceSilva "$@")
  echo "${cmd[*]}" >&2
  "${cmd[@]}"
}

reducesilva "$@"
|