forked from jenniferlu717/Bracken
-
Notifications
You must be signed in to change notification settings - Fork 0
/
bracken
executable file
·122 lines (118 loc) · 4.22 KB
/
bracken
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
#!/bin/bash
#####################################################################
#bracken.sh checks that the Bracken files are present and generates the abundance estimation
#Copyright (C) 2016-2020 Jennifer Lu, [email protected]
#
#This file is part of Bracken.
#
#Bracken is free software; you can redistribute it and/or modify
#it under the terms of the GNU General Public License as published by
#the Free Software Foundation; either version 3 of the license, or
#(at your option) any later version.
#
#This program is distributed in the hope that it will be useful,
#but WITHOUT ANY WARRANTY; without even the implied warranty of
#MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
#GNU General Public License for more details
#
#You should have received a copy of the GNU General Public License
#along with this program; if not, see <http://www.gnu.org/licenses/>.
#
#####################################################################
# Strict mode: stop on the first failing command (errexit) and treat any
# reference to an unset variable as an error (nounset).
set -o errexit -o nounset

# Release identifier of this script.
VERSION=2.5

# Values supplied on the command line; they start out empty.
DATABASE=
INPUT=
OUTPUT=
OUTREPORT=

# Tunable settings and their defaults.
LEVEL=S
READ_LEN=100
THRESHOLD=10
# Print the command-line synopsis and a description of every option to stdout.
# The THRESHOLD default shown here is 10, the value the script assigns to
# THRESHOLD before option parsing.
usage() {
    echo "Usage: bracken -d MY_DB -i INPUT -o OUTPUT -w OUTREPORT -r READ_LEN -l LEVEL -t THRESHOLD"
    echo " MY_DB location of Kraken database"
    echo " INPUT Kraken REPORT file to use for abundance estimation"
    echo " OUTPUT file name for Bracken default output"
    echo " OUTREPORT New Kraken REPORT output file with Bracken read estimates"
    echo " READ_LEN read length to get all classifications for (default: 100)"
    echo " LEVEL level to estimate abundance at [options: D,P,C,O,F,G,S,S1,etc] (default: S)"
    echo " THRESHOLD number of reads required PRIOR to abundance estimation to perform reestimation (default: 10)"
    echo
}

# Copy each recognised flag's argument into its configuration variable.
#   -h            prints the usage text and exits with status 0.
#   anything else (unknown flag, or a flag missing its argument; getopts
#                 reports both as "?") prints the usage text on stderr and
#                 exits with status 1 so callers can detect the failure.
while getopts "t:i:o:r:d:w:l:h" OPTION; do
    case "$OPTION" in
        t) THRESHOLD=$OPTARG ;;
        r) READ_LEN=$OPTARG ;;
        l) LEVEL=$OPTARG ;;
        d) DATABASE=$OPTARG ;;
        i) INPUT=$OPTARG ;;
        o) OUTPUT=$OPTARG ;;
        w) OUTREPORT=$OPTARG ;;
        h)
            usage
            exit 0
            ;;
        *)
            usage >&2
            exit 1
            ;;
    esac
done
# Remove one trailing "/" from the database path so that later
# "$DATABASE/<file>" joins do not contain a doubled slash.
# The suffix-removal expansion is used instead of a negative-length substring
# because the latter is only accepted by bash 4.2 and newer.
# A bare "/" is left alone so it is not reduced to an empty string.
if [[ "$DATABASE" == */ && "$DATABASE" != "/" ]]; then
    DATABASE=${DATABASE%/}
fi
# Validate the database location before doing any work.
# Every expansion is quoted: an unquoted empty $DATABASE would collapse the
# test to "[ -d ]", which is true, and paths containing spaces would be split.
# Failures are reported on stderr and end the script with status 1.
echo " >> Checking for Valid Options..."

# The Kraken database directory must exist.
if [[ ! -d "$DATABASE" ]]; then
    echo " ERROR: Kraken database ${DATABASE} does not exist" >&2
    exit 1
fi

# The directory must contain the kmer distribution for the chosen read length.
if [[ ! -f "$DATABASE/database${READ_LEN}mers.kmer_distrib" ]]; then
    echo " ERROR: ${DATABASE}/database${READ_LEN}mers.kmer_distrib does not exist" >&2
    echo " Run bracken-build to generate the kmer distribution file." >&2
    exit 1
fi
# Set DIR to the absolute, physical directory that holds the real script file,
# so the bundled src/ directory is found when the script is started through a
# symlink. Each link is followed in turn; a relative link target is
# interpreted relative to the directory containing that link, not the caller's
# working directory.
script_path=$0
while [[ -L "$script_path" ]]; do
    link_dir=$(cd -P "$(dirname "$script_path")" >/dev/null 2>&1 && pwd)
    script_path=$(readlink "$script_path")
    if [[ "$script_path" != /* ]]; then
        script_path="$link_dir/$script_path"
    fi
done
DIR=$(cd -P "$(dirname "$script_path")" >/dev/null 2>&1 && pwd)
# Run the abundance estimation on the Kraken report.
echo " >> Running Bracken "

# The input report must be an existing regular file. The expansion is quoted
# because an unquoted empty $INPUT would collapse the test to "[ -f ]", which
# is true. The failure is reported on stderr with a non-zero exit status.
if [[ ! -f "$INPUT" ]]; then
    echo " ERROR: Input file ${INPUT} does not exist" >&2
    echo " If running kraken v1.0, run kraken-report" >&2
    echo " If running kraken v2.0, run kraken2 with the --report flag" >&2
    exit 1
fi

# Assemble the argument list once, as an array, so values containing spaces
# reach est_abundance.py intact. --out-report is added only when a report
# file name was supplied.
est_args=(-i "$INPUT" -o "$OUTPUT")
if [[ -n "$OUTREPORT" ]]; then
    est_args+=(--out-report "$OUTREPORT")
fi
est_args+=(-k "$DATABASE/database${READ_LEN}mers.kmer_distrib" -l "$LEVEL" -t "$THRESHOLD")

# Log the command exactly as it is about to be run (including --out-report).
echo " >> python src/est_abundance.py ${est_args[*]}"
python "$DIR/src/est_abundance.py" "${est_args[@]}"

echo " Bracken complete."