forked from naumenko-sa/cre
-
Notifications
You must be signed in to change notification settings - Fork 0
/
cre.prepare_bcbio_run.sh
executable file
·78 lines (64 loc) · 2.03 KB
/
cre.prepare_bcbio_run.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
#!/bin/bash
# prepares family for bcbio run when input files are family_sample.bam or family_sample_1/2.fq.gz
family=$1
# $2 = template type,
# - default = no value = default WES
# - noalign - no alignment (for rerunning or for running after alignment to reference with decoy),
# - fast - no realignment,recalibration, and only gatk
# - validation = NA12878 validation
# - align_decoy - align only, reference with decoy
# - annotate - variants were pre-called, annotation only
template_type=$2
echo "Generating bcbio project using template type: " $template_type
cd $family
cp ~/cre/bcbio.sample_sheet_header.csv $family.csv
cd input
shopt -s extglob
ls @(*.bam|*.gz) | sed s/.bam// | sed s/.bai// | sed s/"_1.fq.gz"// | sed s/"_2.fq.gz"// | sort | uniq > ../samples.txt
cd ..
variant_regions=""
#default template
template=~/cre/config/cre.bcbio.templates.wes.yaml
if [ -n "$2" ]
then
if [ $template_type == "noalign" ]
then
template=~/cre/config/cre.bcbio.templates.wes.noalign.yaml
elif [ $template_type == "fast" ]
then
echo fast
template=~/cre/config/cre.bcbio.templates.wes.fast.yaml
elif [ $template_type == "validation" ]
then
template=~/cre/config/cre.bcbio.templates.wes.validation.yaml
variant_regions=$3
elif [ $template_type == "gatk4" ]
then
template=~/cre/config/cre.bcbio.templates.wes.gatk4.yaml
variant_regions=$3
elif [ $template_type == "align_decoy" ]
then
template=~/cre/config/cre.bcbio.templates.align_decoy.yaml
fi
fi
while read sample
do
echo $sample","$sample","$family",,,$variant_regions" >> $family.csv
done < samples.txt
if [ -n "$2" ] && [ $template_type == "annotate" ]
then
mkdir config
mkdir work
cd input
vcf=`ls *.vcf.gz`
template=~/cre/config/cre.bcbio.templates.annotate.yaml
cat $template | sed s/"\[vrn_file\]"/$vcf/ | sed s/"\[familyid\]"/$family/ > ../config/$family.yaml
cd ..
else
bcbio_nextgen.py -w template $template $family.csv input/*
mv $family/config .
mv $family/work .
rm $family.csv
rmdir $family
cd ..
fi