-
Notifications
You must be signed in to change notification settings - Fork 0
/
cnvkit_detection.sh
131 lines (105 loc) · 2.93 KB
/
cnvkit_detection.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
# Author: Julie BOGOIN
source ~/miniconda3/etc/profile.d/conda.sh
conda activate cnvkit_env
REF="/media/Data1/jbogoin/ref/fa_hg38/hg38_GenDev/hg38_GenDev.fa"
TARGET_AUTO="/media/Data1/jbogoin/ref/gencode/v36_hg38/autosomes/gencode.v36.basic.annotation.autosomes.interval_list"
TARGET_XY="/media/Data1/jbogoin/ref/gencode/v36_hg38/XY/gencode.v36.basic.annotation.XY.interval_list"
DATA=$PWD
echo ""
echo "**********************"
echo "CNVKIT DETECTION start"
echo "**********************"
echo ""
rm -Rf cnvkit_output
mkdir cnvkit_output
cd cnvkit_output
mkdir all
mkdir female
mkdir male
cd ..
####################################################################################
echo ""
echo "Working on female..."
echo ""
FEMALE=""
while read line
do
FEMALE+="$line.dedup.bam "
done < female_list.txt
echo "Liste des femmes:"
echo $FEMALE
echo ""
#create a pooled reference by running batch command specifying only normal samples
~/cnvkit/cnvkit.py batch -n $FEMALE \
-m hybrid \
-f $REF \
--targets $TARGET_XY \
--output-reference $DATA/cnvkit_output/female/pooled-reference.cnn \
--short-names \
-d $DATA/cnvkit_output/female \
-p 12
# Run WGS batch pipeline using the pooled reference file
~/cnvkit/cnvkit.py batch $FEMALE \
-m hybrid \
-r $DATA/cnvkit_output/female/pooled-reference.cnn \
-d $DATA/cnvkit_output/female \
-p 12 \
--scatter \
--diagram
rm $DATA/cnvkit_output/female/*.target.bed;
####################################################################################
echo ""
echo "Working on male..."
echo ""
MALE=""
while read line
do
MALE+="$line.dedup.bam "
done < male_list.txt
echo "Liste des hommes:"
echo $MALE
echo ""
#create a pooled reference by running batch command specifying only normal samples
~/cnvkit/cnvkit.py batch -n $MALE \
-m hybrid \
-f $REF \
--targets $TARGET_XY \
--output-reference $DATA/cnvkit_output/male/pooled-reference.cnn \
--short-names \
-d $DATA/cnvkit_output/male \
-p 12
# Run WGS batch pipeline using the pooled reference file
~/cnvkit/cnvkit.py batch $MALE \
-m hybrid \
-r $DATA/cnvkit_output/male/pooled-reference.cnn \
-d $DATA/cnvkit_output/male \
-p 12 \
--scatter \
--diagram
rm $DATA/cnvkit_output/male/*.target.bed;
####################################################################################
echo ""
echo "Working on all..."
echo ""
SAMPLES=$(ls *.dedup.bam)
#create a pooled reference by running batch command specifying only normal samples
~/cnvkit/cnvkit.py batch -n $SAMPLES \
-m hybrid \
-f $REF \
--targets $TARGET_AUTO \
--output-reference $DATA/cnvkit_output/all/pooled-reference.cnn \
--short-names \
-d $DATA/cnvkit_output/all \
-p 12
# Run WGS batch pipeline using the pooled reference file
~/cnvkit/cnvkit.py batch $SAMPLES \
-m hybrid \
-r $DATA/cnvkit_output/all/pooled-reference.cnn \
-d $DATA/cnvkit_output/all \
-p 12 \
--scatter \
--diagram
rm $DATA/cnvkit_output/all/*.target.bed;
echo ""
echo "CNVKIT DETECTION job done!"
echo ""