forked from 38/d4-format
-
Notifications
You must be signed in to change notification settings - Fork 0
/
example.sh
38 lines (30 loc) · 1.01 KB
/
example.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
# Fail fast: abort on a failing command, on use of an unset variable, and on
# a failure in any stage of a pipeline, instead of running later steps on
# missing or partial data.
set -euo pipefail

# Directory holding the downloaded inputs and the generated outputs.
DATA_DIR=./sample_data

# NOTE(review): presumably read by the build to select dynamic linking
# against htslib -- confirm against the build script.
export HTSLIB=dynamic

# Put the in-tree htslib directory first on the dynamic loader search paths
# (LD_LIBRARY_PATH on Linux, DYLD_LIBRARY_PATH on macOS).  The separator and
# the previous value are appended only when a previous value exists: a bare
# trailing ':' is an empty entry, which the Linux loader interprets as the
# current working directory.
export LD_LIBRARY_PATH="${PWD}/hts/htslib${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}}"
export DYLD_LIBRARY_PATH="${PWD}/hts/htslib${DYLD_LIBRARY_PATH:+:${DYLD_LIBRARY_PATH}}"

mkdir -p "${DATA_DIR}"
#######################################
# Download one sample data file into DATA_DIR unless it is already present.
# Globals:   DATA_DIR (read) - directory that holds the sample data
# Arguments: $1 - file name; used both as the last component of the remote
#                 URL and as the name of the local copy
# Outputs:   diagnostics on stderr when the download fails
# Returns:   0 if the file already exists or was downloaded successfully,
#            otherwise the exit status of curl
#######################################
check_file() {
  local name=$1
  local dest="${DATA_DIR}/${name}"
  local partial="${dest}.part"
  local status=0

  if [ -e "${dest}" ]; then
    return 0
  fi

  # Download into a side file and rename it only on success.  Writing straight
  # to the final path would leave a truncated file (or an HTTP error page)
  # behind after a failure, and the existence check above would then skip the
  # download on every later run.
  # --fail turns HTTP error responses into a non-zero exit status;
  # --location follows redirects instead of saving the redirect body.
  curl --fail --location "http://home.chpc.utah.edu/~u0875014/${name}" \
    > "${partial}" || status=$?

  if [ "${status}" -ne 0 ]; then
    rm -f -- "${partial}"
    printf 'check_file: download of %s failed (curl exit status %s)\n' \
      "${name}" "${status}" >&2
    return "${status}"
  fi

  mv -- "${partial}" "${dest}"
}
# Fetch the sample inputs: hg002.cram and hg19.fa.gz are passed to the
# `create` step below; the .crai/.fai/.gzi files are presumably the indexes
# that get located by name next to them.
# Stop at the first file that cannot be obtained rather than starting the
# build and conversion with inputs missing.
for sample_file in \
  hg002.cram \
  hg002.cram.crai \
  hg19.fa.gz \
  hg19.fa.gz.fai \
  hg19.fa.gz.gzi; do
  if ! check_file "${sample_file}"; then
    printf 'could not obtain sample file %s\n' "${sample_file}" >&2
    exit 1
  fi
done
# Run the `create` subcommand only when hg002.d4 is absent, so an existing
# file from an earlier run is reused.  Arguments: -r hg19.fa.gz, then
# hg002.cram and hg002.d4 (presumably input alignments and output path).
[[ -e "${DATA_DIR}/hg002.d4" ]] \
  || cargo run --release -- create \
    -r "${DATA_DIR}/hg19.fa.gz" \
    "${DATA_DIR}/hg002.cram" \
    "${DATA_DIR}/hg002.d4"
# Build callset.bed once from the GIAB HG002 Tier 1 SV call set: keep records
# that contain SVTYPE=DEL, have PASS in column 7 and a deletion length above
# 200, and emit tab-separated "CHROM  POS  POS+length" lines.
if [ ! -e "${DATA_DIR}/callset.bed" ]; then
  # The subshell confines pipefail to this pipeline, so a failed download or
  # decompression is reported instead of being hidden behind the exit status
  # of the last stage.  Output goes to a side file that is renamed only on
  # success; otherwise an empty or partial callset.bed would satisfy the
  # existence check above on every later run.
  if (
    set -o pipefail
    curl ftp://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/data/AshkenazimTrio/analysis/NIST_SVs_Integration_v0.6/HG002_SVs_Tier1_v0.6.vcf.gz \
      | gzip -dc \
      | awk '
        # One awk stage does the filtering and the field extraction, so the
        # result does not depend on sed understanding "\t" in a replacement
        # (a GNU extension that other sed implementations print literally).
        /SVTYPE=DEL/ && $7 == "PASS" {
          # Use the last "SVLEN=-<digits>;" occurrence on the line.
          rest = $0
          svlen = ""
          while (match(rest, /SVLEN=-[0-9]+;/)) {
            # "SVLEN=-" is 7 characters and the match ends with ";".
            svlen = substr(rest, RSTART + 7, RLENGTH - 8)
            rest = substr(rest, RSTART + RLENGTH)
          }
          if (svlen != "" && svlen + 0 > 200) {
            print $1 "\t" $2 "\t" ($2 + svlen)
          }
        }'
  ) > "${DATA_DIR}/callset.bed.part"; then
    mv -- "${DATA_DIR}/callset.bed.part" "${DATA_DIR}/callset.bed"
  else
    rm -f -- "${DATA_DIR}/callset.bed.part"
    printf 'failed to build %s\n' "${DATA_DIR}/callset.bed" >&2
    exit 1
  fi
fi
# Run the `stat` subcommand on hg002.d4, passing callset.bed through -r
# (presumably the regions to report on -- confirm against the CLI help).
cargo run --release -- stat \
  -r "${DATA_DIR}/callset.bed" \
  "${DATA_DIR}/hg002.d4"