-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathconfig.txt
executable file
·93 lines (74 loc) · 2.53 KB
/
config.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
### configuration file for the pipeline
# ==============================
# for hpcc cluster
# ==============================
CPU=4
QUEUE=big-multi
MEMORY=4000 # unit in megabase
# ==============================
# to pre-load the needed tools
# ==============================
# load modules
module use /apps/modulefiles/test
module load jre7.7
module load zlib-1.2.7
module load python/2.7.3
module load pysam/0.9.1.4
module load numpy/1.9
module load kpal/2.1.2 # for kmer profiling
module load pybedtools/0.6.2
module load vcftools_0.1.9
module load gatk-2.2-4
module load cufflinks/2.2.1
module load bowtie1/1.0.1
module load bowtie2-2.1.0
module load tophat/2.0.10
module load bedtools/2.26.0
module load samtools/0.1.19
module load prinseq
module load fastqc/default
module load perl
#module load R/3.1.0 # default version of R
#module load R/3.0.2 # only required by PEER --> will load when running PEER
#module load peer/1.3
module load htseq/0.6.1
# ==============================
# for genome and its annotation
# ==============================
index=hg19
export GENOME=/data/neurogen/referenceGenome/Homo_sapiens/UCSC/$index
ANNOTATION=$GENOME/Annotation/Genes
ANNOTATION_GTF=$ANNOTATION/gencode.v19.annotation.gtf
ANNOTATION_EXON=$ANNOTATION/gencode.v19.annotation.gtf.exons.bed
ANNOTATION_INTRON=$ANNOTATION/gencode.v19.annotation.gtf.introns.bed
ANNOTATION_5UTR=$ANNOTATION/gencode.v19.annotation.gtf.5utr.bed
ANNOTATION_3UTR=$ANNOTATION/gencode.v19.annotation.gtf.3utr.bed
ANNOTATION_INTERGENIC=$ANNOTATION/gencode.v19.annotation.intergenic.bed
FASTAGENOME=$GENOME/Sequence/Chromosomes
CRHOME_SIZE=$ANNOTATION/ChromInfo.txt
MASK_GTF=$ANNOTATION/chrM.rRNA.tRNA.gtf
# db version mapping
GENCODE=v19
ENSEMBL=v74 # or v75, see http://www.gencodegenes.org/releases/
NCBI=GRCh37
UCSC=hg19
dbSNP=snp137
BIOMART=dec2013 # http://useast.ensembl.org/info/website/archives/assembly.html
# ==============================
# index for mapper
# ==============================
export BOWTIE_INDEXES=$GENOME/Sequence/BowtieIndex
export BOWTIE2_INDEXES=$GENOME/Sequence/Bowtie2Index
#phred score
bowtie="--phred33-quals"; bowtie2="--phred33"; tophat=""; far="fastq-sanger"; fastqmcf="33"; trimmomatic="-phred33"
#mismatch
mm=2
mindist=200 ## Fusion min distance if in same chromosome
ignorechr=chrM
#PE option
PE_option="--mate-inner-dist 50 --mate-std-dev 20" ## Shuijin found that 50/20 can get higher mappability
#strand option used by Tophat and Cufflinks
strandoption="--library-type fr-unstranded"
# maximal mapper
MAX_HIT=100