-
Notifications
You must be signed in to change notification settings - Fork 6
/
01-resources.sh
executable file
·49 lines (41 loc) · 1.33 KB
/
01-resources.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
#!/bin/bash
# Root directory under which every downloaded resource is stored.
RESOURCES_PATH=/home/user/resources
# Quoted so a path containing spaces or glob characters stays a single argument.
mkdir -p "$RESOURCES_PATH"
# Remember the directory the script was started from; each section below
# changes back to it when it is done.
CWD=$(pwd)
# Download the hs37d5 reference genome (1000 Genomes phase 2 reference
# assembly) into $RESOURCES_PATH/hs37d5 and decompress it to hs37d5.fa.
# Every cd is checked: carrying on after a failed cd would drop the download
# into whatever directory the script happened to be in.
cd "${RESOURCES_PATH:?RESOURCES_PATH is not set}" || exit 1
mkdir -p hs37d5 # -p: do not error out when the directory is left over from an earlier run
cd hs37d5 || exit 1
wget ftp://ftp-trace.ncbi.nih.gov/1000genomes/ftp/technical/reference/phase2_reference_assembly_sequence/hs37d5.fa.gz || exit 1
# The status of gunzip is deliberately not checked: gzip also returns a
# non-zero status (2) for warnings that still leave a usable output file.
gunzip hs37d5.fa.gz
cd "$CWD" || exit 1
# Download the exome capture kit coordinates (Agilent SureSelect All Exon V2,
# BED format) into $RESOURCES_PATH/panel and decompress them.
cd "${RESOURCES_PATH:?RESOURCES_PATH is not set}" || exit 1
mkdir -p panel # -p: do not error out when the directory is left over from an earlier run
cd panel || exit 1
# The figshare URL ends in a bare numeric id, so the target name is given
# explicitly with -O instead of renaming the download afterwards.
# NOTE(review): --no-check-certificate disables TLS verification for this
# download; kept from the original, confirm whether it is still needed.
wget --no-check-certificate -O Agilent_SureSelect_All_Exon_V2.bed.gz \
  https://figshare.com/ndownloader/files/33961505 || exit 1
gunzip Agilent_SureSelect_All_Exon_V2.bed.gz
cd "$CWD" || exit 1
# Download and configure dbSNP, dbNSFP and gnomAD
# dbSNP build 151 (GRCh37p13): download the full VCF into
# $RESOURCES_PATH/dbSNP, decompress it and rename it to dbSNP151.vcf.
cd "${RESOURCES_PATH:?RESOURCES_PATH is not set}" || exit 1
mkdir -p dbSNP # -p: do not error out when the directory is left over from an earlier run
cd dbSNP || exit 1
wget ftp://ftp.ncbi.nih.gov/snp/organisms/human_9606_b151_GRCh37p13/VCF/00-All.vcf.gz || exit 1
# Rename only if decompression succeeded, so a failure is not masked by a
# second error from mv.
gunzip 00-All.vcf.gz && mv 00-All.vcf dbSNP151.vcf
# Step back up to the resources directory; the next section works relative to it.
cd .. || exit 1
# dbNSFP v2.9.3: download the archive, merge the per-chromosome tables into a
# single tab-delimited file, then bgzip-compress and tabix-index it.
# Works relative to the current directory (the resources directory when the
# script runs top to bottom).
mkdir -p dbNSFP # -p: do not error out when the directory is left over from an earlier run
cd dbNSFP || exit 1
wget https://dbnsfp.s3.amazonaws.com/dbNSFPv2.9.3.zip || exit 1
unzip dbNSFPv2.9.3.zip
# Single name for the merged table. The original wrote dbNSFP2.9.3.txt but then
# ran bgzip/tabix on dbNSFP2.9.txt, a file that was never created, so the
# compression and indexing steps could not succeed.
# NOTE(review): if downstream steps expect dbNSFP2.9.txt.gz, change this one
# assignment rather than the commands below.
dbnsfp_table=dbNSFP2.9.3.txt
if [[ ! -f dbNSFP2.9.3_variant.chr1 ]]; then
  echo "dbNSFP2.9.3_variant.chr1 not found after unzip" >&2
  exit 1
fi
# Header line taken once from chr1, followed by the data rows of every
# chromosome file ('#' lines, i.e. the repeated headers, are dropped).
# grep -h suppresses the file-name prefix it would otherwise add when given
# several files.
{
  head -n 1 dbNSFP2.9.3_variant.chr1
  grep -hv '^#' dbNSFP2.9.3_variant.chr*
} > "$dbnsfp_table"
# Original note on this step: 17' (presumably about 17 minutes of run time).
bgzip "$dbnsfp_table" || exit 1
# Index with sequence name in column 1 and position in column 2 (start == end).
tabix -s 1 -b 2 -e 2 "${dbnsfp_table}.gz" || exit 1
cd .. || exit 1
# gnomAD v2.1.1 exome sites: download the tabix index (.tbi) and the
# bgzip-compressed VCF it belongs to.
# Works relative to the current directory (the resources directory when the
# script runs top to bottom).
mkdir -p gnomAD # -p: do not error out when the directory is left over from an earlier run
cd gnomAD || exit 1
gnomad_url=https://storage.googleapis.com/gcp-public-data--gnomad/release/2.1.1/vcf/exomes
# Same download order as before: index first, then the data file.
for gnomad_file in gnomad.exomes.r2.1.1.sites.vcf.bgz.tbi gnomad.exomes.r2.1.1.sites.vcf.bgz; do
  wget "${gnomad_url}/${gnomad_file}" || exit 1
done
# Return to the directory the script was started from.
cd "$CWD" || exit 1