-
Notifications
You must be signed in to change notification settings - Fork 2
/
Makefile
55 lines (51 loc) · 1.88 KB
/
Makefile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
# Base name (without extension) of the IBM Aspera Connect installer archive;
# the `colab` target appends `.tar.gz` and `.sh` to it.
ASPERA_CONNECT := ibm-aspera-connect-3.11.1.58-linux-g2.12-64

# Root directory that downloaded data is written to. The double quotes are
# part of the value: the path contains a space and an `&`, and the recipes
# expand this variable without adding quotes of their own.
GENBANK_DATA_DIR := "/content/drive/Shareddrives/mGEM R&D"

# Unprivileged account created by `colab`; the Aspera client is looked up
# under this user's home directory by `aspera`.
NONROOT := igem
# aspera: download one directory of the NCBI GenBank genomes tree with the
# Aspera `ascp` client into $(GENBANK_DATA_DIR)/genomes/genbank.
#
#   domain  sub-directory of /genomes/genbank on ftp.ncbi.nlm.nih.gov to fetch.
#           Defaults to the placeholder `none`; pass the real value on the
#           command line, e.g. `make domain=bacteria aspera`.
#
# The ascp binary and its key file are read from
# /home/$(NONROOT)/.aspera/connect.
#
# Declared phony: the target names a command, not a file, so it must run even
# if something called `aspera` exists in the working directory.
.PHONY: aspera
aspera: domain = none
aspera:
	/home/$(NONROOT)/.aspera/connect/bin/ascp -k1 -drT -l128m --overwrite=never \
		-i /home/$(NONROOT)/.aspera/connect/etc/asperaweb_id_dsa.openssh \
		anonftp@ftp.ncbi.nlm.nih.gov:/genomes/genbank/$(domain) $(GENBANK_DATA_DIR)/genomes/genbank
# colab: one-shot provisioning of the machine. Installs system packages,
# code-server, the Python requirements, ncbi-genome-download, IBM Aspera
# Connect (as the $(NONROOT) user), genome_updater.sh and sentencepiece.
# NOTE(review): apt, useradd, `make install` and ldconfig presumably require
# this target to be run as root -- confirm.
#
# Declared phony: the target names a command, not a file to build.
.PHONY: colab
colab:
	apt install bc cmake htop iftop parallel vim --yes
	curl -fsSL https://code-server.dev/install.sh | sh
	pip3 install -r requirements.txt
# ncbi-genome-download is installed from a throw-away clone placed next to
# the current directory and removed afterwards.
	git clone https://github.com/kblin/ncbi-genome-download.git ../ncbi-genome-download
	cd ../ncbi-genome-download && pip3 install .
	rm -rf ../ncbi-genome-download
# Aspera Connect: fetch and unpack the archive, then run the installer script
# it contains as $(NONROOT).
	wget https://ak-delivery04-mul.dhe.ibm.com/sar/CMA/OSA/09ff1/0/$(ASPERA_CONNECT).tar.gz
	tar -xzvf $(ASPERA_CONNECT).tar.gz
	rm $(ASPERA_CONNECT).tar.gz
# Only create the account when it does not exist yet, so that re-running the
# target does not abort on "user already exists".
	id -u $(NONROOT) >/dev/null 2>&1 || useradd -m -s /bin/bash $(NONROOT)
	su $(NONROOT) -c "./$(ASPERA_CONNECT).sh"
	rm -f $(ASPERA_CONNECT).sh
# -O overwrites an existing copy; a plain wget would save the new download as
# genome_updater.sh.1 and leave the stale script in place.
	wget -O genome_updater.sh https://raw.githubusercontent.com/pirovc/genome_updater/master/genome_updater.sh
	chmod +x genome_updater.sh
# sentencepiece is built from source, installed, and the checkout removed.
	git clone https://github.com/google/sentencepiece.git
	cd sentencepiece && mkdir build && cd build && cmake .. && $(MAKE) && $(MAKE) install && ldconfig -v
	rm -rf sentencepiece
# genome_updater: run ./genome_updater.sh for one organism group, then copy
# the resulting output directory into $(GENBANK_DATA_DIR).
#
# Example:
#   make group=bacteria threads=16 top=taxids:1 genome_updater
#
# Tunables (override on the command line):
#   flags    extra arguments appended verbatim to the command (default: empty)
#   group    value passed to -g; also the output directory given to -o and
#            the directory copied afterwards (default: none)
#   threads  value passed to -t (default: 1)
#   top      value passed to -j (default: empty string)
#
# Each default needs its own line: GNU Make allows exactly one assignment per
# target-specific variable line, so a comma-separated list would assign the
# whole remainder of the line to the first variable and leave the others
# without a default.
#
# Declared phony: the target names a command, not a file to build.
.PHONY: genome_updater
genome_updater: flags =
genome_updater: group = none
genome_updater: threads = 1
genome_updater: top = ""
genome_updater:
	./genome_updater.sh -m -p \
		-c all \
		-d refseq,genbank \
		-f genomic.gbff.gz,protein.gpff.gz \
		-g $(group) \
		-j $(top) \
		-l "Complete Genome" \
		-o $(group) \
		-t $(threads) \
		$(flags)
	cp -ruv $(group) $(GENBANK_DATA_DIR)
# ncbi-genome-download: fetch complete assemblies in GenBank format with the
# `ncbi-genome-download` tool into $(GENBANK_DATA_DIR)/genomes/genbank.
#
#   domain  positional argument handed to the tool. Defaults to the
#           placeholder `none`; pass the real value on the command line,
#           e.g. `make domain=bacteria ncbi-genome-download`.
#
# The recipe runs 16 parallel downloads with up to 9999 retries, and enables
# debug output and a progress bar.
#
# Declared phony: the target names a command, not a file, so it must run even
# if something called `ncbi-genome-download` exists in the working directory.
.PHONY: ncbi-genome-download
ncbi-genome-download: domain = none
ncbi-genome-download:
	ncbi-genome-download \
		--assembly-levels complete \
		--debug \
		--formats genbank \
		--output-folder $(GENBANK_DATA_DIR)/genomes/genbank \
		--parallel 16 \
		--progress-bar \
		--retries 9999 \
		$(domain)