-
Notifications
You must be signed in to change notification settings - Fork 1
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Updated interpro
- Loading branch information
Data Mover
committed
Sep 9, 2024
1 parent
da184c9
commit 34d46c8
Showing
19 changed files
with
316 additions
and
7 deletions.
There are no files selected for viewing
Empty file.
Empty file.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,58 @@ | ||
#!/bin/bash | ||
# ----------------SLURM Parameters---------------- | ||
#SBATCH -p admin | ||
#SBATCH -n 4 | ||
#SBATCH --mem=20g | ||
#SBATCH -N 1 | ||
#SBATCH --mail-user=datamover@igb.illinois.edu | ||
#SBATCH --mail-type=ALL | ||
#SBATCH -J BUSCO-db_extract | ||
#SBATCH -D /home/a-m/datamover/jobs | ||
#SBATCH -o %x-%j.out | ||
# ----------------Load Modules-------------------- | ||
module load pigz/2.4-IGB-gcc-8.2.0 | ||
# ----------------Commands------------------------ | ||
# | ||
# Replace DATABASE with name of database you are downloading | ||
# Replace WEBSITE with remote location of database# | ||
# | ||
|
||
DATABASE="BUSCO-db" | ||
|
||
if [ -z "$1" ]; | ||
then | ||
echo "Please specify ${DATABASE} version number"; | ||
exit 1; | ||
fi | ||
|
||
VERSION=$1 | ||
MIRROR_DIR=/private_stores/mirror/${DATABASE}/${VERSION} | ||
|
||
|
||
echo "`date "+%Y-%m-%d %k:%M:%S"` Extracting tar.gz Files" | ||
for f in $(find ${MIRROR_DIR} -name '*.gz'); | ||
do | ||
gzip -d $f | ||
if [ $? -ne 0 ]; then | ||
echo "`date "+%Y-%m-%d %k:%M:%S"` Error extracting file: $f" | ||
exit $? | ||
else | ||
echo "`date "+%Y-%m-%d %k:%M:%S"` Done extracting file: $f" | ||
fi | ||
done | ||
|
||
echo "`date "+%Y-%m-%d %k:%M:%S"` Extracting .gz Files with Pigz" | ||
pigz -p ${SLURM_NTASKS} -dr ${MIRROR_DIR} | ||
if [ $? -ne 0 ] | ||
then | ||
echo "`date "+%Y-%m-%d %k:%M:%S"` Extracting files Failed" | ||
exit $? | ||
else | ||
echo "`date "+%Y-%m-%d %k:%M:%S"` Extracting Files Complete" | ||
fi | ||
|
||
echo "`date "+%Y-%m-%d %k:%M:%S"` Fix Permissions Start" | ||
find ${MIRROR_DIR} -type d -exec chmod 775 {} \; | ||
find ${MIRROR_DIR} -type f -exec chmod 664 {} \; | ||
echo "`date "+%Y-%m-%d %k:%M:%S"` Fix Permissions Completed" | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,27 @@ | ||
easyblock = 'Bundle' | ||
|
||
name = 'checkv-db' | ||
version = '1.5' | ||
|
||
homepage = 'https://portal.nersc.gov/CheckV/' | ||
description = """The main change in v1.5 was to remove putatively non-viral sequences to minimize high-confidence matches to the CheckV database for non-viral sequences.""" | ||
|
||
toolchain = SYSTEM | ||
|
||
|
||
dependencies = [] | ||
|
||
sanity_check_paths = { | ||
'files': [], | ||
'dirs': ['checkv-db-v1.5'], | ||
} | ||
|
||
modextrapaths = { | ||
'BIODB':'' | ||
} | ||
|
||
keeppreviousinstall = True | ||
moduleclass = 'data' | ||
|
||
modloadmsg = "%(name)s/%(version)s database is located at %(installdir)s\n" | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,42 @@ | ||
#!/bin/bash | ||
# ----------------SLURM Parameters---------------- | ||
#SBATCH -p admin | ||
#SBATCH -n 1 | ||
#SBATCH --mem=20g | ||
#SBATCH -N 1 | ||
#SBATCH --mail-user=datamover@igb.illinois.edu | ||
#SBATCH --mail-type=ALL | ||
#SBATCH -J checkv-db_download | ||
#SBATCH -D /home/a-m/datamover/jobs | ||
#SBATCH -o %x-%j.out | ||
# ----------------Load Modules-------------------- | ||
# ----------------Commands------------------------ | ||
# | ||
# Replace DATABASE with name of database you are downloading | ||
# Replace WEBSITE with remote location of database | ||
# | ||
|
||
DATABASE="checkv-db" | ||
|
||
if [ -z "$1" ]; | ||
then | ||
echo "Please specify ${DATABASE} version number"; | ||
exit 1; | ||
fi | ||
|
||
VERSION=$1 | ||
MIRROR_DIR=/private_stores/mirror/${DATABASE}/${VERSION} | ||
|
||
echo "`date "+%Y-%m-%d %k:%M:%S"` Downloading Files" | ||
mkdir -p ${MIRROR_DIR} | ||
wget https://portal.nersc.gov/CheckV/checkv-db-v${VERSION}.tar.gz -P ${MIRROR_DIR}/ | ||
if [ $? -ne 0 ] | ||
then | ||
echo "`date "+%Y-%m-%d %k:%M:%S"` Downloading Files Failed" | ||
exit $? | ||
else | ||
echo "`date "+%Y-%m-%d %k:%M:%S"` Downloading Files Complete" | ||
fi | ||
|
||
|
||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,50 @@ | ||
#!/bin/bash | ||
# ----------------SLURM Parameters---------------- | ||
#SBATCH -p admin | ||
#SBATCH -n 4 | ||
#SBATCH --mem=20g | ||
#SBATCH -N 1 | ||
#SBATCH --mail-user=datamover@igb.illinois.edu | ||
#SBATCH --mail-type=ALL | ||
#SBATCH -J checkv-db_extract | ||
#SBATCH -D /home/a-m/datamover/jobs | ||
#SBATCH -o %x-%j.out | ||
# ----------------Load Modules-------------------- | ||
module load pigz/2.4-IGB-gcc-8.2.0 | ||
# ----------------Commands------------------------ | ||
# | ||
# Replace DATABASE with name of database you are downloading | ||
# Replace WEBSITE with remote location of database# | ||
# | ||
|
||
DATABASE="checkv-db" | ||
|
||
if [ -z "$1" ]; | ||
then | ||
echo "Please specify ${DATABASE} version number"; | ||
exit 1; | ||
fi | ||
|
||
VERSION=$1 | ||
MIRROR_DIR=/private_stores/mirror/${DATABASE}/${VERSION} | ||
|
||
|
||
echo "`date "+%Y-%m-%d %k:%M:%S"` Extracting tar.gz Files" | ||
for f in $(find ${MIRROR_DIR} -name '*.tar.gz'); | ||
do | ||
tar -xvzf $f -C `dirname $f` | ||
if [ $? -ne 0 ]; then | ||
echo "`date "+%Y-%m-%d %k:%M:%S"` Error extracting file: $f" | ||
exit $? | ||
else | ||
echo "`date "+%Y-%m-%d %k:%M:%S"` Done extracting file: $f" | ||
fi | ||
done | ||
|
||
#Run diamond to create index | ||
diamond makedb -p $SLURM_NTASKS --in ${MIRROR_DIR}/checkv-db-v${VERSION}/genome_db/checkv_reps.faa --db ${MIRROR_DIR}/checkv-db-v${VERSION}/genome_db/checkv_reps.dmnd | ||
echo "`date "+%Y-%m-%d %k:%M:%S"` Fix Permissions Start" | ||
find ${MIRROR_DIR} -type d -exec chmod 775 {} \; | ||
find ${MIRROR_DIR} -type f -exec chmod 664 {} \; | ||
echo "`date "+%Y-%m-%d %k:%M:%S"` Fix Permissions Completed" | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,29 @@ | ||
easyblock = 'Bundle' | ||
|
||
name = 'dorado-db' | ||
version = '20240501' | ||
|
||
homepage = 'https://github.com/nanoporetech/dorado' | ||
description = """Databases for dorado""" | ||
|
||
toolchain = SYSTEM | ||
|
||
source_urls = [''] | ||
sources = [] | ||
|
||
dependencies = [] | ||
|
||
sanity_check_paths = { | ||
'files': [], | ||
'dirs': ['dna_r9.4.1_e8_fast@v3.4'], | ||
} | ||
|
||
modextrapaths = { | ||
'BIODB':'' | ||
} | ||
|
||
keeppreviousinstall = True | ||
moduleclass = 'data' | ||
|
||
modloadmsg = "%(name)s/%(version)s database is located at %(installdir)s\n" | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,35 @@ | ||
#!/bin/bash | ||
# ----------------SLURM Parameters---------------- | ||
#SBATCH -p admin | ||
#SBATCH -n 1 | ||
#SBATCH --mem=20g | ||
#SBATCH -N 1 | ||
#SBATCH --mail-user=datamover@igb.illinois.edu | ||
#SBATCH --mail-type=ALL | ||
#SBATCH -J dorado-db_download | ||
#SBATCH -D /home/a-m/datamover/jobs | ||
#SBATCH -o %x-%j.out | ||
# ----------------Load Modules-------------------- | ||
module load dorado | ||
# ----------------Commands------------------------ | ||
# | ||
# Replace DATABASE with name of database you are downloading | ||
# Replace WEBSITE with remote location of database | ||
# | ||
|
||
DATABASE="dorado-db" | ||
|
||
if [ -z "$1" ]; | ||
then | ||
echo "Please specify ${DATABASE} version number"; | ||
exit 1; | ||
fi | ||
|
||
VERSION=$1 | ||
MIRROR_DIR=/private_stores/mirror/${DATABASE}/${VERSION} | ||
|
||
echo "`date "+%Y-%m-%d %k:%M:%S"` Downloading Files" | ||
mkdir -p ${MIRROR_DIR} | ||
cd ${MIRROR_DIR} | ||
dorado download | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,30 @@ | ||
easyblock = 'Bundle' | ||
|
||
name = 'funannotate-db' | ||
version = '20240515' | ||
|
||
homepage = 'https://github.com/nextgenusfs/funannotate' | ||
description = """funannotate is a pipeline for genome annotation (built specifically for fungi, but will also work with higher eukaryotes). Installation, usage, and more information can be found at http://funannotate.readthedocs.io""" | ||
|
||
toolchain = SYSTEM | ||
|
||
source_urls = [''] | ||
sources = [] | ||
|
||
dependencies = [] | ||
|
||
sanity_check_paths = { | ||
'files': ['uniprot.dmnd'], | ||
'dirs': [], | ||
} | ||
|
||
modextrapaths = { | ||
'BIODB':'', | ||
'FUNANNOTATE_DB': '' | ||
} | ||
|
||
keeppreviousinstall = True | ||
moduleclass = 'data' | ||
|
||
modloadmsg = "%(name)s/%(version)s database is located at %(installdir)s\n" | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Empty file.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Binary file not shown.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,38 @@ | ||
easyblock = 'Bundle' | ||
|
||
name = 'uniprot' | ||
version = '2024_04' | ||
|
||
|
||
homepage = 'https://www.uniprot.org/' | ||
description = """The mission of UniProt is to provide the scientific community with a comprehensive, high-quality and freely accessible resource of protein sequence and functional information. """ | ||
|
||
toolchain = SYSTEM | ||
|
||
dependencies = [] | ||
|
||
|
||
sanity_check_paths = { | ||
'files': ['db/knowledgebase/complete/uniprot_sprot.fasta', | ||
'db/knowledgebase/complete/uniprot_trembl.fasta', | ||
'db/knowledgebase/idmapping/idmapping.dat', | ||
'db/uniref/uniref100/uniref100.fasta', | ||
'db/uniref/uniref90/uniref90.fasta', | ||
'db/uniref/uniref50/uniref50.fasta' | ||
], | ||
'dirs': ['db','blastdb_v4','blastdb_v5','diamond'] | ||
} | ||
|
||
modextrapaths = {'BIODB':'db', | ||
'BLASTDB': ['blastdb_v4','blastdb_v5'], | ||
'DIAMONDDB': 'diamond', | ||
} | ||
|
||
keeppreviousinstall = True | ||
|
||
moduleclass = 'data' | ||
|
||
modloadmsg = "%(name)s/%(version)s database and indexes are located at %(installdir)s/\n" | ||
|
||
##Helpful documentation | ||
#https://embl.service-now.com/kb?id=kb_article_view&sysparm_article=KB0011060 |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters