Skip to content

Commit

Permalink
Browse files Browse the repository at this point in the history
…asyconfigs into 20240110135037_new_pr_netcdf4-python165
  • Loading branch information
smoors committed Jan 11, 2024
2 parents c10569a + 7f4026b commit a1e967c
Show file tree
Hide file tree
Showing 46 changed files with 1,504 additions and 12 deletions.
8 changes: 7 additions & 1 deletion easybuild/easyconfigs/a/Arrow/Arrow-11.0.0-gfbf-2022b.eb
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,12 @@ toolchain = {'name': 'gfbf', 'version': '2022b'}

source_urls = ['https://archive.apache.org/dist/%(namelower)s/%(namelower)s-%(version)s']
sources = ['apache-arrow-%(version)s.tar.gz']
checksums = ['2dd8f0ea0848a58785628ee3a57675548d509e17213a2f5d72b0d900b43f5430']
patches = ['Arrow-8.0.0_fix-BaseExtensionType-arrow-ext-methods.patch']
checksums = [
{'apache-arrow-11.0.0.tar.gz': '2dd8f0ea0848a58785628ee3a57675548d509e17213a2f5d72b0d900b43f5430'},
{'Arrow-8.0.0_fix-BaseExtensionType-arrow-ext-methods.patch':
'2db8a4c655e2a3f0ec7dac05e13bda6c2843203568873e736d2f1b8321b0dfc7'},
]

builddependencies = [
('CMake', '3.24.3'),
Expand Down Expand Up @@ -69,6 +74,7 @@ sanity_check_commands = [
"python -c 'import pyarrow'",
"python -c 'import pyarrow.dataset'",
"python -c 'import pyarrow.parquet'",
"python -c 'from pyarrow.lib import BaseExtensionType; print(BaseExtensionType.__arrow_ext_class__)'",
]

moduleclass = 'data'
8 changes: 7 additions & 1 deletion easybuild/easyconfigs/a/Arrow/Arrow-8.0.0-foss-2021a.eb
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,12 @@ toolchain = {'name': 'foss', 'version': '2021a'}

source_urls = ['https://archive.apache.org/dist/%(namelower)s/%(namelower)s-%(version)s']
sources = ['apache-arrow-%(version)s.tar.gz']
checksums = ['ad9a05705117c989c116bae9ac70492fe015050e1b80fb0e38fde4b5d863aaa3']
patches = ['Arrow-8.0.0_fix-BaseExtensionType-arrow-ext-methods.patch']
checksums = [
{'apache-arrow-8.0.0.tar.gz': 'ad9a05705117c989c116bae9ac70492fe015050e1b80fb0e38fde4b5d863aaa3'},
{'Arrow-8.0.0_fix-BaseExtensionType-arrow-ext-methods.patch':
'2db8a4c655e2a3f0ec7dac05e13bda6c2843203568873e736d2f1b8321b0dfc7'},
]

builddependencies = [
('CMake', '3.20.1'),
Expand Down Expand Up @@ -66,6 +71,7 @@ sanity_check_commands = [
"python -c 'import pyarrow'",
"python -c 'import pyarrow.dataset'",
"python -c 'import pyarrow.parquet'",
"python -c 'from pyarrow.lib import BaseExtensionType; print(BaseExtensionType.__arrow_ext_class__)'",
]

moduleclass = 'data'
8 changes: 7 additions & 1 deletion easybuild/easyconfigs/a/Arrow/Arrow-8.0.0-foss-2022.05.eb
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,12 @@ toolchain = {'name': 'foss', 'version': '2022.05'}

source_urls = ['https://archive.apache.org/dist/%(namelower)s/%(namelower)s-%(version)s']
sources = ['apache-arrow-%(version)s.tar.gz']
checksums = ['ad9a05705117c989c116bae9ac70492fe015050e1b80fb0e38fde4b5d863aaa3']
patches = ['Arrow-8.0.0_fix-BaseExtensionType-arrow-ext-methods.patch']
checksums = [
{'apache-arrow-8.0.0.tar.gz': 'ad9a05705117c989c116bae9ac70492fe015050e1b80fb0e38fde4b5d863aaa3'},
{'Arrow-8.0.0_fix-BaseExtensionType-arrow-ext-methods.patch':
'2db8a4c655e2a3f0ec7dac05e13bda6c2843203568873e736d2f1b8321b0dfc7'},
]

builddependencies = [
('CMake', '3.23.1'),
Expand Down Expand Up @@ -66,6 +71,7 @@ sanity_check_commands = [
"python -c 'import pyarrow'",
"python -c 'import pyarrow.dataset'",
"python -c 'import pyarrow.parquet'",
"python -c 'from pyarrow.lib import BaseExtensionType; print(BaseExtensionType.__arrow_ext_class__)'",
]

moduleclass = 'data'
8 changes: 7 additions & 1 deletion easybuild/easyconfigs/a/Arrow/Arrow-8.0.0-foss-2022a.eb
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,12 @@ toolchain = {'name': 'foss', 'version': '2022a'}

source_urls = ['https://archive.apache.org/dist/%(namelower)s/%(namelower)s-%(version)s']
sources = ['apache-arrow-%(version)s.tar.gz']
checksums = ['ad9a05705117c989c116bae9ac70492fe015050e1b80fb0e38fde4b5d863aaa3']
patches = ['Arrow-8.0.0_fix-BaseExtensionType-arrow-ext-methods.patch']
checksums = [
{'apache-arrow-8.0.0.tar.gz': 'ad9a05705117c989c116bae9ac70492fe015050e1b80fb0e38fde4b5d863aaa3'},
{'Arrow-8.0.0_fix-BaseExtensionType-arrow-ext-methods.patch':
'2db8a4c655e2a3f0ec7dac05e13bda6c2843203568873e736d2f1b8321b0dfc7'},
]

builddependencies = [
('CMake', '3.23.1'),
Expand Down Expand Up @@ -66,6 +71,7 @@ sanity_check_commands = [
"python -c 'import pyarrow'",
"python -c 'import pyarrow.dataset'",
"python -c 'import pyarrow.parquet'",
"python -c 'from pyarrow.lib import BaseExtensionType; print(BaseExtensionType.__arrow_ext_class__)'",
]

moduleclass = 'data'
Original file line number Diff line number Diff line change
@@ -0,0 +1,25 @@
fix for:
AttributeError: 'pyarrow.lib.BaseExtensionType' object has no attribute '__arrow_ext_class__'
see https://github.com/apache/arrow/pull/33802
diff -u python/pyarrow/types.pxi.orig python/pyarrow/types.pxi
--- python/pyarrow/types.pxi.orig 2022-05-03 18:59:12.000000000 +0200
+++ python/pyarrow/types.pxi 2024-01-09 13:15:20.313755064 +0100
@@ -760,6 +836,18 @@
DataType.init(self, type)
self.ext_type = <const CExtensionType*> type.get()

+ def __arrow_ext_class__(self):
+ """
+ The associated array extension class
+ """
+ return ExtensionArray
+
+ def __arrow_ext_scalar_class__(self):
+ """
+ The associated scalar class
+ """
+ return ExtensionScalar
+
@property
def extension_name(self):
"""
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@ easyblock = 'ConfigureMake'
name = 'argtable'
version = '2.13'

homepage = 'http://argtable.sourceforge.net/'
homepage = 'https://argtable.sourceforge.io/'
description = """ Argtable is an ANSI C library for parsing GNU style
command line options with a minimum of fuss. """

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@ easyblock = 'ConfigureMake'
name = 'argtable'
version = '2.13'

homepage = 'http://argtable.sourceforge.net/'
homepage = 'https://argtable.sourceforge.io/'
description = """ Argtable is an ANSI C library for parsing GNU style
command line options with a minimum of fuss. """

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@ easyblock = 'ConfigureMake'
name = 'argtable'
version = '2.13'

homepage = 'http://argtable.sourceforge.net/'
homepage = 'https://argtable.sourceforge.io/'
description = """ Argtable is an ANSI C library for parsing GNU style
command line options with a minimum of fuss. """

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@ easyblock = 'ConfigureMake'
name = 'argtable'
version = '2.13'

homepage = 'http://argtable.sourceforge.net/'
homepage = 'https://argtable.sourceforge.io/'
description = """ Argtable is an ANSI C library for parsing GNU style
command line options with a minimum of fuss. """

Expand Down
3 changes: 2 additions & 1 deletion easybuild/easyconfigs/a/argtable/argtable-2.13-foss-2016b.eb
Original file line number Diff line number Diff line change
Expand Up @@ -10,14 +10,15 @@ easyblock = 'ConfigureMake'
name = 'argtable'
version = '2.13'

homepage = 'http://argtable.sourceforge.net/'
homepage = 'https://argtable.sourceforge.io/'
description = """ Argtable is an ANSI C library for parsing GNU style
command line options with a minimum of fuss. """

toolchain = {'name': 'foss', 'version': '2016b'}

source_urls = [SOURCEFORGE_SOURCE]
sources = ['%s%s.tar.gz' % (name, version.replace('.', '-'))]
checksums = ['8f77e8a7ced5301af6e22f47302fdbc3b1ff41f2b83c43c77ae5ca041771ddbf']

sanity_check_paths = {
'files': ['lib/libargtable2.so', 'lib/libargtable2.la'],
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@ easyblock = 'ConfigureMake'
name = 'argtable'
version = '2.13'

homepage = 'http://argtable.sourceforge.net/'
homepage = 'https://argtable.sourceforge.io/'
description = """ Argtable is an ANSI C library for parsing GNU style
command line options with a minimum of fuss. """

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@ easyblock = 'ConfigureMake'
name = 'argtable'
version = '2.13'

homepage = 'http://argtable.sourceforge.net/'
homepage = 'https://argtable.sourceforge.io/'
description = """ Argtable is an ANSI C library for parsing GNU style
command line options with a minimum of fuss. """

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@ easyblock = 'ConfigureMake'
name = 'argtable'
version = '2.13'

homepage = 'http://argtable.sourceforge.net/'
homepage = 'https://argtable.sourceforge.io/'
description = """ Argtable is an ANSI C library for parsing GNU style
command line options with a minimum of fuss. """

Expand Down
23 changes: 23 additions & 0 deletions easybuild/easyconfigs/a/autopep8/autopep8-2.0.4-foss-2022a.eb
Original file line number Diff line number Diff line change
@@ -0,0 +1,23 @@
# EasyBuild easyconfig for autopep8 2.0.4, built with the foss/2022a toolchain.
easyblock = 'PythonPackage'

name = 'autopep8'
version = '2.0.4'

homepage = "https://github.com/hhatto/autopep8"
description = """A tool that automatically formats Python code to conform to the PEP 8 style guide."""

toolchain = {'name': 'foss', 'version': '2022a'}

# SOURCE_TAR_GZ is not defined in this file; it is a constant supplied by EasyBuild.
# A single checksum is listed for the single source file.
sources = [SOURCE_TAR_GZ]
checksums = ['2913064abd97b3419d1cc83ea71f042cb821f87e45b9c88cad5ad3c4ea87fe0c']

# Dependencies as (name, version) pairs.
dependencies = [
('Python', '3.10.4'),
('pycodestyle', '2.11.1'),
]

# NOTE(review): presumably these select a pip-based install that fails instead of downloading
# missing dependencies, and add a `pip check` step to the sanity check - confirm in EasyBuild docs.
download_dep_fail = True
use_pip = True
sanity_pip_check = True

moduleclass = 'lib'
67 changes: 67 additions & 0 deletions easybuild/easyconfigs/b/BiG-SCAPE/BiG-SCAPE-1.1.5-foss-2022a.eb
Original file line number Diff line number Diff line change
@@ -0,0 +1,67 @@
# EasyBuild easyconfig for BiG-SCAPE 1.1.5, built with the foss/2022a toolchain.
easyblock = 'PythonPackage'

name = 'BiG-SCAPE'
version = '1.1.5'

homepage = 'https://bigscape-corason.secondarymetabolites.org/index.html'
description = """BiG-SCAPE and CORASON provide a set of tools to explore the diversity of biosynthetic gene clusters
(BGCs) across large numbers of genomes, by constructing BGC sequence similarity networks, grouping BGCs into gene
cluster families, and exploring gene cluster diversity linked to enzyme phylogenies."""

toolchain = {'name': 'foss', 'version': '2022a'}

# GITHUB_SOURCE is not defined in this file; it is a constant supplied by EasyBuild.
# NOTE(review): presumably it builds the download URL from github_account and name - confirm.
github_account = 'medema-group'
source_urls = [GITHUB_SOURCE]
sources = ['v%(version)s.tar.gz']
# Four patches; each has a matching entry, in the same order, in checksums below.
patches = [
'%(name)s-%(version)s_use_env_var_to_find-MIBiG-files.patch',
'%(name)s-%(version)s_use_env_var_for_domain_files.patch',
'%(name)s-%(version)s_use_env_var_for_html.patch',
'%(name)s-%(version)s_use_correct_name_for_FastTree.patch',
]
# One {filename: checksum} mapping for the source tarball, followed by one per patch.
checksums = [
{'v1.1.5.tar.gz': 'ec7cebbec8f83f4187c80e02ecbb37411a1898a2b83bb80088810f1600528ec7'},
{'BiG-SCAPE-1.1.5_use_env_var_to_find-MIBiG-files.patch':
'f0602208765a2686a324a27ff6073aac01c230b6a81a00656269fd89c97cf370'},
{'BiG-SCAPE-1.1.5_use_env_var_for_domain_files.patch':
'51337f22b2619ed38969f4ead5f7ce2f2df884f272793b47fb46d77e9c5e2aa2'},
{'BiG-SCAPE-1.1.5_use_env_var_for_html.patch': '540be22396ab982c2aeaaed4ce5acdb8ccb8ce2b31d36bc69d37be7a29c7c42a'},
{'BiG-SCAPE-1.1.5_use_correct_name_for_FastTree.patch':
'e1572e4134c6163a3927ac32bd2a39b7f87cf01109f7913b3c55126e2381a771'},
]

# Dependencies as (name, version) pairs.
dependencies = [
('Python', '3.10.4'),
('SciPy-bundle', '2022.05'),
('Biopython', '1.79'),
('scikit-learn', '1.1.2'),
('networkx', '2.8.4'),
('HMMER', '3.3.2'),
('FastTree', '2.1.11'),
]

# NOTE(review): presumably these select a pip-based install that fails instead of downloading
# missing dependencies, and add a `pip check` step to the sanity check - confirm in EasyBuild docs.
use_pip = True
download_dep_fail = True
sanity_pip_check = True

# NOTE(review): 'modulename': False presumably disables the import-based sanity check - confirm.
options = {'modulename': False}

# The installation is checked by running the command-line entry point.
sanity_check_commands = [
'bigscape.py --help',
]

# BIG_SCAPE_HTML_PATH is the variable the *_use_env_var_for_html.patch listed above is named for.
# NOTE(review): presumably the patched bigscape.py needs it to find its html_template files - confirm.
modextravars = {
'BIG_SCAPE_HTML_PATH': '%(installdir)s/lib/python%(pyshortver)s/site-packages/BiG-SCAPE',
}

# User-facing message assembled piecewise; NOTE(review): presumably shown when the module is loaded.
# It explains the Pfam database setup and the optional BIG_SCAPE_DATA_PATH variable, which this file does not set.
modloadmsg = "%(name)s needs processed Pfam database to work properly.\n"
modloadmsg += "For this, download the latest 'Pfam-A.hmm.gz' file from the Pfam website "
modloadmsg += "(http://ftp.ebi.ac.uk/pub/databases/Pfam/releases/), "
modloadmsg += "uncompress it and process it using the `hmmpress` command.\n"
modloadmsg += "For data files, like the domains_color_file.tsv and domain_includelist.txt, "
modloadmsg += "one can set the environment variable BIG_SCAPE_DATA_PATH, if that is not set "
modloadmsg += "it will use the directory where the bigscape command is started from.\n"
modloadmsg += "One can copy the domains_color_file.tsv from "
modloadmsg += "%(installdir)s/lib/python%(pyshortver)s/site-packages/BiG-SCAPE/domains_color_file.tsv\n"

moduleclass = 'bio'
Original file line number Diff line number Diff line change
@@ -0,0 +1,15 @@
FastTree binary is not lowercase.

Åke Sandgren, 2023-11-13
diff -ru BiG-SCAPE-1.1.5.orig/bigscape.py BiG-SCAPE-1.1.5/bigscape.py
--- BiG-SCAPE-1.1.5.orig/bigscape.py 2022-11-14 17:04:47.000000000 +0100
+++ BiG-SCAPE-1.1.5/bigscape.py 2023-11-13 07:52:23.064042200 +0100
@@ -1644,7 +1644,7 @@
# make tree
newick_file_path = os.path.join(gcf_trees_path, "GCF_c{:4.2f}_{:05d}.newick".format(cutoff,exemplar_idx))
with open(newick_file_path, "w") as newick_file:
- command = ["fasttree", "-nopr", "-quiet", alignment_file_path]
+ command = ["FastTree", "-nopr", "-quiet", alignment_file_path]
p = subprocess.Popen(command, stdout=newick_file, shell=False)
p.wait() # only with process has terminated will the file be ready

Original file line number Diff line number Diff line change
@@ -0,0 +1,37 @@
Don't use domains_color_file.tsv and domain_includelist.txt from the install tree.
Use env var or current dir.

Åke Sandgren, 2023-11-02
diff -ru BiG-SCAPE-1.1.5.orig/ArrowerSVG.py BiG-SCAPE-1.1.5/ArrowerSVG.py
--- BiG-SCAPE-1.1.5.orig/ArrowerSVG.py 2022-11-14 17:04:47.000000000 +0100
+++ BiG-SCAPE-1.1.5/ArrowerSVG.py 2023-11-02 15:48:51.313247855 +0100
@@ -27,7 +27,7 @@
gene_contour_thickness = 2 # thickness grows outwards
stripe_thickness = 3

-domains_color_file = os.path.join(os.path.dirname(os.path.realpath(__file__)), "domains_color_file.tsv")
+domains_color_file = os.path.join(os.getenv('BIG_SCAPE_DATA_PATH', os.getcwd()), "domains_color_file.tsv")


def read_color_domains_file():
diff -ru BiG-SCAPE-1.1.5.orig/bigscape.py BiG-SCAPE-1.1.5/bigscape.py
--- BiG-SCAPE-1.1.5.orig/bigscape.py 2022-11-14 17:04:47.000000000 +0100
+++ BiG-SCAPE-1.1.5/bigscape.py 2023-11-02 15:48:02.929621562 +0100
@@ -2235,7 +2235,7 @@
# Get domain_includelist
has_includelist = False
if options.domain_includelist:
- bigscape_path = os.path.dirname(os.path.realpath(__file__))
+ bigscape_path = os.getenv('BIG_SCAPE_DATA_PATH', os.getcwd())
if os.path.isfile(os.path.join(bigscape_path,"domain_includelist.txt")):
domain_includelist = set()
for line in open(os.path.join(bigscape_path,"domain_includelist.txt"), "r"):
@@ -2850,7 +2852,7 @@
if not os.path.isfile(pfams_js_file):
with open(pfams_js_file, "w") as pfams_js:
pfam_json = {}
- pfam_colors = generatePfamColorsMatrix(os.path.join(os.path.dirname(os.path.realpath(__file__)), "domains_color_file.tsv"))
+ pfam_colors = generatePfamColorsMatrix(os.path.join(os.getenv('BIG_SCAPE_DATA_PATH', os.getcwd()), "domains_color_file.tsv"))
for pfam_code in pfam_info:
pfam_obj = {}
if pfam_code in pfam_colors:
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
Use EB specific env var to locate html_template

Åke Sandgren, 20231106
diff -ru BiG-SCAPE-1.1.5.orig/bigscape.py BiG-SCAPE-1.1.5/bigscape.py
--- BiG-SCAPE-1.1.5.orig/bigscape.py 2022-11-14 17:04:47.000000000 +0100
+++ BiG-SCAPE-1.1.5/bigscape.py 2023-11-06 11:20:46.410872382 +0100
@@ -1881,7 +1881,7 @@
with open(os.path.join(module_html_path, "bs_data.js"), "w") as bs_data_js:
bs_data_js.write("var bs_data={};\n".format(json.dumps(bs_data, indent=4, separators=(',', ':'), sort_keys=True)))
bs_data_js.write("dataLoaded('bs_data');\n")
- shutil.copy(os.path.join(os.path.dirname(os.path.realpath(__file__)), "html_template", "index_html"), os.path.join(module_html_path, "index.html"))
+ shutil.copy(os.path.join(os.getenv('BIG_SCAPE_HTML_PATH'), "html_template", "index_html"), os.path.join(module_html_path, "index.html"))

## Write bgc_networks.js
with open(os.path.join(module_html_path, "bs_networks.js"), "w") as bs_networks_js:
@@ -2832,7 +2834,7 @@
create_directory(network_files_folder, "Network Files", False)

# copy html templates
- dir_util.copy_tree(os.path.join(os.path.dirname(os.path.realpath(__file__)), "html_template", "output"), output_folder)
+ dir_util.copy_tree(os.path.join(os.getenv('BIG_SCAPE_HTML_PATH'), "html_template", "output"), output_folder)

# make a new run folder in the html output & copy the overview_html
network_html_folder = os.path.join(output_folder, "html_content", "networks", run_name)
@@ -2841,7 +2843,7 @@
for cutoff in cutoff_list:
network_html_folder_cutoff = "{}_c{:.2f}".format(network_html_folder, cutoff)
create_directory(network_html_folder_cutoff, "Network HTML Files", False)
- shutil.copy(os.path.join(os.path.dirname(os.path.realpath(__file__)), "html_template", "overview_html"), os.path.join(network_html_folder_cutoff, "overview.html"))
+ shutil.copy(os.path.join(os.getenv('BIG_SCAPE_HTML_PATH'), "html_template", "overview_html"), os.path.join(network_html_folder_cutoff, "overview.html"))
rundata_networks_per_run[network_html_folder_cutoff] = []
html_subs_per_run[network_html_folder_cutoff] = []

Original file line number Diff line number Diff line change
@@ -0,0 +1,16 @@
Use MIBIG_PATH env var to locate MIBiG files instead of hardocded path
that isn't right in the first place.

Åke Sandgren, 20231027
diff -ru BiG-SCAPE-1.1.5.orig/bigscape.py BiG-SCAPE-1.1.5/bigscape.py
--- BiG-SCAPE-1.1.5.orig/bigscape.py 2022-11-14 17:04:47.000000000 +0100
+++ BiG-SCAPE-1.1.5/bigscape.py 2023-10-27 14:15:41.385679191 +0200
@@ -2336,6 +2336,8 @@

print("\n Trying to read bundled MIBiG BGCs as reference")
mibig_path = os.path.join(os.path.dirname(os.path.realpath(__file__)),"Annotated_MIBiG_reference")
+ # Use environment variable as first choice
+ mibig_path = os.getenv('MIBIG_PATH', mibig_path)
bgcs_path = os.path.join(mibig_path,mibig_zipfile_numbgcs[1])

# try to see if the zip file has already been decompressed
Loading

0 comments on commit a1e967c

Please sign in to comment.