File tree Expand file tree Collapse file tree 13 files changed +41
-39
lines changed Expand file tree Collapse file tree 13 files changed +41
-39
lines changed Original file line number Diff line number Diff line change 1
1
---
2
2
dataproc :
3
- python_main_module : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ cli.py
3
+ python_main_module : gs://genetics_etl_python_playground/initialisation/cli.py
4
4
cluster_metadata :
5
- PACKAGE : gs://genetics_etl_python_playground/initialisation/gentropy/dev/gentropy-0 .0.0-py3-none-any.whl
6
- cluster_init_script : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ install_dependencies_on_cluster.sh
5
+ GENTROPY_REF : v2.0.1
6
+ cluster_init_script : gs://genetics_etl_python_playground/initialisation/install_dependencies_on_cluster.sh
7
7
cluster_name : otg-credible-set-qc
8
8
autoscaling_policy : otg-etl
9
9
Original file line number Diff line number Diff line change @@ -4,10 +4,10 @@ eqtl_catalogue_decompressed_susie_path: gs://eqtl_catalogue_data/ebi_ftp/susie_d
4
4
decompression_logs : gs://eqtl_catalogue_data/ebi_ftp/susie_decompressed_tmp/logs.log
5
5
6
6
dataproc :
7
- python_main_module : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ cli.py
7
+ python_main_module : gs://genetics_etl_python_playground/initialisation/cli.py
8
8
cluster_metadata :
9
- PACKAGE : gs://genetics_etl_python_playground/initialisation/gentropy/dev/gentropy-0 .0.0-py3-none-any.whl
10
- cluster_init_script : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ install_dependencies_on_cluster.sh
9
+ GENTROPY_REF : v2.0.1
10
+ cluster_init_script : gs://genetics_etl_python_playground/initialisation/install_dependencies_on_cluster.sh
11
11
cluster_name : otg-preprocess-eqtl
12
12
autoscaling_policy : eqtl-preprocess
13
13
num_workers : 4
Original file line number Diff line number Diff line change 1
1
---
2
2
dataproc :
3
- python_main_module : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ cli.py
3
+ python_main_module : gs://genetics_etl_python_playground/initialisation/cli.py
4
4
cluster_metadata :
5
- PACKAGE : gs://genetics_etl_python_playground/initialisation/gentropy/dev/gentropy-0 .0.0-py3-none-any.whl
6
- cluster_init_script : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ install_dependencies_on_cluster.sh
5
+ GENTROPY_REF : v2.0.1
6
+ cluster_init_script : gs://genetics_etl_python_playground/initialisation/install_dependencies_on_cluster.sh
7
7
cluster_name : otg-ingestion-finngen
8
8
autoscaling_policy : finngen-preprocess
9
9
master_disk_size : 2000
Original file line number Diff line number Diff line change 1
1
---
2
2
dataproc :
3
- python_main_module : gs://genetics_etl_python_playground/initialisation/gentropy/szsz-update-package-for-dataproc-run /cli.py
3
+ python_main_module : gs://genetics_etl_python_playground/initialisation/cli.py
4
4
cluster_metadata :
5
- PACKAGE : gs://genetics_etl_python_playground/initialisation/gentropy/szsz-update-package-for-dataproc-run/gentropy-0 .0.0-py3-none-any.whl
6
- cluster_init_script : gs://genetics_etl_python_playground/initialisation/0.0.0/ install_dependencies_on_cluster.sh
5
+ GENTROPY_REF : v2.0.1
6
+ cluster_init_script : gs://genetics_etl_python_playground/initialisation/install_dependencies_on_cluster.sh
7
7
cluster_name : otg-finngen-ukb-meta
8
8
9
9
nodes :
Original file line number Diff line number Diff line change 1
1
---
2
2
dataproc :
3
- python_main_module : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ cli.py
3
+ python_main_module : gs://genetics_etl_python_playground/initialisation/cli.py
4
4
cluster_metadata :
5
- PACKAGE : gs://genetics_etl_python_playground/initialisation/gentropy/dev/gentropy-0.0.0-py3-none-any.whl
6
- cluster_init_script : gs://genetics_etl_python_playground/initialisation/gentropy/dev/install_dependencies_on_cluster.sh
5
+ GENTROPY_REF : v2.0.1
6
+ cluster_init_script : gs://genetics_etl_python_playground/initialisation/install_dependencies_on_cluster.sh
7
+
7
8
cluster_name : foldx-ingestion
8
9
autoscaling_policy : otg-etl
9
10
allow_efm : false
Original file line number Diff line number Diff line change 2
2
l2g_gold_standard_path : gs://genetics_etl_python_playground/input/l2g/gold_standard/curation.json
3
3
release_dir : gs://ot_orchestration/releases/24.11_freeze10
4
4
dataproc :
5
- python_main_module : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ cli.py
5
+ python_main_module : gs://genetics_etl_python_playground/initialisation/cli.py
6
6
cluster_metadata :
7
- PACKAGE : gs://genetics_etl_python_playground/initialisation/gentropy/dev/gentropy-0 .0.0-py3-none-any.whl
8
- cluster_init_script : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ install_dependencies_on_cluster.sh
9
- cluster_name : otg-etl
7
+ GENTROPY_REF : v2.0.1
8
+ cluster_init_script : gs://genetics_etl_python_playground/initialisation/install_dependencies_on_cluster.sh
9
+ cluster_name : test-dataproc
10
10
autoscaling_policy : otg-etl
11
11
allow_efm : false
12
12
num_workers : 2
Original file line number Diff line number Diff line change 1
1
---
2
- python_main_module : gs://genetics_etl_python_playground/initialisation/gentropy/{gentropy_version}/ cli.py
2
+ python_main_module : gs://genetics_etl_python_playground/initialisation/cli.py
3
3
4
4
dataproc_cluster_settings :
5
5
cluster_metadata :
6
- PACKAGE : gs://genetics_etl_python_playground/initialisation/gentropy/ {gentropy_version}/gentropy-0.0.0-py3-none-any.whl
7
- cluster_init_script : gs://genetics_etl_python_playground/initialisation/gentropy/{gentropy_version}/ install_dependencies_on_cluster.sh
6
+ GENTROPY_REF : {gentropy_version: ''}
7
+ cluster_init_script : gs://genetics_etl_python_playground/initialisation/install_dependencies_on_cluster.sh
8
8
autoscaling_policy : otg-etl
9
9
allow_efm : false
10
10
num_workers : 2
Original file line number Diff line number Diff line change 1
1
---
2
2
dataproc :
3
- python_main_module : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ cli.py
3
+ python_main_module : gs://genetics_etl_python_playground/initialisation/cli.py
4
4
cluster_metadata :
5
- PACKAGE : gs://genetics_etl_python_playground/initialisation/gentropy/dev/gentropy-0 .0.0-py3-none-any.whl
6
- cluster_init_script : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ install_dependencies_on_cluster.sh
5
+ GENTROPY_REF : v2.0.1
6
+ cluster_init_script : gs://genetics_etl_python_playground/initialisation/install_dependencies_on_cluster.sh
7
7
cluster_name : gnomad-preprocess
8
8
autoscaling_policy : otg-etl
9
9
allow_efm : false
Original file line number Diff line number Diff line change 2
2
dataproc :
3
3
cluster_name : otg-gwascatalog-sumstats-pics
4
4
autoscaling_policy : otg-preprocess-gwascatalog
5
- python_main_module : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ cli.py
5
+ python_main_module : gs://genetics_etl_python_playground/initialisation/cli.py
6
6
cluster_metadata :
7
- PACKAGE : gs://genetics_etl_python_playground/initialisation/gentropy/dev/gentropy-0 .0.0-py3-none-any.whl
8
- cluster_init_script : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ install_dependencies_on_cluster.sh
7
+ GENTROPY_REF : v2.0.1
8
+ cluster_init_script : gs://genetics_etl_python_playground/initialisation/install_dependencies_on_cluster.sh
9
9
num_workers : 5
10
10
11
11
nodes :
Original file line number Diff line number Diff line change 1
1
---
2
2
dataproc :
3
- python_main_module : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ cli.py
3
+ python_main_module : gs://genetics_etl_python_playground/initialisation/cli.py
4
4
cluster_metadata :
5
- PACKAGE : gs://genetics_etl_python_playground/initialisation/gentropy/dev/gentropy-0 .0.0-py3-none-any.whl
6
- cluster_init_script : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ install_dependencies_on_cluster.sh
5
+ GENTROPY_REF : v2.0.1
6
+ cluster_init_script : gs://genetics_etl_python_playground/initialisation/install_dependencies_on_cluster.sh
7
7
cluster_name : otg-gwas-catalog-sumstat-susie-clumping
8
8
autoscaling_policy : otg-etl
9
9
Original file line number Diff line number Diff line change 2
2
dataproc :
3
3
cluster_name : otg-tophit-gwascatalog
4
4
autoscaling_policy : otg-gwascatalog-tophit
5
- python_main_module : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ cli.py
5
+ python_main_module : gs://genetics_etl_python_playground/initialisation/cli.py
6
6
cluster_metadata :
7
- PACKAGE : gs://genetics_etl_python_playground/initialisation/gentropy/dev/gentropy-0 .0.0-py3-none-any.whl
8
- cluster_init_script : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ install_dependencies_on_cluster.sh
7
+ GENTROPY_REF : v2.0.1
8
+ cluster_init_script : gs://genetics_etl_python_playground/initialisation/install_dependencies_on_cluster.sh
9
9
num_workers : 2
10
10
11
11
nodes :
Original file line number Diff line number Diff line change 1
1
---
2
2
dataproc :
3
- python_main_module : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ cli.py
3
+ python_main_module : gs://genetics_etl_python_playground/initialisation/cli.py
4
4
cluster_metadata :
5
- PACKAGE : gs://genetics_etl_python_playground/initialisation/gentropy/dev/gentropy-0 .0.0-py3-none-any.whl
6
- cluster_init_script : gs://genetics_etl_python_playground/initialisation/gentropy/dev/ install_dependencies_on_cluster.sh
5
+ GENTROPY_REF : v2.0.1
6
+ cluster_init_script : gs://genetics_etl_python_playground/initialisation/install_dependencies_on_cluster.sh
7
7
cluster_name : otg-ukb-ppp-eur
8
8
autoscaling_policy : otg-etl
9
9
Original file line number Diff line number Diff line change @@ -105,6 +105,7 @@ def create_cluster(
105
105
num_preemptible_workers = num_preemptible_workers ,
106
106
num_workers = num_workers ,
107
107
image_version = GCP_DATAPROC_IMAGE ,
108
+ internal_ip_only = False ,
108
109
enable_component_gateway = True ,
109
110
metadata = cluster_metadata ,
110
111
idle_delete_ttl = idle_delete_ttl ,
@@ -229,8 +230,8 @@ def submit_pyspark_job(
229
230
"main_python_file_uri" : python_main_module ,
230
231
"args" : args ,
231
232
"properties" : {
232
- "spark.jars" : "/opt/conda/miniconda3/lib/python3.10/site-packages/hail/backend/hail-all-spark.jar" ,
233
- "spark.driver.extraClassPath" : "/opt/conda/miniconda3/lib/python3.10/site-packages/hail/backend/hail-all-spark.jar" ,
233
+ "spark.jars" : "/opt/conda/miniconda3/lib/python3.11/site-packages/hail/backend/hail-all-spark.jar" ,
234
+ "spark.driver.extraClassPath" : "/opt/conda/miniconda3/lib/python3.11/site-packages/hail/backend/hail-all-spark.jar" ,
234
235
"spark.executor.extraClassPath" : "./hail-all-spark.jar" ,
235
236
"spark.serializer" : "org.apache.spark.serializer.KryoSerializer" ,
236
237
"spark.kryo.registrator" : "is.hail.kryo.HailKryoRegistrator" ,
You can’t perform that action at this time.
0 commit comments