|
11 | 11 | AUTOSCALING = "finngen-preprocess"
|
12 | 12 |
|
13 | 13 | RELEASEBUCKET = "gs://genetics_etl_python_playground/output/python_etl/parquet/XX.XX"
|
| 14 | +SUMSTATS = f"{RELEASEBUCKET}/summary_statistics/finngen" |
| 15 | +WINDOWBASED_CLUMPED = ( |
| 16 | + f"{RELEASEBUCKET}/study_locus/from_sumstats_study_locus_window_clumped/finngen" |
| 17 | +) |
| 18 | +LD_CLUMPED = f"{RELEASEBUCKET}/study_locus/from_sumstats_study_locus_ld_clumped/finngen" |
| 19 | +PICSED = f"{RELEASEBUCKET}/credible_set/from_sumstats_study_locus/finngen" |
14 | 20 |
|
15 | 21 | with DAG(
|
16 | 22 | dag_id=Path(__file__).stem,
|
|
24 | 30 | task_id="finngen_sumstats_and_study_index",
|
25 | 31 | )
|
26 | 32 |
|
27 |
| - clumping = common.submit_step( |
| 33 | + window_based_clumping = common.submit_step( |
28 | 34 | cluster_name=CLUSTER_NAME,
|
29 | 35 | step_id="clump",
|
30 |
| - task_id="finngen_clump", |
| 36 | + task_id="finngen_window_based_clumping", |
31 | 37 | other_args=[
|
32 |
| - f"step.summary_stats_path={RELEASEBUCKET}/summary_statistics/finngen", |
33 |
| - f"step.clumped_study_locus_out={RELEASEBUCKET}/study_locus/from_sumstats_study_locus/finngen", |
| 38 | + f"step.input_path={SUMSTATS}", |
| 39 | + f"step.clumped_study_locus_path={WINDOWBASED_CLUMPED}", |
| 40 | + ], |
| 41 | + ) |
| 42 | + ld_clumping = common.submit_step( |
| 43 | + cluster_name=CLUSTER_NAME, |
| 44 | + step_id="clump", |
| 45 | + task_id="finngen_ld_clumping", |
| 46 | + other_args=[ |
| 47 | + f"step.input_path={WINDOWBASED_CLUMPED}", |
| 48 | + f"step.clumped_study_locus_path={LD_CLUMPED}", |
34 | 49 | ],
|
35 |
| - # This allows to attempt running the task when above step fails do to failifexists |
36 | 50 | trigger_rule=TriggerRule.ALL_DONE,
|
37 | 51 | )
|
38 | 52 |
|
|
41 | 55 | step_id="pics",
|
42 | 56 | task_id="finngen_pics",
|
43 | 57 | other_args=[
|
44 |
| - f"step.study_locus_ld_annotated_in={RELEASEBUCKET}/study_locus/from_sumstats_study_locus/finngen", |
45 |
| - f"step.picsed_study_locus_out={RELEASEBUCKET}/credible_set/from_sumstats_study_locus/finngen", |
| 58 | + f"step.study_locus_ld_annotated_in={LD_CLUMPED}", |
| 59 | + f"step.picsed_study_locus_out={PICSED}", |
46 | 60 | ],
|
47 | 61 | # This allows the task to be attempted even when the step above fails due to failifexists
|
48 | 62 | trigger_rule=TriggerRule.ALL_DONE,
|
|
52 | 66 | common.create_cluster(CLUSTER_NAME, autoscaling_policy=AUTOSCALING)
|
53 | 67 | >> common.install_dependencies(CLUSTER_NAME)
|
54 | 68 | >> study_and_sumstats
|
55 |
| - >> clumping |
| 69 | + >> window_based_clumping |
| 70 | + >> ld_clumping |
56 | 71 | >> pics
|
57 | 72 | >> common.delete_cluster(CLUSTER_NAME)
|
58 | 73 | )
|
0 commit comments