From b24d16a3cf1d0e71f702b7b183908d33220f91e7 Mon Sep 17 00:00:00 2001 From: pdimens Date: Wed, 3 Jul 2024 09:44:22 -0400 Subject: [PATCH 1/6] make stitch its own env --- src/harpy/conda_deps.py | 5 +++-- src/harpy/snakefiles/impute.smk | 2 +- src/harpy/validations.py | 2 +- 3 files changed, 5 insertions(+), 4 deletions(-) diff --git a/src/harpy/conda_deps.py b/src/harpy/conda_deps.py index 6132b5696..6efa0b06d 100644 --- a/src/harpy/conda_deps.py +++ b/src/harpy/conda_deps.py @@ -6,13 +6,14 @@ def generate_conda_deps(): """Create the YAML files of the workflow conda dependencies""" condachannels = ["bioconda","conda-forge","defaults"] environ = { - "qc" : ["bioconda::falco", "bioconda::fastp", "bioconda::multiqc=1.22", "bioconda::pysam=0.22"], + "qc" : ["bioconda::quickdeconvolution", "bioconda::falco", "bioconda::fastp", "bioconda::multiqc=1.22", "bioconda::pysam=0.22"], "align": ["bioconda::bwa", "bioconda::ema","bioconda::strobealign", "conda-forge::icu","conda-forge::libzlib", "bioconda::samtools=1.20", "bioconda::seqtk", "bioconda::tabix", "conda-forge::xz"], "snp": ["bioconda::bcftools=1.20", "bioconda::freebayes=1.3.6"], "sv": ["bioconda::leviathan", "bioconda::naibr-plus"], "phase" : ["bioconda::hapcut2", "bioconda::whatshap"], "simulations" : ["conda-forge::perl", "bioconda::perl-math-random", "bioconda::perl-inline-c", "bioconda::perl-parse-recdescent", "conda-forge::numpy", "bioconda::dwgsim", "alienzj::msort"], - "r" : ["conda-forge::r-xml2", "conda-forge::r-highcharter", "conda-forge::r-circlize", "r::r-biocircos", "conda-forge::r-dt", "conda-forge::r-flexdashboard", "conda-forge::r-ggplot2", "conda-forge::r-ggridges", "conda-forge::r-plotly", "conda-forge::r-tidyr", "bioconda::r-stitch"] + "r" : ["conda-forge::r-xml2", "conda-forge::r-highcharter", "conda-forge::r-circlize", "r::r-biocircos", "conda-forge::r-dt", "conda-forge::r-flexdashboard", "conda-forge::r-ggplot2", "conda-forge::r-ggridges", "conda-forge::r-plotly", "conda-forge::r-tidyr"], + "stitch" : ["bioconda::r-stitch=1.6.10"] } os.makedirs(".harpy_envs", exist_ok = True) # overwrites existing diff --git a/src/harpy/snakefiles/impute.smk b/src/harpy/snakefiles/impute.smk index 1a531300a..19368710e 100644 --- a/src/harpy/snakefiles/impute.smk +++ b/src/harpy/snakefiles/impute.smk @@ -129,7 +129,7 @@ rule impute: parameters = paramspace.instance, extra = config.get("extra", "") conda: - f"{envdir}/r.yaml" + f"{envdir}/stitch.yaml" benchmark: f".Benchmark/{outdir}/stitch.{paramspace.wildcard_pattern}" + ".{part}.txt" threads: diff --git a/src/harpy/validations.py b/src/harpy/validations.py index 50873b2dc..cca3b6bf5 100644 --- a/src/harpy/validations.py +++ b/src/harpy/validations.py @@ -18,7 +18,7 @@ def check_envdir(dirpath): print_error("This working directory does not contain the expected directory of conda environment definitions ([blue bold].harpy_envs/[/blue bold])\n - use [green bold]--conda[/green bold] to recreate it") sys.exit(1) envlist = os.listdir(dirpath) - envs = ["qc", "align", "snp", "sv", "phase", "simulations", "r"] + envs = ["align", "phase", "qc", "r", "simulations", "snp", "stitch", "sv"] errcount = 0 errtable = Table(show_footer=True, box=box.SIMPLE) errtable.add_column("File", justify="left", style="blue", no_wrap=True) From f7373df6d6f25dd0ea6ce6dbf1fb56586076ae0d Mon Sep 17 00:00:00 2001 From: pdimens Date: Wed, 3 Jul 2024 09:45:04 -0400 Subject: [PATCH 2/6] bump patch number --- pyproject.toml | 2 +- src/harpy/__main__.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/pyproject.toml b/pyproject.toml index f50501b33..340f1a204 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta" [project] name = "harpy" -version = "1.1.0" +version = "1.1.1" authors = [ {name = "Pavel Dimens"} ] diff --git a/src/harpy/__main__.py b/src/harpy/__main__.py index e36529dae..0d6cd4ca3 100644 --- a/src/harpy/__main__.py +++ b/src/harpy/__main__.py @@ -41,7 +41,7 @@ click.rich_click.ERRORS_EPILOGUE = "See the documentation: [link=https://pdimens.github.io/harpy/]https://pdimens.github.io/harpy/[/link]" @click.group(options_metavar='', context_settings={"help_option_names" : ["-h", "--help"]}) -@click.version_option("1.1.0", prog_name="Harpy") +@click.version_option("1.1.1", prog_name="Harpy") def cli(): """ An automated workflow for haplotagging linked-read data From 299005ed173f2d43147150c297a213fd65fbf6d8 Mon Sep 17 00:00:00 2001 From: pdimens Date: Wed, 3 Jul 2024 10:46:08 -0400 Subject: [PATCH 3/6] add missing env --- src/harpy/snakefiles/containerize.smk | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/src/harpy/snakefiles/containerize.smk b/src/harpy/snakefiles/containerize.smk index 2aa6e42f6..108c370a7 100644 --- a/src/harpy/snakefiles/containerize.smk +++ b/src/harpy/snakefiles/containerize.smk @@ -38,6 +38,11 @@ rule r_env: conda: os.getcwd() + "/.harpy_envs/r.yaml" shell: "touch {output}" +rule r_env: + output: "stitch.env" + conda: os.getcwd() + "/.harpy_envs/stitch.yaml" + shell: "touch {output}" + rule simulations: output: "simulations.env" conda: os.getcwd() + "/.harpy_envs/simulations.yaml" From 8855f0f196f83a4fb30da01cd61b1c21a148a30e Mon Sep 17 00:00:00 2001 From: pdimens Date: Wed, 3 Jul 2024 10:47:34 -0400 Subject: [PATCH 4/6] add to out --- src/harpy/snakefiles/containerize.smk | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/harpy/snakefiles/containerize.smk b/src/harpy/snakefiles/containerize.smk index 108c370a7..a36abaa11 100644 --- a/src/harpy/snakefiles/containerize.smk +++ b/src/harpy/snakefiles/containerize.smk @@ -6,7 +6,7 @@ onsuccess: rule all: input: - collect("{conda}.env", conda = ["qc","align","snp","sv","phase","r","simulations"]) + collect("{conda}.env", conda = ["align", "phase", "qc", "r","simulations", "snp","sv"]) rule qc: output: "qc.env" From 8c0e13281d9a4f88bd71995d0c80c26f0b29f156 Mon Sep 17 00:00:00 2001 From: pdimens Date: Wed, 3 Jul 2024 10:49:53 -0400 Subject: [PATCH 5/6] rename --- src/harpy/snakefiles/containerize.smk | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/harpy/snakefiles/containerize.smk b/src/harpy/snakefiles/containerize.smk index a36abaa11..06f37ce7f 100644 --- a/src/harpy/snakefiles/containerize.smk +++ b/src/harpy/snakefiles/containerize.smk @@ -33,12 +33,12 @@ rule phase: conda: os.getcwd() + "/.harpy_envs/phase.yaml" shell: "touch {output}" -rule r_env: +rule r: output: "r.env" conda: os.getcwd() + "/.harpy_envs/r.yaml" shell: "touch {output}" -rule r_env: +rule stitch: output: "stitch.env" conda: os.getcwd() + "/.harpy_envs/stitch.yaml" shell: "touch {output}" From bb1867f7857edd8bb42d24b7aef80581a2bc2e61 Mon Sep 17 00:00:00 2001 From: pdimens Date: Wed, 3 Jul 2024 11:14:35 -0400 Subject: [PATCH 6/6] add missing stitch. STOP DOING THIS --- src/harpy/snakefiles/containerize.smk | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/harpy/snakefiles/containerize.smk b/src/harpy/snakefiles/containerize.smk index 06f37ce7f..53ee6fc30 100644 --- a/src/harpy/snakefiles/containerize.smk +++ b/src/harpy/snakefiles/containerize.smk @@ -6,7 +6,7 @@ onsuccess: rule all: input: - collect("{conda}.env", conda = ["align", "phase", "qc", "r","simulations", "snp","sv"]) + collect("{conda}.env", conda = ["align", "phase", "qc", "r", "simulations", "snp", "stitch", "sv"]) rule qc: output: "qc.env"