Skip to content

Commit

Permalink
Merge branch 'master' into kingfisher
Browse files Browse the repository at this point in the history
  • Loading branch information
SilasK authored Jun 25, 2024
2 parents eaffd5d + 4232e6e commit 378d2b5
Show file tree
Hide file tree
Showing 33 changed files with 170 additions and 183 deletions.
2 changes: 1 addition & 1 deletion atlas/atlas.py
Original file line number Diff line number Diff line change
Expand Up @@ -121,7 +121,7 @@ def get_snakefile(file="workflow/Snakefile"):
type=int,
default=multiprocessing.cpu_count(),
show_default=True,
help="use at most this many jobs in parallel (see cluster submission for mor details).",
help="use at most this many jobs in parallel (see cluster submission for more details).",
)
@click.option(
"--max-mem",
Expand Down
2 changes: 1 addition & 1 deletion atlas/init/create_sample_table.py
Original file line number Diff line number Diff line change
Expand Up @@ -158,7 +158,7 @@ def get_samples_from_fastq(path, fraction_split_character=split_character):
# parse subfolder
if len(subfolders) > 0:
logger.info(
f"Found {len(subfolders)} subfolders. Check if I find fastq files inside. Use the the subfolder as sample_names "
f"Found {len(subfolders)} subfolders. Check if I find fastq files inside. Use the subfolder as sample_names "
)

for subf in subfolders:
Expand Down
6 changes: 3 additions & 3 deletions atlas/init/parse_sra.py
Original file line number Diff line number Diff line change
Expand Up @@ -67,7 +67,7 @@ def filter_runinfo(RunTable, ignore_paired=False):

if Difference > 0:
logger.info(
f"Runs have the folowing values for {key}: {', '.join(All_values)}\n"
f"Runs have the following values for {key}: {', '.join(All_values)}\n"
f"Select only runs {key} == {Expected_library_values[key]}, "
f"Filtered out {Difference} runs"
)
Expand All @@ -77,7 +77,7 @@ def filter_runinfo(RunTable, ignore_paired=False):
All_values = RunTable[key].unique()
if any(RunTable[key] != Expected_library_values[key]):
logger.warning(
f"Runs have the folowing values for {key}: {', '.join(All_values)}\n"
f"Runs have the following values for {key}: {', '.join(All_values)}\n"
f"Usually I expect {key} == {Expected_library_values[key]} "
)

Expand Down Expand Up @@ -141,7 +141,7 @@ def validate_merging_runinfo(path):
logger.error(
f"You attemt to merge runs from the same sample. "
f"But for {len(problematic_samples)} samples the runs are sequenced with different platforms and should't be merged.\n"
f"Please resolve the the abiguity in the table {path} and rerun the command.\n"
f"Please resolve the abiguity in the table {path} and rerun the command.\n"
)

exit(1)
Expand Down
8 changes: 4 additions & 4 deletions docs/reports/QC_report.html

Large diffs are not rendered by default.

2 changes: 1 addition & 1 deletion docs/reports/assembly_report.html
Original file line number Diff line number Diff line change
Expand Up @@ -66,7 +66,7 @@ <h2>Total assembly length</h2>
<div> <div id="24f3b6b6-2545-4c37-a8a8-ed1e78adb3df" class="plotly-graph-div" style="height:100%; width:100%;"></div> <script type="text/javascript"> window.PLOTLYENV=window.PLOTLYENV || {}; if (document.getElementById("24f3b6b6-2545-4c37-a8a8-ed1e78adb3df")) { Plotly.newPlot( "24f3b6b6-2545-4c37-a8a8-ed1e78adb3df", [{"hovertemplate":"<b>%{hovertext}</b><br><br>Contigs (count)=%{x}<br>Total BP=%{y}<extra></extra>","hovertext":["SRS1992958","SRS1992960","SRS1992962","SRS1992964","SRS1992966","SRS1992968","SRS1992970","SRS1992972","SRS1992974","SRS1992976","SRS1992978","SRS1992980","SRS1992988","SRS1992990","SRS1992991","SRS1992992","SRS1992993","SRS1992994","SRS1992995","SRS1992998","SRS1992999","SRS1993000","SRS1993001","SRS1993002","SRS1993003","SRS1993004","SRS1993006","SRS1993058","SRS1993062","SRS1993066","SRS1993078","SRS1993092","SRS1993106","SRS1993108","SRS1993116","SRS1993122","SRS1993132","SRS1993134","SRS1993140","SRS1993148","SRS1993150","SRS1993166","SRS1993172"],"legendgroup":"","marker":{"color":"#1F77B4","symbol":"circle"},"mode":"markers","name":"","orientation":"v","showlegend":false,"type":"scatter","x":[4809,6784,17555,12992,4861,2581,2369,3496,2053,1744,3418,2536,6879,959,6749,4475,1093,246,16009,7905,7323,15292,13722,6504,10963,13463,8641,2553,11817,16472,6013,3032,4215,12521,4974,3951,7880,19989,1402,3496,12227,1675,4518],"xaxis":"x","y":[22869065,37434437,63947104,52814464,18082852,14448642,17760159,28515843,14761412,14488525,21928608,14389212,37573930,13916023,29542853,24835497,8923950,5200445,70290913,39996427,49074212,51637442,67178502,44411971,39617553,50726622,38929314,23970819,49606407,52610954,17441853,16835480,30879085,37415823,25264552,19655831,27150699,72270939,13382422,13741612,41840211,12372381,22028675],"yaxis":"y"}], {"legend":{"tracegroupgap":0},"margin":{"t":60},"template":{"data":{"bar":[{"error_x":{"color":"rgb(36,36,36)"},"error_y":{"color":"rgb(36,36,36)"},"marker":{"line":{"color":"white","width":0.5},"pattern":{"fillmode":"overlay","size":10,"solidity":0.2}},"type":"bar"}],"barpolar":[{"marker":{"line":{"color":"white","width":0.5},"pattern":{"fillmode":"overlay","size":10,"solidity":0.2}},"type":"barpolar"}],"carpet":[{"aaxis":{"endlinecolor":"rgb(36,36,36)","gridcolor":"white","linecolor":"white","minorgridcolor":"white","startlinecolor":"rgb(36,36,36)"},"baxis":{"endlinecolor":"rgb(36,36,36)","gridcolor":"white","linecolor":"white","minorgridcolor":"white","startlinecolor":"rgb(36,36,36)"},"type":"carpet"}],"choropleth":[{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"},"type":"choropleth"}],"contour":[{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"},"colorscale":[[0.0,"#440154"],[0.1111111111111111,"#482878"],[0.2222222222222222,"#3e4989"],[0.3333333333333333,"#31688e"],[0.4444444444444444,"#26828e"],[0.5555555555555556,"#1f9e89"],[0.6666666666666666,"#35b779"],[0.7777777777777778,"#6ece58"],[0.8888888888888888,"#b5de2b"],[1.0,"#fde725"]],"type":"contour"}],"contourcarpet":[{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"},"type":"contourcarpet"}],"heatmap":[{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"},"colorscale":[[0.0,"#440154"],[0.1111111111111111,"#482878"],[0.2222222222222222,"#3e4989"],[0.3333333333333333,"#31688e"],[0.4444444444444444,"#26828e"],[0.5555555555555556,"#1f9e89"],[0.6666666666666666,"#35b779"],[0.7777777777777778,"#6ece58"],[0.8888888888888888,"#b5de2b"],[1.0,"#fde725"]],"type":"heatmap"}],"heatmapgl":[{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"},"colorscale":[[0.0,"#440154"],[0.1111111111111111,"#482878"],[0.2222222222222222,"#3e4989"],[0.3333333333333333,"#31688e"],[0.4444444444444444,"#26828e"],[0.5555555555555556,"#1f9e89"],[0.6666666666666666,"#35b779"],[0.7777777777777778,"#6ece58"],[0.8888888888888888,"#b5de2b"],[1.0,"#fde725"]],"type":"heatmapgl"}],"histogram":[{"marker":{"line":{"color":"white","width":0.6}},"type":"histogram"}],"histogram2d":[{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"},"colorscale":[[0.0,"#440154"],[0.1111111111111111,"#482878"],[0.2222222222222222,"#3e4989"],[0.3333333333333333,"#31688e"],[0.4444444444444444,"#26828e"],[0.5555555555555556,"#1f9e89"],[0.6666666666666666,"#35b779"],[0.7777777777777778,"#6ece58"],[0.8888888888888888,"#b5de2b"],[1.0,"#fde725"]],"type":"histogram2d"}],"histogram2dcontour":[{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"},"colorscale":[[0.0,"#440154"],[0.1111111111111111,"#482878"],[0.2222222222222222,"#3e4989"],[0.3333333333333333,"#31688e"],[0.4444444444444444,"#26828e"],[0.5555555555555556,"#1f9e89"],[0.6666666666666666,"#35b779"],[0.7777777777777778,"#6ece58"],[0.8888888888888888,"#b5de2b"],[1.0,"#fde725"]],"type":"histogram2dcontour"}],"mesh3d":[{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"},"type":"mesh3d"}],"parcoords":[{"line":{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"}},"type":"parcoords"}],"pie":[{"automargin":true,"type":"pie"}],"scatter":[{"marker":{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"}},"type":"scatter"}],"scatter3d":[{"line":{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"}},"marker":{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"}},"type":"scatter3d"}],"scattercarpet":[{"marker":{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"}},"type":"scattercarpet"}],"scattergeo":[{"marker":{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"}},"type":"scattergeo"}],"scattergl":[{"marker":{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"}},"type":"scattergl"}],"scattermapbox":[{"marker":{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"}},"type":"scattermapbox"}],"scatterpolar":[{"marker":{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"}},"type":"scatterpolar"}],"scatterpolargl":[{"marker":{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"}},"type":"scatterpolargl"}],"scatterternary":[{"marker":{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"}},"type":"scatterternary"}],"surface":[{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"},"colorscale":[[0.0,"#440154"],[0.1111111111111111,"#482878"],[0.2222222222222222,"#3e4989"],[0.3333333333333333,"#31688e"],[0.4444444444444444,"#26828e"],[0.5555555555555556,"#1f9e89"],[0.6666666666666666,"#35b779"],[0.7777777777777778,"#6ece58"],[0.8888888888888888,"#b5de2b"],[1.0,"#fde725"]],"type":"surface"}],"table":[{"cells":{"fill":{"color":"rgb(237,237,237)"},"line":{"color":"white"}},"header":{"fill":{"color":"rgb(217,217,217)"},"line":{"color":"white"}},"type":"table"}]},"layout":{"annotationdefaults":{"arrowhead":0,"arrowwidth":1},"autotypenumbers":"strict","coloraxis":{"colorbar":{"outlinewidth":1,"tickcolor":"rgb(36,36,36)","ticks":"outside"}},"colorscale":{"diverging":[[0.0,"rgb(103,0,31)"],[0.1,"rgb(178,24,43)"],[0.2,"rgb(214,96,77)"],[0.3,"rgb(244,165,130)"],[0.4,"rgb(253,219,199)"],[0.5,"rgb(247,247,247)"],[0.6,"rgb(209,229,240)"],[0.7,"rgb(146,197,222)"],[0.8,"rgb(67,147,195)"],[0.9,"rgb(33,102,172)"],[1.0,"rgb(5,48,97)"]],"sequential":[[0.0,"#440154"],[0.1111111111111111,"#482878"],[0.2222222222222222,"#3e4989"],[0.3333333333333333,"#31688e"],[0.4444444444444444,"#26828e"],[0.5555555555555556,"#1f9e89"],[0.6666666666666666,"#35b779"],[0.7777777777777778,"#6ece58"],[0.8888888888888888,"#b5de2b"],[1.0,"#fde725"]],"sequentialminus":[[0.0,"#440154"],[0.1111111111111111,"#482878"],[0.2222222222222222,"#3e4989"],[0.3333333333333333,"#31688e"],[0.4444444444444444,"#26828e"],[0.5555555555555556,"#1f9e89"],[0.6666666666666666,"#35b779"],[0.7777777777777778,"#6ece58"],[0.8888888888888888,"#b5de2b"],[1.0,"#fde725"]]},"colorway":["#1F77B4","#FF7F0E","#2CA02C","#D62728","#9467BD","#8C564B","#E377C2","#7F7F7F","#BCBD22","#17BECF"],"font":{"color":"rgb(36,36,36)"},"geo":{"bgcolor":"white","lakecolor":"white","landcolor":"white","showlakes":true,"showland":true,"subunitcolor":"white"},"hoverlabel":{"align":"left"},"hovermode":"closest","mapbox":{"style":"light"},"paper_bgcolor":"white","plot_bgcolor":"white","polar":{"angularaxis":{"gridcolor":"rgb(232,232,232)","linecolor":"rgb(36,36,36)","showgrid":false,"showline":true,"ticks":"outside"},"bgcolor":"white","radialaxis":{"gridcolor":"rgb(232,232,232)","linecolor":"rgb(36,36,36)","showgrid":false,"showline":true,"ticks":"outside"}},"scene":{"xaxis":{"backgroundcolor":"white","gridcolor":"rgb(232,232,232)","gridwidth":2,"linecolor":"rgb(36,36,36)","showbackground":true,"showgrid":false,"showline":true,"ticks":"outside","zeroline":false,"zerolinecolor":"rgb(36,36,36)"},"yaxis":{"backgroundcolor":"white","gridcolor":"rgb(232,232,232)","gridwidth":2,"linecolor":"rgb(36,36,36)","showbackground":true,"showgrid":false,"showline":true,"ticks":"outside","zeroline":false,"zerolinecolor":"rgb(36,36,36)"},"zaxis":{"backgroundcolor":"white","gridcolor":"rgb(232,232,232)","gridwidth":2,"linecolor":"rgb(36,36,36)","showbackground":true,"showgrid":false,"showline":true,"ticks":"outside","zeroline":false,"zerolinecolor":"rgb(36,36,36)"}},"shapedefaults":{"fillcolor":"black","line":{"width":0},"opacity":0.3},"ternary":{"aaxis":{"gridcolor":"rgb(232,232,232)","linecolor":"rgb(36,36,36)","showgrid":false,"showline":true,"ticks":"outside"},"baxis":{"gridcolor":"rgb(232,232,232)","linecolor":"rgb(36,36,36)","showgrid":false,"showline":true,"ticks":"outside"},"bgcolor":"white","caxis":{"gridcolor":"rgb(232,232,232)","linecolor":"rgb(36,36,36)","showgrid":false,"showline":true,"ticks":"outside"}},"title":{"x":0.05},"xaxis":{"automargin":true,"gridcolor":"rgb(232,232,232)","linecolor":"rgb(36,36,36)","showgrid":false,"showline":true,"ticks":"outside","title":{"standoff":15},"zeroline":false,"zerolinecolor":"rgb(36,36,36)"},"yaxis":{"automargin":true,"gridcolor":"rgb(232,232,232)","linecolor":"rgb(36,36,36)","showgrid":false,"showline":true,"ticks":"outside","title":{"standoff":15},"zeroline":false,"zerolinecolor":"rgb(36,36,36)"}}},"xaxis":{"anchor":"y","domain":[0.0,1.0],"title":{"text":"Contigs (count)"}},"yaxis":{"anchor":"x","domain":[0.0,1.0],"title":{"text":"Total BP"}}}, {"responsive": true} ) }; </script> </div>


<h2>Fragmentation<h/2>
<h2>Fragmentation</h2>

<p>
N50/N90 is a measure of how fractionated assemblies are:
Expand Down
8 changes: 4 additions & 4 deletions docs/reports/bin_report_DASTool.html

Large diffs are not rendered by default.

8 changes: 4 additions & 4 deletions docs/reports/bin_report_SemiBin.html

Large diffs are not rendered by default.

8 changes: 4 additions & 4 deletions docs/reports/bin_report_vamb.html

Large diffs are not rendered by default.

15 changes: 7 additions & 8 deletions docs/usage/configuration.rst
Original file line number Diff line number Diff line change
Expand Up @@ -11,10 +11,10 @@ _contaminants:
Remove reads from Host
======================

One of the most important steps in the Quality control is to remove host genome.
One of the most important steps in the Quality control is to remove reads from the host's genome.
You can add any number of genomes to be removed.

We recommend you to use genomes where repetitive sequences are masked.
We recommend using genomes where repetitive sequences are masked.
See here for more details `human genome <http://seqanswers.com/forums/archive/index.php/t-42552.html>`_.


Expand All @@ -36,7 +36,7 @@ There are two primary strategies for co-abundance binning:
The samples to be binned together are specified using the `BinGroup` in the `sample.tsv` file.
The size of the BinGroup should be selected based on the binner and the co-binning strategy in use.

Cross mapping complexity scales quadratically with the size of the BinGroup since each sample's reads are mapped to each other.
Cross-mapping complexity scales quadratically with the size of the BinGroup since each sample's reads are mapped to each other.
This might yield better results for complex metagenomes, although no definitive benchmark is known.
On the other hand, co-binning is more efficient, as it maps a sample's reads only once to a potentially large assembly.

Expand Down Expand Up @@ -88,21 +88,20 @@ Long reads
==========

Limitation: Hybrid assembly of long and short reads is supported with spades and metaSpades.
However metaSpades needs a paired-end short-read library.
However, metaSpades needs a paired-end short-read library.

The path of the (preprocessed) long reads should be added manually to the
the sample table under a new column heading 'longreads'.
sample table under a new column heading 'longreads'.

In addition the type of the long reads should be defined in the config file:
In addition, the type of the long reads should be defined in the config file:
``longread_type`` one of ["pacbio", "nanopore", "sanger", "trusted-contigs", "untrusted-contigs"]


Example config file
===================


..
include:: ../../workflow/../config/template_config.yaml
..include:: ../../config/template_config.yaml
:code:


Expand Down
Loading

0 comments on commit 378d2b5

Please sign in to comment.