@@ -2,7 +2,7 @@ viash_version: 0.9.0-RC7
2
2
3
3
# Step 1: Change the name of the task.
4
4
# example: task_name_of_this_task
5
- name : task_template
5
+ name : task_dimensionality_reduction
6
6
organization : openproblems-bio
7
7
version : dev
8
8
@@ -11,68 +11,107 @@ license: MIT
11
11
keywords : [single-cell, openproblems, benchmark]
12
12
# Step 3: Update the `task_template` to the name of the task from step 1.
13
13
links :
14
- issue_tracker : https://github.com/openproblems-bio/task_template /issues
15
- repository : https://github.com/openproblems-bio/task_template
14
+ issue_tracker : https://github.com/openproblems-bio/task_dimensionality_reduction /issues
15
+ repository : https://github.com/openproblems-bio/task_dimensionality_reduction
16
16
docker_registry : ghcr.io
17
17
18
-
19
18
# Step 4: Update the label, summary and description.
20
19
# A unique, human-readable, short label. Used for creating summary tables and visualisations.
21
- label : Template
22
- summary : A one sentence summary of purpose and methodology. Used for creating an overview tables .
20
+ label : Dimensionality Reduction for Visualization
21
+ summary : Reduction of high-dimensional datasets to 2D for visualization & interpretation .
23
22
description : |
24
- Provide a clear and concise description of your task, detailing the specific problem it aims
25
- to solve. Outline the input data types, the expected output, and any assumptions or constraints.
26
- Be sure to explain any terminology or concepts that are essential for understanding the task.
27
-
28
- Explain the motivation behind your proposed task. Describe the biological or computational
29
- problem you aim to address and why it's important. Discuss the current state of research in
30
- this area and any gaps or challenges that your task could help address. This section
31
- should convince readers of the significance and relevance of your task.
32
-
23
+ Data visualisation is an important part of all stages of single-cell analysis, from
24
+ initial quality control to interpretation and presentation of final results. For bulk RNA-seq
25
+ studies, linear dimensionality reduction techniques such as PCA and MDS are commonly used
26
+ to visualise the variation between samples. While these methods are highly effective they
27
+ can only be used to show the first few components of variation which cannot fully represent
28
+ the increased complexity and number of observations in single-cell datasets. For this reason
29
+ non-linear techniques (most notably t-SNE and UMAP) have become the standard for visualising
30
+ single-cell studies. These methods attempt to compress a dataset into a two-dimensional space
31
+ while attempting to capture as much of the variance between observations as possible. Many
32
+ methods for solving this problem now exist. In general these methods try to preserve distances,
33
+ while some additionally consider aspects such as density within the embedded space or conservation
34
+ of continuous trajectories. Despite almost every single-cell study using one of these visualisations
35
+ there has been debate as to whether they can effectively capture the variation in single-cell
36
+ datasets [@chari2023speciousart].
37
+
38
+ The dimensionality reduction task attempts to quantify the ability of methods to embed the
39
+ information present in complex single-cell studies into a two-dimensional space. Thus, this task
40
+ is specifically designed for dimensionality reduction for visualisation and does not consider other
41
+ uses of dimensionality reduction in standard single-cell workflows such as improving the
42
+ signal-to-noise ratio (and in fact several of the methods use PCA as a pre-processing step for this
43
+ reason). Unlike most tasks, methods for the dimensionality reduction task must accept a matrix
44
+ containing expression values normalised to 10,000 counts per cell and log transformed (log-10k) and
45
+ produce a two-dimensional coordinate for each cell. Pre-normalised matrices are required to
46
+ enforce consistency between the metric evaluation (which generally requires normalised data) and
47
+ the method runs. When these are not consistent, methods that use the same normalisation as used in
48
+ the metric tend to score more highly. For some methods we also evaluate the pre-processing
49
+ recommended by the method.
33
50
# A list of references to relevant literature. Each reference should be a DOI or a bibtex entry
34
- references :
35
- doi :
36
- - 10.21203/rs.3.rs-4181617/v1
37
- # bibtex:
38
- # - |
39
- # @article{doe_2021_template,
40
- # doi = {10.21203/rs.3.rs-4181617/v1},
41
- # url = {https://doi.org/10.21203/rs.3.rs-4181617/v1},
42
- # author = {Doe, John},
43
- # title = {A template for creating new tasks},
44
- # publisher = {Research Square},
45
- # year = {2021},
46
- # }
51
+ # references:
52
+ # doi:
53
+ # - 10.21203/rs.3.rs-4181617/v1
54
+ # bibtex:
55
+ # - |
56
+ # @article{doe_2021_template,
57
+ # doi = {10.21203/rs.3.rs-4181617/v1},
58
+ # url = {https://doi.org/10.21203/rs.3.rs-4181617/v1},
59
+ # author = {Doe, John},
60
+ # title = {A template for creating new tasks},
61
+ # publisher = {Research Square},
62
+ # year = {2021},
63
+ # }
47
64
48
65
info :
49
- image : The name of the image file to use for the component on the website.
66
+ image : thumbnail.svg
50
67
# Step 5: Replace the task_template to the name of the task.
51
68
test_resources :
52
69
- type : s3
53
- path : s3://openproblems-data/resources_test/task_template /
54
- dest : resources_test/task_template
70
+ path : s3://openproblems-data/resources_test/common/pancreas /
71
+ dest : resources_test/common/pancreas/
55
72
- type : s3
56
- path : s3://openproblems-data/resources_test/common /
57
- dest : resources_test/common
73
+ path : s3://openproblems-data/resources_test/dimensionality_reduction /
74
+ dest : resources_test/dimensionality_reduction
58
75
59
76
# Step 6: Update the authors of the task.
60
77
authors :
61
- # Full name of the author, usually in the name of FirstName MiddleName LastName.
62
- - name : John Doe
63
- # Role of the author. Possible values:
64
- #
65
- # * `"author"`: Authors who have made substantial contributions to the component.
66
- # * `"maintainer"`: The maintainer of the component.
67
- # * `"contributor"`: Authors who have made smaller contributions (such as code patches etc.).
68
- roles : [ "author", "maintainer" ]
69
- # Additional information on the author
70
- info :
71
- github : johndoe
72
- orcid : 0000-0000-0000-0000
73
- email : john@doe.me
74
- twitter : johndoe
75
- linkedin : johndoe
78
+ - name : Luke Zappia
79
+ roles : [ maintainer, author ]
80
+ info :
81
+ github : lazappi
82
+ - name : Michal Klein
83
+ roles : [ author ]
84
+ info :
85
+ github : michalk8
86
+ - name : Scott Gigante
87
+ roles : [ author ]
88
+ info :
89
+ github : scottgigante
90
+ orcid : " 0000-0002-4544-2764"
91
+ - name : Ben DeMeo
92
+ roles : [ author ]
93
+ info :
94
+ github : bendemeo
95
+ - name : Robrecht Cannoodt
96
+ roles : [ author ]
97
+ info :
98
+ github : rcannood
99
+ orcid : 0000-0003-3641-729X
100
+ - name : Kai Waldrant
101
+ roles : [ contributor ]
102
+ info :
103
+ github : KaiWaldrant
104
+ orcid : 0009-0003-8555-1361
105
+ - name : Sai Nirmayi Yasa
106
+ roles : [ contributor ]
107
+ info :
108
+ github : sainirmayi
109
+ orcid : 0009-0003-6319-9803
110
+ - name : Juan A. Cordero Varela
111
+ roles : [ contributor ]
112
+ info :
113
+ github : jacorvar
114
+ orcid : 0000-0002-7373-5433
76
115
77
116
# Step 7: Remove all of the comments of the steps you completed
78
117
# Step 8: High five yourself!
0 commit comments