From 2bc357c9b1b781182d1d3e397ae5bca65af0c78e Mon Sep 17 00:00:00 2001
From: "Michael R. Crusoe" <michael.crusoe@gmail.com>
Date: Wed, 1 Nov 2023 17:30:06 +0100
Subject: [PATCH 1/3] codespell: ignore "implementors"

---
 .ci/ignore-spelling.txt | 1 +
 1 file changed, 1 insertion(+)

diff --git a/.ci/ignore-spelling.txt b/.ci/ignore-spelling.txt
index 62397276eda2..42499364624a 100644
--- a/.ci/ignore-spelling.txt
+++ b/.ci/ignore-spelling.txt
@@ -1 +1,2 @@
 hda
+implementors

From 4dafda64d1ae8d7df5977ec8243d3d24598e3f08 Mon Sep 17 00:00:00 2001
From: "Michael R. Crusoe" <michael.crusoe@gmail.com>
Date: Wed, 1 Nov 2023 18:34:33 +0100
Subject: [PATCH 2/3] Fix typo in test_rule_helper: acutal_count -> actual_count

Co-authored-by: Nicola Soranzo <nicola.soranzo@earlham.ac.uk>
---
 test/unit/app/jobs/test_rule_helper.py | 8 +++-----
 1 file changed, 3 insertions(+), 5 deletions(-)

diff --git a/test/unit/app/jobs/test_rule_helper.py b/test/unit/app/jobs/test_rule_helper.py
index f7296b0861dc..eaf98dc0741e 100644
--- a/test/unit/app/jobs/test_rule_helper.py
+++ b/test/unit/app/jobs/test_rule_helper.py
@@ -56,11 +56,9 @@ def test_job_count():
 
 
 def __assert_job_count_is(expected_count, rule_helper, **kwds):
-    acutal_count = rule_helper.job_count(**kwds)
-
-    if expected_count != acutal_count:
-        template = "Expected job count %d, actual job count %s for params %s"
-        raise AssertionError(template % (expected_count, acutal_count, kwds))
+    actual_count = rule_helper.job_count(**kwds)
+    if expected_count != actual_count:
+        raise AssertionError(f"Expected job count {expected_count}, actual job count {actual_count} for params {kwds}")
 
 
 def __setup_fixtures(app):

From 707b31b0591771f8827a6b2061a1ba6628f429de Mon Sep 17 00:00:00 2001
From: mvdbeek <m.vandenbeek@gmail.com>
Date: Wed, 1 Nov 2023 21:38:02 +0100
Subject: [PATCH 3/3] Fix Anndata set_meta for updated h5py

---
 lib/galaxy/datatypes/binary.py | 48 +++++++++++++++++-----------------
 1 file changed, 24 insertions(+), 24 deletions(-)

diff --git a/lib/galaxy/datatypes/binary.py b/lib/galaxy/datatypes/binary.py
index c15b2213a94c..175034f083c4 100644
--- a/lib/galaxy/datatypes/binary.py
+++ b/lib/galaxy/datatypes/binary.py
@@ -22,6 +22,7 @@
     Optional,
     Tuple,
     TYPE_CHECKING,
+    Union,
 )
 
 import h5py
@@ -1482,6 +1483,22 @@ def set_meta(self, dataset: DatasetProtocol, overwrite: bool = True, **kwd) -> N
             dataset.metadata.layers_count = len(anndata_file)
             dataset.metadata.layers_names = list(anndata_file.keys())
 
+            def get_index_value(tmp: Union[h5py.Dataset, h5py.Datatype, h5py.Group]):
+                if isinstance(tmp, (h5py.Dataset, h5py.Datatype)):
+                    if "index" in tmp.dtype.names:
+                        return tmp["index"]
+                    if "_index" in tmp.dtype.names:
+                        return tmp["_index"]
+                    return None
+                else:
+                    index_var = tmp.attrs.get("index")
+                    if index_var is not None:
+                        return tmp[index_var]
+                    index_var = tmp.attrs.get("_index")
+                    if index_var is not None:
+                        return tmp[index_var]
+                    return None
+
             def _layercountsize(tmp, lennames=0):
                 "From TMP and LENNAMES, return layers, their number, and the length of one of the layers (all equal)."
                 if hasattr(tmp, "dtype"):
@@ -1489,30 +1506,17 @@ def _layercountsize(tmp, lennames=0):
                     count = len(tmp.dtype)
                     size = int(tmp.size)
                 else:
-                    layers = list(tmp.keys())
+                    layers = list(tmp.attrs)
                     count = len(layers)
                     size = lennames
                 return (layers, count, size)
 
             if "obs" in dataset.metadata.layers_names:
                 tmp = anndata_file["obs"]
-                obs_index = None
-                if "index" in tmp:
-                    obs_index = "index"
-                elif "_index" in tmp:
-                    obs_index = "_index"
+                obs = get_index_value(tmp)
                 # Determine cell labels
-                if obs_index:
-                    dataset.metadata.obs_names = list(tmp[obs_index])
-                elif hasattr(tmp, "dtype"):
-                    if "index" in tmp.dtype.names:
-                        # Yes, we call tmp["index"], and not tmp.dtype["index"]
-                        # here, despite the above tests.
-                        dataset.metadata.obs_names = list(tmp["index"])
-                    elif "_index" in tmp.dtype.names:
-                        dataset.metadata.obs_names = list(tmp["_index"])
-                    else:
-                        log.warning("Could not determine cell labels for %s", self)
+                if obs is not None:
+                    dataset.metadata.obs_names = [n.decode() for n in obs]
                 else:
                     log.warning("Could not determine observation index for %s", self)
 
@@ -1536,15 +1540,11 @@ def _layercountsize(tmp, lennames=0):
 
             if "var" in dataset.metadata.layers_names:
                 tmp = anndata_file["var"]
-                var_index = None
-                if "index" in tmp:
-                    var_index = "index"
-                elif "_index" in tmp:
-                    var_index = "_index"
+                index = get_index_value(tmp)
                 # We never use var_names
                 # dataset.metadata.var_names = tmp[var_index]
-                if var_index:
-                    x, y, z = _layercountsize(tmp, len(tmp[var_index]))
+                if index is not None:
+                    x, y, z = _layercountsize(tmp, len(index))
                 else:
                     # failing to detect a var_index is not an indicator
                     # that the dataset is empty