scverse · rcannood · Dec 2, 2023 · Sep 19, 2023 · Sep 19, 2023 · Sep 19, 2023
diff --git a/R/AbstractAnnData.R b/R/AbstractAnnData.R
@@ -69,6 +69,10 @@ AbstractAnnData <- R6::R6Class("AbstractAnnData", # nolint
     #'   with all elements having the same number of rows and columns as `var`.
     varp = function(value) {
       .abstract_function("ad$varp")
+    },
+    #' @field uns The uns slot. Must be `NULL` or a named list.
+    uns = function(value) {
+      .abstract_function("ad$uns")
     }
   ),
   public = list(
@@ -236,6 +240,21 @@ AbstractAnnData <- R6::R6Class("AbstractAnnData", # nolint
       collection
     },
 
+    # @description `.validate_named_list()` returns its input unchanged when
+    #   it is NULL, an empty list or a named list, and throws an error otherwise.
+    # @param collection The value to validate.
+    # @param label Name of the slot being validated, used in the error message.
+    .validate_named_list = function(collection, label) {
+      if (is.null(collection)) {
+        return(collection)
+      }
+      if (!is.list(collection) || (length(collection) != 0 && is.null(names(collection)))) {
+        found <- paste(class(collection), collapse = "/") # class() may be length > 1
+        stop(paste0(label, " must be a named list, was ", found))
+      }
+      collection
+    },
+
     # @description `.validate_obsvar_dataframe()` checks that the
     #   object is a data.frame and removes explicit dimnames.
     # @param df A data frame to validate. Should be an obs or a var.

diff --git a/R/AnnData.R b/R/AnnData.R
@@ -39,6 +39,8 @@
 #' @param varp The varp slot is used to store sparse multi-dimensional
 #'   annotation arrays. It must be either `NULL` or a named list, where each
 #'   element is a sparse matrix where each dimension has length `n_vars`.
+#' @param uns The uns slot is used to store unstructured annotation. It must
+#'   be either `NULL` or a named list.
 #'
 #' @export
 #'
@@ -67,7 +69,8 @@ AnnData <- function(
     obsm = NULL,
     varm = NULL,
     obsp = NULL,
-    varp = NULL) {
+    varp = NULL,
+    uns = NULL) {
   InMemoryAnnData$new(
     obs_names = obs_names,
     var_names = var_names,
@@ -78,6 +81,7 @@ AnnData <- function(
     obsm = obsm,
     varm = varm,
     obsp = obsp,
-    varp = varp
+    varp = varp,
+    uns = uns
   )
 }
diff --git a/R/HDF5AnnData.R b/R/HDF5AnnData.R
@@ -10,10 +10,6 @@ HDF5AnnData <- R6::R6Class("HDF5AnnData", # nolint
     .n_vars = NULL,
     .obs_names = NULL,
     .var_names = NULL,
-    .obsm = NULL,
-    .varm = NULL,
-    .obsp = NULL,
-    .varp = NULL,
     .compression = NULL
   ),
   active = list(
@@ -191,6 +187,17 @@ HDF5AnnData <- R6::R6Class("HDF5AnnData", # nolint
         write_h5ad_data_frame_index(value, private$.h5obj, "var", private$.compression, "_index")
         private$.var_names <- value
       }
+    },
+    #' @field uns The uns slot. Must be `NULL` or a named list.
+    uns = function(value) {
+      if (missing(value)) {
+        # trackstatus: class=HDF5AnnData, feature=get_uns, status=done
+        read_h5ad_element(private$.h5obj, "uns")
+      } else {
+        # trackstatus: class=HDF5AnnData, feature=set_uns, status=done
+        value <- private$.validate_named_list(value, "uns")
+        write_h5ad_element(value, private$.h5obj, "/uns", private$.compression)
+      }
     }
   ),
   public = list(
@@ -229,6 +236,8 @@ HDF5AnnData <- R6::R6Class("HDF5AnnData", # nolint
     #' @param varp The varp slot is used to store sparse multi-dimensional
     #'   annotation arrays. It must be either `NULL` or a named list, where each
     #'   element is a sparse matrix where each dimension has length `n_vars`.
+    #' @param uns The uns slot is used to store unstructured annotation. It must
+    #'   be either `NULL` or a named list.
     #' @param compression The compression algorithm to use when writing the
     #'  HDF5 file. Can be one of `"none"`, `"gzip"` or `"lzf"`. Defaults to
     #' `"none"`.
@@ -251,6 +260,7 @@ HDF5AnnData <- R6::R6Class("HDF5AnnData", # nolint
                           varm = NULL,
                           obsp = NULL,
                           varp = NULL,
+                          uns = NULL,
                           compression = c("none", "gzip", "lzf")) {
       if (!requireNamespace("rhdf5", quietly = TRUE)) {
         stop("The HDF5 interface requires the 'rhdf5' package to be installed")
@@ -333,6 +343,10 @@ HDF5AnnData <- R6::R6Class("HDF5AnnData", # nolint
       if (!is.null(varp)) {
         self$varp <- varp
       }
+
+      if (!is.null(uns)) {
+        self$uns <- uns
+      }
     },
 
     #' @description Number of observations in the AnnData object
@@ -400,6 +414,7 @@ to_HDF5AnnData <- function(adata, file, compression = c("none", "gzip", "lzf"))
     layers = adata$layers,
     obsp = adata$obsp,
     varp = adata$varp,
+    uns = adata$uns,
     compression = compression
   )
 }
diff --git a/R/InMemoryAnnData.R b/R/InMemoryAnnData.R
@@ -39,7 +39,8 @@ InMemoryAnnData <- R6::R6Class("InMemoryAnnData", # nolint
     .obsm = NULL,
     .varm = NULL,
     .obsp = NULL,
-    .varp = NULL
+    .varp = NULL,
+    .uns = NULL
   ),
   active = list(
     #' @field X NULL or an observation x variable matrix (without
@@ -204,6 +205,17 @@ InMemoryAnnData <- R6::R6Class("InMemoryAnnData", # nolint
         )
         self
       }
+    },
+    #' @field uns The uns slot. Must be `NULL` or a named list.
+    uns = function(value) {
+      if (missing(value)) {
+        # trackstatus: class=InMemoryAnnData, feature=get_uns, status=done
+        private$.uns
+      } else {
+        # trackstatus: class=InMemoryAnnData, feature=set_uns, status=done
+        private$.uns <- private$.validate_named_list(value, "uns")
+        self
+      }
     }
   ),
   public = list(
@@ -242,6 +254,8 @@ InMemoryAnnData <- R6::R6Class("InMemoryAnnData", # nolint
     #' @param varp The varp slot is used to store sparse multi-dimensional
     #'   annotation arrays. It must be either `NULL` or a named list, where each
     #'   element is a sparse matrix where each dimension has length `n_vars`.
+    #' @param uns The uns slot is used to store unstructured annotation.
+    #'   It must be either `NULL` or a named list.
     initialize = function(obs_names,
                           var_names,
                           X = NULL,
@@ -251,7 +265,8 @@ InMemoryAnnData <- R6::R6Class("InMemoryAnnData", # nolint
                           obsm = NULL,
                           varm = NULL,
                           obsp = NULL,
-                          varp = NULL) {
+                          varp = NULL,
+                          uns = NULL) {
       # write obs and var first, because these are used by other validators
       self$obs_names <- obs_names
       self$var_names <- var_names
@@ -265,6 +280,7 @@ InMemoryAnnData <- R6::R6Class("InMemoryAnnData", # nolint
       self$varm <- varm
       self$obsp <- obsp
       self$varp <- varp
+      self$uns <- uns
     }
   )
 )
@@ -308,6 +324,7 @@ to_InMemoryAnnData <- function(adata) { # nolint
     obsm = adata$obsm,
     varm = adata$varm,
     obsp = adata$obsp,
-    varp = adata$varp
+    varp = adata$varp,
+    uns = adata$uns
   )
 }
diff --git a/R/read_h5ad_helpers.R b/R/read_h5ad_helpers.R
@@ -358,7 +358,14 @@ read_h5ad_string_scalar <- function(file, name, version = "0.2.0") {
 #' @noRd
 read_h5ad_numeric_scalar <- function(file, name, version = "0.2.0") {
   version <- match.arg(version)
-  rhdf5::h5read(file, name)
+  value <- rhdf5::h5read(file, name)
+
+  # {rhdf5} reads Boolean scalars as factors, so only those need converting
+  if (!is.factor(value)) {
+    return(value)
+  }
+
+  as.logical(value)
 }
 
 #' Read H5AD mapping

diff --git a/R/write_h5ad.R b/R/write_h5ad.R
@@ -29,7 +29,6 @@
 #'
 #' # Write a SingleCellExperiment as an H5AD
 #' if (requireNamespace("SingleCellExperiment", quietly = TRUE)) {
-#'   h5ad_file <- tempfile(fileext = ".h5ad")
 #'   ncells <- 100
 #'   counts <- matrix(rpois(20000, 5), ncol = ncells)
 #'   logcounts <- log2(counts + 1)
@@ -41,12 +40,14 @@
 #'     assays = list(counts = counts, logcounts = logcounts),
 #'     reducedDims = list(PCA = pca, tSNE = tsne)
 #'   )
+#'
+#'   h5ad_file <- tempfile(fileext = ".h5ad")
+#'   write_h5ad(sce, h5ad_file)
 #' }
 #'
 #' # Write a Seurat as a H5AD
 #' if (requireNamespace("SeuratObject", quietly = TRUE)) {
 #'   # TODO: uncomment this code when the seurat converter is fixed
-#'   # h5ad_file <- tempfile(fileext = ".h5ad")
 #'   # counts <- matrix(1:15, 3L, 5L)
 #'   # dimnames(counts) <- list(
 #'   #   letters[1:3],
@@ -63,6 +64,7 @@
 #'   # )
 #'   # obj <- SeuratObject::AddMetaData(obj, cell.metadata)
 #'   #
+#'   # h5ad_file <- tempfile(fileext = ".h5ad")
 #'   # write_h5ad(obj, h5ad_file)
 #' }
 write_h5ad <- function(object, path, compression = c("none", "gzip", "lzf")) {

diff --git a/R/write_h5ad_helpers.R b/R/write_h5ad_helpers.R
@@ -53,6 +53,9 @@ write_h5ad_element <- function(value, file, name, compression = c("none", "gzip"
     } else if (is.logical(value)) { # Logical values
       if (any(is.na(value))) {
         write_h5ad_nullable_boolean
+      } else if (length(value) == 1) {
+        # Single Booleans should be written as numeric scalars
+        write_h5ad_numeric_scalar
       } else {
         write_h5ad_dense_array
       }
@@ -324,7 +327,7 @@ write_h5ad_numeric_scalar <- function(value, file, name, compression, version =
   hdf5_write_compressed(file, name, value, compression)
 
   # Write attributes
-  write_h5ad_encoding(file, name, "numeric", version)
+  write_h5ad_encoding(file, name, "numeric-scalar", version)
 }
 
 #' Write H5AD mapping

diff --git a/man/AbstractAnnData.Rd b/man/AbstractAnnData.Rd
diff --git a/man/AnnData.Rd b/man/AnnData.Rd
diff --git a/man/HDF5AnnData.Rd b/man/HDF5AnnData.Rd
diff --git a/man/InMemoryAnnData.Rd b/man/InMemoryAnnData.Rd
diff --git a/man/write_h5ad.Rd b/man/write_h5ad.Rd