Improve test design (#651)

Signed-off-by: zethson <[email protected]>
theislab · Feb 3, 2024 · a376f0c
1 parent 4725a33
commit a376f0c
Show file tree

Hide file tree

Showing 8 changed files with 702 additions and 698 deletions.
diff --git a/ehrapy/data/_datasets.py b/ehrapy/data/_datasets.py
@@ -4,7 +4,7 @@
 
 from ehrapy import ehrapy_settings
 from ehrapy.io._read import read_csv, read_fhir, read_h5ad
-from ehrapy.preprocessing._encode import encode
+from ehrapy.preprocessing._encoding import encode
 
 if TYPE_CHECKING:
     import pandas as pd

diff --git a/ehrapy/io/_read.py b/ehrapy/io/_read.py
@@ -14,7 +14,7 @@
 from ehrapy import ehrapy_settings, settings
 from ehrapy.anndata.anndata_ext import df_to_anndata
 from ehrapy.data._dataloader import download, remove_archive_extension
-from ehrapy.preprocessing._encode import encode
+from ehrapy.preprocessing._encoding import encode
 
 if TYPE_CHECKING:
     from collections.abc import Iterator
@@ -498,7 +498,7 @@ def _read_from_cache_dir(cache_dir: Path) -> dict[str, AnnData]:
 def _read_from_cache(path_cache: Path) -> AnnData:
     """Read AnnData object from cached file."""
     cached_adata = read_h5(path_cache)
-    # type cast required when dealing with non numerical data; otherwise all values in X would be treated as strings
+    # type cast required when dealing with non-numerical data; otherwise all values in X would be treated as strings
     if not np.issubdtype(cached_adata.X.dtype, np.number):
         cached_adata.X = cached_adata.X.astype("object")
     try:
@@ -530,7 +530,7 @@ def _write_cache_dir(
         index_column: The index columns for each object (if any)
 
     Returns:
-        A dict containing an unique identifier and an :class:`~anndata.AnnData` object for each file read
+        A dict containing a unique identifier and an :class:`~anndata.AnnData` object for each file read
     """
     for identifier in adata_objects:
         # for each identifier (for the AnnData object), we need the index column and obs_only cols (if any) for reuse when reading cache
@@ -549,7 +549,7 @@ def _write_cache(
     """Write AnnData object to cache"""
     original_x_dtype = raw_anndata.X.dtype
     if not np.issubdtype(original_x_dtype, np.number):
-        cached_adata = encode(data=raw_anndata, autodetect=True)
+        cached_adata = encode(adata=raw_anndata, autodetect=True)
     else:
         cached_adata = raw_anndata
     # temporary key that stores all column names that are obs only for this AnnData object

diff --git a/ehrapy/io/_write.py b/ehrapy/io/_write.py
@@ -6,7 +6,7 @@
 import numpy as np
 
 from ehrapy import settings
-from ehrapy.preprocessing._encode import encode
+from ehrapy.preprocessing._encoding import encode
 
 if TYPE_CHECKING:
     from anndata import AnnData

diff --git a/ehrapy/preprocessing/__init__.py b/ehrapy/preprocessing/__init__.py
@@ -1,4 +1,4 @@
-from ehrapy.preprocessing._encode import encode, undo_encoding
+from ehrapy.preprocessing._encoding import encode, undo_encoding
 from ehrapy.preprocessing._highly_variable_features import highly_variable_features
 from ehrapy.preprocessing._imputation import (
     explicit_impute,

diff --git a/ehrapy/preprocessing/_encode.py b/ehrapy/preprocessing/_encoding.py
rename from ehrapy/preprocessing/_encode.py
rename to ehrapy/preprocessing/_encoding.py