bug, typing and docstring fixes

NygenAnalytics · May 22, 2023 · 5215769
1 parent de4e866
commit 5215769
Show file tree

Hide file tree

Showing 4 changed files with 9 additions and 9 deletions.
diff --git a/VERSION b/VERSION
@@ -1 +1 @@
-0.28.0
+0.28.1
diff --git a/scarf/assay.py b/scarf/assay.py
@@ -517,7 +517,7 @@ def iter_normed_feature_wise(
         )
         logger.debug("Will iterate over data of shape: ", data.shape)
         chunks = np.array_split(
-            np.arange(0, data.shape[1]), int(data.shape[1] / batch_size)
+            np.arange(0, data.shape[1]), max(1, int(data.shape[1] / batch_size))
         )
         for chunk in tqdmbar(chunks, desc=msg, total=len(chunks)):
             if as_dataframe:

diff --git a/scarf/datastore/datastore.py b/scarf/datastore/datastore.py
@@ -6,7 +6,7 @@
 from .mapping_datastore import MappingDatastore
 from ..writers import create_zarr_obj_array, create_zarr_dataset
 from ..utils import tqdmbar, controlled_compute, ZARRLOC
-from ..assay import RNAassay, ATACassay, ADTassay
+from ..assay import RNAassay, ATACassay
 from ..feat_utils import hto_demux
 
 __all__ = ["DataStore"]
@@ -948,7 +948,7 @@ def make_bulk(
             secondary_group_key: Name of the column in cell metadata table to be used for sub-grouping cells.
             aggr_type: Type of aggregation to be used. Can be either 'mean' or 'sum'. (Default value: 'mean')
             return_fraction: Return the fraction of cells expressing a gene in each group. (Default value: False)
-            feature_labels: The column in feature metadata table to use as row labels. (Default value: 'index')
+            feature_label: The column in feature metadata table to use as row labels. (Default value: 'index')
             pseudo_reps: Within each group, cells will randomly be split into `pseudo_reps` partitions. Each partition
                          is considered a pseudo-replicate. (Default value: 3)
             remove_empty_features: Remove features that are not expressed in any cell. (Default value: True)
@@ -958,8 +958,8 @@ def make_bulk(
             random_seed: A random values to set seed while creating `pseudo_reps` partitions cells randomly.
 
         Returns:
-            A pandas dataframe containing the bulk profile. If `return_fraction` is True, then a tuple of two dataframes is returned.
-            The second dataframe contains the fraction of cells expressing each feature in each group.
+            A pandas dataframe containing the bulk profile. If `return_fraction` is True, then a tuple of two dataframes
+            is returned. The second dataframe contains the fraction of cells expressing each feature in each group.
         """
 
         def make_reps(v, n_reps: int, seed: int) -> List[np.ndarray]:
@@ -1169,7 +1169,7 @@ def smart_label(
             for n, k in enumerate(j, start=1):
                 a = chr(ord("@") + n)
                 new_names[k] = f"{i}{a.lower()}"
-        
+
         missing_vals = list(set(df.index).difference(idxmax.unique()))
         if len(missing_vals) > 0:
             miss_idxmax = df.loc[missing_vals].idxmax(axis=1).to_dict()

diff --git a/scarf/writers.py b/scarf/writers.py
@@ -1141,11 +1141,11 @@ class ZarrMerge:
 
     def __init__(
         self,
-        zarr_path: str,
+        zarr_path: ZARRLOC,
         assays: list,
         names: List[str],
         merge_assay_name: str,
-        in_workspaces: Union[str, None] = None,
+        in_workspaces: Union[list[str], None] = None,
         out_workspace: Union[str, None] = None,
         chunk_size=(1000, 1000),
         dtype: Optional[str] = None,