bedapub · bhoellbacher · Nov 6, 2024 · Nov 6, 2024 · Nov 7, 2024 · Nov 8, 2024
diff --git a/besca/Import/_read.py b/besca/Import/_read.py
@@ -107,7 +107,7 @@ def assert_adata(adata: AnnData, attempFix=True):
 
 
 def read_mtx(
-    filepath, annotation=True, use_genes="SYMBOL", species="human", citeseq=None
+    filepath, annotation=True, use_genes="SYMBOL", species="human", citeseq=None, read_cache=True
 ):
     """Read matrix.mtx, genes.tsv, barcodes.tsv to AnnData object.
     By specifiying an input folder this function reads the contained matrix.mtx,
@@ -129,6 +129,9 @@ def read_mtx(
     citeseq: 'gex_only' or 'citeseq_only' or False or None | default = None
         string indicating if only gene expression values (gex_only) or only protein
         expression values ('citeseq_only') or everything is read if None is specified
+    read_cache: `bool` (default=True)
+        boolean flag indicating whether scanpy should read the AnnData object
+        from its fast h5ad cache (True) or from the source files (False)
 
     Returns
     -------
@@ -138,7 +141,7 @@ def read_mtx(
     if gzfiles == "gz":
         print("reading matrix.mtx.gz")
         adata = read(
-            os.path.join(filepath, "matrix.mtx.gz"), cache=True
+            os.path.join(filepath, "matrix.mtx.gz"), cache=read_cache
         ).T  # transpose the data
         print("adding cell barcodes")
         adata.obs_names = pd.read_csv(
@@ -155,7 +158,7 @@ def read_mtx(
     else:
         print("reading matrix.mtx")
         adata = read(
-            os.path.join(filepath, "matrix.mtx"), cache=True
+            os.path.join(filepath, "matrix.mtx"), cache=read_cache
         ).T  # transpose the data
         print("adding cell barcodes")
         adata.obs_names = pd.read_csv(

diff --git a/besca/pp/_normalization.py b/besca/pp/_normalization.py
@@ -1,5 +1,6 @@
 import numpy as np
 from scipy.sparse.csr import csr_matrix
+from scipy.sparse._csc import csc_matrix
 from anndata._core.views import SparseCSRView
 
 def closure(mat):
@@ -180,6 +181,9 @@ def normalize_geometric(adata):
     # need to add a catch for newly encountered datatype
     elif type(X) == SparseCSRView:
         X = X.todense()
+    # need to add a catch for new sparse matrix datatype
+    elif type(X) == csc_matrix:
+        X = X.todense()
 
     # ensure that X is an array otherwise this will cause type issue with multiplicative replacement function
     X = np.array(X)

diff --git a/workbooks/standard_workflow_besca2.ipynb b/workbooks/standard_workflow_besca2.ipynb
@@ -760,7 +760,7 @@
     "        n_prots = len(adata_prot.var_names)\n",
     "        percent_top = (int(round(0.01*n_prots, 0)) if int(round(0.01*n_prots, 0)) >= 1 else 1, int(round(0.1*n_prots, 0)), int(round(0.25*n_prots, 0)))\n",
     "        qc_adata = sc.pp.calculate_qc_metrics(adata_prot, percent_top=percent_top, var_type=\"antibodies\", inplace=False)\n",
-    "        fig = sns.jointplot(\"log1p_total_counts\", \"n_antibodies_by_counts\", qc_adata[0], kind=\"hex\", norm=mpl.colors.LogNorm())\n",
+    "        fig = sns.jointplot(x=\"log1p_total_counts\", y=\"n_antibodies_by_counts\", data=qc_adata[0], kind=\"hex\", norm=mpl.colors.LogNorm())\n",
     "        fig.savefig(os.path.join(results_folder_citeseq, 'citeseq', 'figures', 'CITESEQ_QC_plot.png'))\n",
     "        \n",
     "        #generate overview of n_counts\n",