scdataloader 2.0.12__tar.gz → 2.1.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: scdataloader
3
- Version: 2.0.12
3
+ Version: 2.1.0
4
4
  Summary: a dataloader for single cell data in lamindb
5
5
  Project-URL: repository, https://github.com/jkobject/scDataLoader
6
6
  Author-email: jkobject <jkobject@gmail.com>
@@ -14,7 +14,7 @@ Requires-Dist: cellxgene-census>=0.1.0
14
14
  Requires-Dist: django>=4.0.0
15
15
  Requires-Dist: ipykernel>=6.20.0
16
16
  Requires-Dist: jupytext>=1.16.0
17
- Requires-Dist: lamindb[gcp]==2.0.1
17
+ Requires-Dist: lamindb[gcp]==2.1.1
18
18
  Requires-Dist: leidenalg>=0.8.0
19
19
  Requires-Dist: lightning>=2.3.0
20
20
  Requires-Dist: matplotlib>=3.5.0
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "scdataloader"
3
- version = "2.0.12"
3
+ version = "2.1.0"
4
4
  description = "a dataloader for single cell data in lamindb"
5
5
  authors = [
6
6
  {name = "jkobject", email = "jkobject@gmail.com"}
@@ -11,7 +11,7 @@ requires-python = ">=3.10,<3.13"
11
11
  keywords = ["scRNAseq", "dataloader", "pytorch", "lamindb", "scPRINT"]
12
12
  dependencies = [
13
13
  "numpy<=2.2.0",
14
- "lamindb[gcp]==2.0.1",
14
+ "lamindb[gcp]==2.1.1",
15
15
  "cellxgene-census>=0.1.0",
16
16
  "torch>=2.2.0",
17
17
  "pytorch-lightning>=2.3.0",
@@ -264,8 +264,9 @@ class Preprocessor:
264
264
  # For genes that are already ENS IDs, use them directly
265
265
  prev_size = adata.shape[1]
266
266
  # Handle symbol genes
267
+ cols_to_use = adata.var.columns.difference(genesdf.columns)
267
268
  if self.is_symbol:
268
- new_var = adata.var.merge(
269
+ new_var = adata.var[cols_to_use].merge(
269
270
  genesdf.drop_duplicates("symbol").set_index("symbol", drop=False),
270
271
  left_index=True,
271
272
  right_index=True,
@@ -275,7 +276,7 @@ class Preprocessor:
275
276
  adata = adata[:, new_var.index]
276
277
  new_var.index = new_var["ensembl_gene_id"]
277
278
  else:
278
- new_var = adata.var.merge(
279
+ new_var = adata.var[cols_to_use].merge(
279
280
  genesdf, left_index=True, right_index=True, how="inner"
280
281
  )
281
282
  adata = adata[:, new_var.index]
@@ -440,6 +440,7 @@ def load_genes(
440
440
  "ncbi_gene_ids",
441
441
  "synonyms",
442
442
  "description",
443
+ "abbr",
443
444
  ]:
444
445
  if col in organismdf.columns:
445
446
  organismdf.drop(columns=[col], inplace=True)
File without changes
File without changes
File without changes