Skip to content

Commit b8528f7

Browse files
[pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
1 parent bdbdb82 commit b8528f7

1 file changed

Lines changed: 32 additions & 31 deletions

File tree

use_cases/custom_dl/tiledb.ipynb

Lines changed: 32 additions & 31 deletions
Original file line numberDiff line numberDiff line change
@@ -85,20 +85,17 @@
8585
],
8686
"source": [
8787
"import warnings\n",
88-
"from typing import Any\n",
8988
"\n",
9089
"import cellxgene_census\n",
9190
"import numpy as np\n",
92-
"import pandas as pd\n",
9391
"import scanpy as sc\n",
9492
"import scvi\n",
9593
"import tiledbsoma as soma\n",
96-
"import tiledbsoma_ml\n",
97-
"import torch\n",
9894
"from cellxgene_census.experimental.pp import highly_variable_genes\n",
99-
"#from lightning import LightningDataModule\n",
100-
"#from sklearn.preprocessing import LabelEncoder\n",
101-
"#from torch.utils.data import DataLoader\n",
95+
"\n",
96+
"# from lightning import LightningDataModule\n",
97+
"# from sklearn.preprocessing import LabelEncoder\n",
98+
"# from torch.utils.data import DataLoader\n",
10299
"from scvi.dataloaders import TileDBDataModule\n",
103100
"\n",
104101
"warnings.filterwarnings(\"ignore\")"
@@ -142,11 +139,11 @@
142139
"outputs": [],
143140
"source": [
144141
"experiment_name = \"mus_musculus\"\n",
145-
"#obs_val_filt = 'is_primary_data == True and tissue_general in [\"spleen\", \"kidney\"] and nnz >= 500'\n",
142+
"# obs_val_filt = 'is_primary_data == True and tissue_general in [\"spleen\", \"kidney\"] and nnz >= 500'\n",
146143
"obs_val_filt = 'is_primary_data == True and tissue_general in [\"liver\"] and nnz >= 500'\n",
147-
"#obs_val_filt = 'is_primary_data == True and tissue_general in [\"liver\", \"heart\"] and nnz >= 500'\n",
144+
"# obs_val_filt = 'is_primary_data == True and tissue_general in [\"liver\", \"heart\"] and nnz >= 500'\n",
148145
"top_n_hvg = 500\n",
149-
"hvg_batch = [\"dataset_id\",\"donor_id\"]"
146+
"hvg_batch = [\"dataset_id\", \"donor_id\"]"
150147
]
151148
},
152149
{
@@ -171,7 +168,7 @@
171168
")\n",
172169
"hv = hvgs_df.highly_variable\n",
173170
"hv_idx = hv[hv].index\n",
174-
"#hv_idx = np.arange(10)"
171+
"# hv_idx = np.arange(10)"
175172
]
176173
},
177174
{
@@ -207,7 +204,7 @@
207204
"metadata": {},
208205
"outputs": [],
209206
"source": [
210-
"batch_keys = [\"dataset_id\",\"donor_id\"]"
207+
"batch_keys = [\"dataset_id\", \"donor_id\"]"
211208
]
212209
},
213210
{
@@ -242,11 +239,11 @@
242239
" batch_size=1024,\n",
243240
" shuffle=True,\n",
244241
" seed=42,\n",
245-
" batch_column_names = batch_keys,\n",
242+
" batch_column_names=batch_keys,\n",
246243
" dataloader_kwargs={\"num_workers\": 64, \"persistent_workers\": False},\n",
247244
" accelerator=\"gpu\",\n",
248245
" device=2,\n",
249-
" return_sparse_X=False\n",
246+
" return_sparse_X=False,\n",
250247
")\n",
251248
"print(datamodule.n_obs, datamodule.n_vars, datamodule.n_batch)"
252249
]
@@ -281,7 +278,12 @@
281278
"n_latent = 10\n",
282279
"datamodule.setup()\n",
283280
"model = scvi.model.SCVI(\n",
284-
" adata=None, registry=datamodule.registry ,n_layers=n_layers, n_latent=n_latent, gene_likelihood=\"nb\", encode_covariates=False\n",
281+
" adata=None,\n",
282+
" registry=datamodule.registry,\n",
283+
" n_layers=n_layers,\n",
284+
" n_latent=n_latent,\n",
285+
" gene_likelihood=\"nb\",\n",
286+
" encode_covariates=False,\n",
285287
")"
286288
]
287289
},
@@ -301,8 +303,7 @@
301303
"source": [
302304
"# creating the dataloader for trainset\n",
303305
"training_dataloader = (\n",
304-
" datamodule.on_before_batch_transfer(batch, None)\n",
305-
" for batch in datamodule.train_dataloader()\n",
306+
" datamodule.on_before_batch_transfer(batch, None) for batch in datamodule.train_dataloader()\n",
306307
")"
307308
]
308309
},
@@ -361,15 +362,16 @@
361362
],
362363
"source": [
363364
"import time\n",
365+
"\n",
364366
"start = time.time()\n",
365367
"model.train(\n",
366368
" datamodule=training_dataloader,\n",
367-
" #datamodule=datamodule,\n",
369+
" # datamodule=datamodule,\n",
368370
" max_epochs=10,\n",
369371
" batch_size=1024,\n",
370-
" #accelerator=\"gpu\",\n",
371-
" #devices=-1,\n",
372-
" #strategy=\"ddp_notebook_find_unused_parameters_true\",\n",
372+
" # accelerator=\"gpu\",\n",
373+
" # devices=-1,\n",
374+
" # strategy=\"ddp_notebook_find_unused_parameters_true\",\n",
373375
")\n",
374376
"end = time.time()\n",
375377
"print(f\"Elapsed time: {end - start:.2f} seconds\")"
@@ -610,7 +612,7 @@
610612
"source": [
611613
"sc.pp.neighbors(adata, use_rep=\"scvi\", key_added=\"scvi\")\n",
612614
"sc.tl.umap(adata, neighbors_key=\"scvi\")\n",
613-
"sc.pl.umap(adata, color=[\"dataset_id\",\"donor_id\"], title=\"SCVI\")"
615+
"sc.pl.umap(adata, color=[\"dataset_id\", \"donor_id\"], title=\"SCVI\")"
614616
]
615617
},
616618
{
@@ -641,7 +643,7 @@
641643
"metadata": {},
642644
"outputs": [],
643645
"source": [
644-
"#sc.pl.umap(adata, color=\"tissue_general\", title=\"SCVI\")"
646+
"# sc.pl.umap(adata, color=\"tissue_general\", title=\"SCVI\")"
645647
]
646648
},
647649
{
@@ -666,8 +668,7 @@
666668
"metadata": {},
667669
"outputs": [],
668670
"source": [
669-
"scvi.model.SCVI.setup_anndata(adata, \n",
670-
" batch_key=\"batch\")"
671+
"scvi.model.SCVI.setup_anndata(adata, batch_key=\"batch\")"
671672
]
672673
},
673674
{
@@ -676,7 +677,7 @@
676677
"metadata": {},
677678
"outputs": [],
678679
"source": [
679-
"#model_census3 = scvi.model.SCVI.load(\"census_model\", adata=adata)\n",
680+
"# model_census3 = scvi.model.SCVI.load(\"census_model\", adata=adata)\n",
680681
"model_census3 = scvi.model.SCVI(adata)"
681682
]
682683
},
@@ -769,7 +770,7 @@
769770
"source": [
770771
"sc.pp.neighbors(adata, use_rep=\"scvi_non_dataloder\", key_added=\"scvi_non_dataloder\")\n",
771772
"sc.tl.umap(adata, neighbors_key=\"scvi_non_dataloder\")\n",
772-
"sc.pl.umap(adata, color=[\"dataset_id\",\"donor_id\"], title=\"SCVI_non_dataloder\")"
773+
"sc.pl.umap(adata, color=[\"dataset_id\", \"donor_id\"], title=\"SCVI_non_dataloder\")"
773774
]
774775
},
775776
{
@@ -798,7 +799,7 @@
798799
"metadata": {},
799800
"outputs": [],
800801
"source": [
801-
"#sc.pl.umap(adata, color=\"tissue_general\", title=\"SCVI_non_dataloder\")"
802+
"# sc.pl.umap(adata, color=\"tissue_general\", title=\"SCVI_non_dataloder\")"
802803
]
803804
},
804805
{
@@ -945,7 +946,7 @@
945946
"metadata": {},
946947
"outputs": [],
947948
"source": [
948-
"#model_scanvi.save(\"census_model_scanvi\", save_anndata=False, overwrite=True, datamodule=datamodule_scanvi)"
949+
"# model_scanvi.save(\"census_model_scanvi\", save_anndata=False, overwrite=True, datamodule=datamodule_scanvi)"
949950
]
950951
},
951952
{
@@ -1037,7 +1038,7 @@
10371038
"source": [
10381039
"sc.pp.neighbors(adata, use_rep=\"scanvi\", key_added=\"scanvi\")\n",
10391040
"sc.tl.umap(adata, neighbors_key=\"scanvi\")\n",
1040-
"sc.pl.umap(adata, color=[\"dataset_id\",\"donor_id\"], title=\"SCANVI\")"
1041+
"sc.pl.umap(adata, color=[\"dataset_id\", \"donor_id\"], title=\"SCANVI\")"
10411042
]
10421043
},
10431044
{
@@ -1066,7 +1067,7 @@
10661067
"metadata": {},
10671068
"outputs": [],
10681069
"source": [
1069-
"#sc.pl.umap(adata, color=\"tissue_general\", title=\"SCANVI\")"
1070+
"# sc.pl.umap(adata, color=\"tissue_general\", title=\"SCANVI\")"
10701071
]
10711072
},
10721073
{

0 commit comments

Comments
 (0)