Skip to content

Commit 9d16650

Browse files
normalize strings
1 parent 86375dd commit 9d16650

34 files changed

Lines changed: 175 additions & 135 deletions

File tree

openproblems/api/hash.py

Lines changed: 6 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -46,8 +46,10 @@ def docker_token(image_name):
4646
[
4747
"curl",
4848
"--silent",
49-
f"https://auth.docker.io/token?scope=repository:{image_name}:"
50-
"pull&service=registry.docker.io",
49+
(
50+
f"https://auth.docker.io/token?scope=repository:{image_name}:"
51+
"pull&service=registry.docker.io"
52+
),
5153
]
5254
)
5355
)
@@ -88,8 +90,8 @@ def docker_hash(image_name):
8890
return docker_labels_from_api(image_name)["bio.openproblems.hash"]
8991
except Exception: # pragma: nocover
9092
warnings.warn(
91-
"Failed to access docker or the docker API; docker image hash failed. "
92-
f"All jobs using {image_name} will not be cached."
93+
"Failed to access docker or the docker API; docker image hash failed. All"
94+
f" jobs using {image_name} will not be cached."
9395
)
9496
return str(random.getrandbits(256))
9597

openproblems/data/tabula_muris_senis.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -29,8 +29,8 @@ def check_unknown_organs(datasets, organ_list):
2929
unknown_organs = set(organ_list) - known_organs
3030
if unknown_organs:
3131
raise ValueError(
32-
f"Unknown organs provided in `organ_list': {', '.join(unknown_organs)}. "
33-
f"Known organs are {', '.join(known_organs)}"
32+
f"Unknown organs provided in `organ_list': {', '.join(unknown_organs)}."
33+
f" Known organs are {', '.join(known_organs)}"
3434
)
3535

3636

@@ -107,8 +107,8 @@ def load_tabula_muris_senis(test=False, method_list=None, organ_list=None):
107107
unknown_methods = set(method_list) - set(["facs", "droplet"])
108108
if unknown_methods:
109109
raise ValueError(
110-
f"Unknown methods provided in `method_list': {','.join(unknown_methods)}. "
111-
"Known methods are `facs' and `droplet'"
110+
f"Unknown methods provided in `method_list': {','.join(unknown_methods)}."
111+
" Known methods are `facs' and `droplet'"
112112
)
113113

114114
datasets_path = f"/curation/v1/collections/{COLLECTION_ID}"

openproblems/patch.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -52,7 +52,7 @@ def _download_aftp(
5252
if timeout:
5353
wget_command_list += ["-T", str(timeout)]
5454

55-
log.debug("Running: %s" % (" ".join(wget_command_list)))
55+
log.debug("Running: %s" % " ".join(wget_command_list))
5656
subprocess.call(wget_command_list)
5757
return tmp_path
5858

openproblems/tasks/_batch_integration/_common/datasets/immune.py

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -9,9 +9,10 @@
99
dataset_name="Immune (by batch)",
1010
data_url=load_immune.metadata["data_url"],
1111
data_reference=load_immune.metadata["data_reference"],
12-
dataset_summary="Human immune cells from peripheral blood and bone marrow "
13-
"taken from 5 datasets comprising 10 batches across technologies (10X, "
14-
"Smart-seq2).",
12+
dataset_summary=(
13+
"Human immune cells from peripheral blood and bone marrow taken from 5 datasets"
14+
" comprising 10 batches across technologies (10X, Smart-seq2)."
15+
),
1516
image="openproblems",
1617
)
1718
def immune_batch(

openproblems/tasks/_batch_integration/_common/datasets/lung.py

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -9,8 +9,10 @@
99
dataset_name="Lung (Viera Braga et al.)",
1010
data_url=load_lung.metadata["data_url"],
1111
data_reference=load_lung.metadata["data_reference"],
12-
dataset_summary="Human lung scRNA-seq data from 3 datasets with 32,472 cells. "
13-
"From Vieira Braga et al. Technologies: 10X and Drop-seq.",
12+
dataset_summary=(
13+
"Human lung scRNA-seq data from 3 datasets with 32,472 cells. From Vieira Braga"
14+
" et al. Technologies: 10X and Drop-seq."
15+
),
1416
image="openproblems",
1517
)
1618
def lung_batch(

openproblems/tasks/_batch_integration/_common/datasets/pancreas.py

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -9,9 +9,10 @@
99
dataset_name="Pancreas (by batch)",
1010
data_url=load_pancreas.metadata["data_url"],
1111
data_reference=load_pancreas.metadata["data_reference"],
12-
dataset_summary="Human pancreatic islet scRNA-seq data from 6 datasets "
13-
"across technologies (CEL-seq, CEL-seq2, Smart-seq2, inDrop, Fluidigm C1, "
14-
"and SMARTER-seq).",
12+
dataset_summary=(
13+
"Human pancreatic islet scRNA-seq data from 6 datasets across technologies"
14+
" (CEL-seq, CEL-seq2, Smart-seq2, inDrop, Fluidigm C1, and SMARTER-seq)."
15+
),
1516
image="openproblems",
1617
)
1718
def pancreas_batch(

openproblems/tasks/_cell_cell_communication/cell_cell_communication_ligand_target/datasets/tnbc_wu2021.py

Lines changed: 6 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -10,11 +10,12 @@
1010
"Triple negative breast cancer atlas",
1111
data_url=load_tnbc_data.metadata["data_url"],
1212
data_reference=load_tnbc_data.metadata["data_reference"],
13-
dataset_summary="Human breast cancer atlas (Wu et al., 2021), "
14-
"with cytokine activities, inferred using a multivariate "
15-
"linear model with cytokine-focused signatures, as assumed true "
16-
"cell-cell communication (Dimitrov et al., 2022). "
17-
"42512 cells x 28078 features with 29 cell types from 10 patients",
13+
dataset_summary=(
14+
"Human breast cancer atlas (Wu et al., 2021), with cytokine activities,"
15+
" inferred using a multivariate linear model with cytokine-focused signatures,"
16+
" as assumed true cell-cell communication (Dimitrov et al., 2022). 42512 cells"
17+
" x 28078 features with 29 cell types from 10 patients"
18+
),
1819
image="openproblems-r-extras",
1920
)
2021
def tnbc_data(test=False):

openproblems/tasks/_cell_cell_communication/cell_cell_communication_source_target/datasets/allen_brain_atlas.py

Lines changed: 6 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -7,11 +7,12 @@
77
"Mouse brain atlas",
88
data_url=load_mouse_brain_atlas.metadata["data_url"],
99
data_reference=load_mouse_brain_atlas.metadata["data_reference"],
10-
dataset_summary="A murine brain atlas with adjacent cell types as assumed "
11-
"benchmark truth, inferred from deconvolution proportion "
12-
"correlations using matching 10x Visium slides "
13-
"(see Dimitrov et al., 2022). "
14-
"14249 cells x 34617 features with 23 cell type labels.",
10+
dataset_summary=(
11+
"A murine brain atlas with adjacent cell types as assumed benchmark truth,"
12+
" inferred from deconvolution proportion correlations using matching 10x Visium"
13+
" slides (see Dimitrov et al., 2022). 14249 cells x 34617 features with 23 cell"
14+
" type labels."
15+
),
1516
image="openproblems-r-extras",
1617
)
1718
def mouse_brain_atlas(test=False):

openproblems/tasks/denoising/datasets/pancreas.py

Lines changed: 5 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -7,10 +7,11 @@
77
dataset_name="Pancreas (inDrop)",
88
data_url=load_pancreas.metadata["data_url"],
99
data_reference=load_pancreas.metadata["data_reference"],
10-
dataset_summary="Human pancreatic islet scRNA-seq data from 6 datasets "
11-
"across technologies (CEL-seq, CEL-seq2, Smart-seq2, inDrop, Fluidigm C1, "
12-
"and SMARTER-seq). Here we just use the inDrop1 batch, which includes"
13-
"1937 cells × 15502 genes.",
10+
dataset_summary=(
11+
"Human pancreatic islet scRNA-seq data from 6 datasets across technologies"
12+
" (CEL-seq, CEL-seq2, Smart-seq2, inDrop, Fluidigm C1, and SMARTER-seq). Here"
13+
" we just use the inDrop1 batch, which includes1937 cells × 15502 genes."
14+
),
1415
image="openproblems-python-pytorch",
1516
)
1617
def pancreas(test=False):

openproblems/tasks/denoising/datasets/pbmc.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -8,8 +8,8 @@
88
data_url=load_tenx_1k_pbmc.metadata["data_url"],
99
data_reference=load_tenx_1k_pbmc.metadata["data_reference"],
1010
dataset_summary=(
11-
"1k Peripheral Blood Mononuclear Cells (PBMCs) from a healthy donor. "
12-
"Sequenced on 10X v3 chemistry in November 2018 by 10X Genomics."
11+
"1k Peripheral Blood Mononuclear Cells (PBMCs) from a healthy donor. Sequenced"
12+
" on 10X v3 chemistry in November 2018 by 10X Genomics."
1313
),
1414
image="openproblems-python-pytorch",
1515
)

0 commit comments

Comments
 (0)