-
Notifications
You must be signed in to change notification settings - Fork 8
Expand file tree
/
Copy pathdataset_info.json
More file actions
90 lines (90 loc) · 9.11 KB
/
dataset_info.json
File metadata and controls
90 lines (90 loc) · 9.11 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
[
{
"dataset_id": "openproblems_neurips2022/pbmc_multiome/swap",
"dataset_name": "OpenProblems NeurIPS2022 Multiome (ATAC2GEX)",
"dataset_summary": "Single-cell Multiome (GEX+ATAC) data collected from bone marrow mononuclear cells of 12 healthy human donors.",
"dataset_description": "Single-cell CITE-Seq data collected from bone marrow mononuclear cells of 12 healthy human donors using the 10X Multiome Gene Expression and Chromatin Accessibility kit. The dataset was generated to support Multimodal Single-Cell Data Integration Challenge at NeurIPS 2022. Samples were prepared using a standard protocol at four sites. The resulting data was then annotated to identify cell types and remove doublets. The dataset was designed with a nested batch layout such that some donor samples were measured at multiple sites with some donors measured at a single site.",
"data_reference": "lance2024predicting",
"data_url": "https://www.kaggle.com/competitions/open-problems-multimodal/data",
"date_created": "09-01-2025",
"file_size": 18717069,
"common_dataset_id": "openproblems_neurips2022/pbmc_multiome"
},
{
"dataset_id": "openproblems_neurips2021/bmmc_multiome/swap",
"dataset_name": "NeurIPS2021 Multiome (ATAC2GEX)",
"dataset_summary": "Single-cell Multiome (GEX+ATAC) data collected from bone marrow mononuclear cells of 12 healthy human donors.",
"dataset_description": "Single-cell CITE-Seq data collected from bone marrow mononuclear cells of 12 healthy human donors using the 10X Multiome Gene Expression and Chromatin Accessibility kit. The dataset was generated to support Multimodal Single-Cell Data Integration Challenge at NeurIPS 2021. Samples were prepared using a standard protocol at four sites. The resulting data was then annotated to identify cell types and remove doublets. The dataset was designed with a nested batch layout such that some donor samples were measured at multiple sites with some donors measured at a single site.",
"data_reference": "luecken2021neurips",
"data_url": "https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE194122",
"date_created": "09-01-2025",
"file_size": 7883109,
"common_dataset_id": "openproblems_neurips2021/bmmc_multiome"
},
{
"dataset_id": "openproblems_neurips2021/bmmc_cite/normal",
"dataset_name": "NeurIPS2021 CITE-Seq (GEX2ADT)",
"dataset_summary": "Single-cell CITE-Seq (GEX+ADT) data collected from bone marrow mononuclear cells of 12 healthy human donors.",
"dataset_description": "Single-cell CITE-Seq data collected from bone marrow mononuclear cells of 12 healthy human donors using the 10X 3 prime Single-Cell Gene Expression kit with Feature Barcoding in combination with the BioLegend TotalSeq B Universal Human Panel v1.0. The dataset was generated to support Multimodal Single-Cell Data Integration Challenge at NeurIPS 2021. Samples were prepared using a standard protocol at four sites. The resulting data was then annotated to identify cell types and remove doublets. The dataset was designed with a nested batch layout such that some donor samples were measured at multiple sites with some donors measured at a single site.",
"data_reference": "luecken2021neurips",
"data_url": "https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE194122",
"date_created": "09-01-2025",
"file_size": 704994,
"common_dataset_id": "openproblems_neurips2021/bmmc_cite"
},
{
"dataset_id": "openproblems_neurips2022/pbmc_cite/normal",
"dataset_name": "OpenProblems NeurIPS2022 CITE-Seq (GEX2ADT)",
"dataset_summary": "Single-cell CITE-Seq (GEX+ADT) data collected from bone marrow mononuclear cells of 12 healthy human donors.",
"dataset_description": "Single-cell CITE-Seq data collected from bone marrow mononuclear cells of 12 healthy human donors using the 10X 3 prime Single-Cell Gene Expression kit with Feature Barcoding in combination with the BioLegend TotalSeq B Universal Human Panel v1.0. The dataset was generated to support Multimodal Single-Cell Data Integration Challenge at NeurIPS 2022. Samples were prepared using a standard protocol at four sites. The resulting data was then annotated to identify cell types and remove doublets. The dataset was designed with a nested batch layout such that some donor samples were measured at multiple sites with some donors measured at a single site.",
"data_reference": "lance2024predicting",
"data_url": "https://www.kaggle.com/competitions/open-problems-multimodal/data",
"date_created": "09-01-2025",
"file_size": 591886,
"common_dataset_id": "openproblems_neurips2022/pbmc_cite"
},
{
"dataset_id": "openproblems_neurips2022/pbmc_cite/swap",
"dataset_name": "OpenProblems NeurIPS2022 CITE-Seq (ADT2GEX)",
"dataset_summary": "Single-cell CITE-Seq (GEX+ADT) data collected from bone marrow mononuclear cells of 12 healthy human donors.",
"dataset_description": "Single-cell CITE-Seq data collected from bone marrow mononuclear cells of 12 healthy human donors using the 10X 3 prime Single-Cell Gene Expression kit with Feature Barcoding in combination with the BioLegend TotalSeq B Universal Human Panel v1.0. The dataset was generated to support Multimodal Single-Cell Data Integration Challenge at NeurIPS 2022. Samples were prepared using a standard protocol at four sites. The resulting data was then annotated to identify cell types and remove doublets. The dataset was designed with a nested batch layout such that some donor samples were measured at multiple sites with some donors measured at a single site.",
"data_reference": "lance2024predicting",
"data_url": "https://www.kaggle.com/competitions/open-problems-multimodal/data",
"date_created": "09-01-2025",
"file_size": 32551804,
"common_dataset_id": "openproblems_neurips2022/pbmc_cite"
},
{
"dataset_id": "openproblems_neurips2021/bmmc_cite/swap",
"dataset_name": "NeurIPS2021 CITE-Seq (ADT2GEX)",
"dataset_summary": "Single-cell CITE-Seq (GEX+ADT) data collected from bone marrow mononuclear cells of 12 healthy human donors.",
"dataset_description": "Single-cell CITE-Seq data collected from bone marrow mononuclear cells of 12 healthy human donors using the 10X 3 prime Single-Cell Gene Expression kit with Feature Barcoding in combination with the BioLegend TotalSeq B Universal Human Panel v1.0. The dataset was generated to support Multimodal Single-Cell Data Integration Challenge at NeurIPS 2021. Samples were prepared using a standard protocol at four sites. The resulting data was then annotated to identify cell types and remove doublets. The dataset was designed with a nested batch layout such that some donor samples were measured at multiple sites with some donors measured at a single site.",
"data_reference": "luecken2021neurips",
"data_url": "https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE194122",
"date_created": "09-01-2025",
"file_size": 13467880,
"common_dataset_id": "openproblems_neurips2021/bmmc_cite"
},
{
"dataset_id": "openproblems_neurips2022/pbmc_multiome/normal",
"dataset_name": "OpenProblems NeurIPS2022 Multiome (GEX2ATAC)",
"dataset_summary": "Single-cell Multiome (GEX+ATAC) data collected from bone marrow mononuclear cells of 12 healthy human donors.",
"dataset_description": "Single-cell CITE-Seq data collected from bone marrow mononuclear cells of 12 healthy human donors using the 10X Multiome Gene Expression and Chromatin Accessibility kit. The dataset was generated to support Multimodal Single-Cell Data Integration Challenge at NeurIPS 2022. Samples were prepared using a standard protocol at four sites. The resulting data was then annotated to identify cell types and remove doublets. The dataset was designed with a nested batch layout such that some donor samples were measured at multiple sites with some donors measured at a single site.",
"data_reference": "lance2024predicting",
"data_url": "https://www.kaggle.com/competitions/open-problems-multimodal/data",
"date_created": "09-01-2025",
"file_size": 4322721,
"common_dataset_id": "openproblems_neurips2022/pbmc_multiome"
},
{
"dataset_id": "openproblems_neurips2021/bmmc_multiome/normal",
"dataset_name": "NeurIPS2021 Multiome (GEX2ATAC)",
"dataset_summary": "Single-cell Multiome (GEX+ATAC) data collected from bone marrow mononuclear cells of 12 healthy human donors.",
"dataset_description": "Single-cell CITE-Seq data collected from bone marrow mononuclear cells of 12 healthy human donors using the 10X Multiome Gene Expression and Chromatin Accessibility kit. The dataset was generated to support Multimodal Single-Cell Data Integration Challenge at NeurIPS 2021. Samples were prepared using a standard protocol at four sites. The resulting data was then annotated to identify cell types and remove doublets. The dataset was designed with a nested batch layout such that some donor samples were measured at multiple sites with some donors measured at a single site.",
"data_reference": "luecken2021neurips",
"data_url": "https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE194122",
"date_created": "09-01-2025",
"file_size": 31080807,
"common_dataset_id": "openproblems_neurips2021/bmmc_multiome"
}
]