|
| 1 | +type: file |
| 2 | +example: "resources_test/task_ist_preprocessing/mouse_brain_combined/spatial_processed_complete.zarr" |
| 3 | +label: "Spatial Processed Complete" |
| 4 | +summary: A spatial transcriptomics dataset that includes all raw and processed data. |
| 5 | +description: | |
| 6 | + This dataset contains images, transcript points with assigned cell IDs, and an AnnData table with processed counts and cell type annotations. |
| 7 | + |
| 8 | +info: |
| 9 | + format: |
| 10 | + type: spatialdata_zarr |
| 11 | + images: |
| 12 | + - type: object |
| 13 | + name: image |
| 14 | + description: The raw image data |
| 15 | + required: true |
| 16 | + - type: object |
| 17 | + name: image_3D |
| 18 | + description: The raw 3D image data |
| 19 | + required: false |
| 20 | + - type: object |
| 21 | + name: he_image |
| 22 | + description: H&E image data |
| 23 | + required: false |
| 24 | + points: |
| 25 | + - type: dataframe |
| 26 | + name: transcripts |
| 27 | + description: Point cloud data of transcripts |
| 28 | + required: true |
| 29 | + columns: |
| 30 | + - type: float |
| 31 | + name: "x" |
| 32 | + required: true |
| 33 | + description: x-coordinate of the point |
| 34 | + - type: float |
| 35 | + name: "y" |
| 36 | + required: true |
| 37 | + description: y-coordinate of the point |
| 38 | + - type: float |
| 39 | + name: "z" |
| 40 | + required: false |
| 41 | + description: z-coordinate of the point |
| 42 | + - type: categorical |
| 43 | + name: feature_name |
| 44 | + required: true |
| 45 | + description: Name of the feature |
| 46 | + - type: integer |
| 47 | + name: "cell_id" |
| 48 | + required: true |
| 49 | + description: Unique identifier of the cell |
| 50 | + - type: long |
| 51 | + name: transcript_id |
| 52 | + required: true |
| 53 | + description: Unique identifier of the transcript |
| 54 | + shapes: |
| 55 | + - type: dataframe |
| 56 | + name: "cell_boundaries" |
| 57 | + description: Cell boundaries |
| 58 | + required: false |
| 59 | + columns: |
| 60 | + - type: object |
| 61 | + name: "geometry" |
| 62 | + required: true |
| 63 | + description: Geometry of the cell boundary |
| 64 | + tables: |
| 65 | + - type: anndata |
| 66 | + name: "counts" |
| 67 | + description: Counts of the transcripts |
| 68 | + required: true |
| 69 | + layers: |
| 70 | + - type: integer |
| 71 | + name: counts |
| 72 | + description: Raw counts |
| 73 | + required: true |
| 74 | + - type: integer |
| 75 | + name: normalized |
| 76 | + description: Normalized counts |
| 77 | + required: true |
| 78 | + - type: double |
| 79 | + name: normalized_uncorrected |
| 80 | + description: Uncorrected normalized expression |
| 81 | + required: false |
| 82 | + obs: |
| 83 | + - type: string |
| 84 | + name: cell_id |
| 85 | + description: Unique identifier for the cell (from assignment step) |
| 86 | + required: true |
| 87 | + - type: string |
| 88 | + name: centroid_x |
| 89 | + description: X coordinate of the cell centroid |
| 90 | + required: true |
| 91 | + - type: string |
| 92 | + name: centroid_y |
| 93 | + description: Y coordinate of the cell centroid |
| 94 | + required: true |
| 95 | + - type: string |
| 96 | + name: centroid_z |
| 97 | + description: Z coordinate of the cell centroid |
| 98 | + required: false |
| 99 | + - type: string |
| 100 | + name: n_counts |
| 101 | + description: Number of counts in the cell |
| 102 | + required: true |
| 103 | + - type: string |
| 104 | + name: n_genes |
| 105 | + description: Number of genes in the cell |
| 106 | + required: true |
| 107 | + - type: string |
| 108 | + name: volume |
| 109 | + description: Volume of the cell |
| 110 | + required: true |
| 111 | + - type: string |
| 112 | + name: cell_type |
| 113 | + description: Cell type of the cell |
| 114 | + required: true |
| 115 | + var: |
| 116 | + - type: string |
| 117 | + name: gene_name |
| 118 | + description: Name of the gene |
| 119 | + required: true |
| 120 | + - type: string |
| 121 | + name: n_counts |
| 122 | + description: Number of counts of the gene |
| 123 | + required: true |
| 124 | + - type: string |
| 125 | + name: n_cells |
| 126 | + description: Number of cells expressing the gene |
| 127 | + required: true |
| 128 | + - type: anndata |
| 129 | + name: "metadata" |
| 130 | + description: Metadata of spatial dataset |
| 131 | + required: true |
| 132 | + uns: |
| 133 | + - type: string |
| 134 | + name: dataset_id |
| 135 | + required: true |
| 136 | + description: A unique identifier for the dataset |
| 137 | + - type: string |
| 138 | + name: dataset_name |
| 139 | + required: true |
| 140 | + description: A human-readable name for the dataset |
| 141 | + - type: string |
| 142 | + name: dataset_url |
| 143 | + required: true |
| 144 | + description: Link to the original source of the dataset |
| 145 | + - type: string |
| 146 | + name: dataset_reference |
| 147 | + required: true |
| 148 | + description: BibTeX reference of the paper in which the dataset was published |
| 149 | + - type: string |
| 150 | + name: dataset_summary |
| 151 | + required: true |
| 152 | + description: Short description of the dataset |
| 153 | + - type: string |
| 154 | + name: dataset_description |
| 155 | + required: true |
| 156 | + description: Long description of the dataset |
| 157 | + - type: string |
| 158 | + name: dataset_organism |
| 159 | + required: true |
| 160 | + description: The organism of the sample in the dataset |
| 161 | + - type: string |
| 162 | + name: segmentation_id |
| 163 | + required: true |
| 164 | + multiple: true |
| 165 | + description: A unique identifier for the segmentation |
| 166 | + obs: |
| 167 | + - type: string |
| 168 | + name: cell_id |
| 169 | + required: true |
| 170 | + description: A unique identifier for the cell |
| 171 | + var: |
| 172 | + - type: string |
| 173 | + name: gene_ids |
| 174 | + required: true |
| 175 | + description: Unique identifier for the gene |
| 176 | + - type: string |
| 177 | + name: feature_types |
| 178 | + required: true |
| 179 | + description: Type of the feature |
| 180 | + obsm: |
| 181 | + - type: double |
| 182 | + name: spatial |
| 183 | + required: true |
| 184 | + description: Spatial coordinates of the cell |
| 185 | + coordinate_systems: |
| 186 | + - type: object |
| 187 | + name: global |
| 188 | + description: Coordinate system of the replicate |
| 189 | + required: true |
0 commit comments