Skip to content

Commit 36c9bdd

Browse files
committed
update disk file structure
1 parent d9c1a79 commit 36c9bdd

5 files changed

Lines changed: 22 additions & 22 deletions

File tree

src/pasteur/kedro/pipelines/dataset.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -29,7 +29,7 @@ def create_dataset_pipeline(
2929
for t in dataset.raw_tables
3030
]
3131
outputs += [
32-
D("typed", f"{dataset}.typed.{t}", ["orig", "typed", dataset, t], type="pq")
32+
D("typed", f"{dataset}.typed.{t}", ["ds", dataset, "typed", t], type="pq")
3333
for t in dataset.raw_tables
3434
]
3535
prefix = "typed."
@@ -49,7 +49,7 @@ def create_dataset_pipeline(
4949
]
5050

5151
outputs += [
52-
D("interim", f"{dataset}.{t}", ["orig", "interim", dataset, t], type="pq")
52+
D("interim", f"{dataset}.{t}", ["ds", dataset, "tables", t], type="pq")
5353
for t in tables
5454
]
5555
meta_tables = PipelineMeta(
@@ -72,7 +72,7 @@ def create_dataset_pipeline(
7272

7373
meta_keys = PipelineMeta(
7474
pipe,
75-
[D("keys", f"{dataset}.keys", ["orig", "keys", dataset])],
75+
[D("keys", f"{dataset}.keys", ["ds", dataset, "keys"])],
7676
)
7777

7878
return meta_tables + meta_keys

src/pasteur/kedro/pipelines/metrics.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -124,13 +124,13 @@ def _create_fit_pipeline(
124124
D(
125125
"measure",
126126
f"{view}.msr.{name}",
127-
["measure", "dataset", view, name, "metric"],
127+
['view', view, 'msr', name, "metric"],
128128
type="pkl",
129129
),
130130
D(
131131
"measure",
132132
f"{view}.msr.{name}_pre",
133-
["measure", "dataset", view, name, "pre"],
133+
['view', view, 'msr', name, "pre"],
134134
type="pkl",
135135
),
136136
]
@@ -173,7 +173,7 @@ def _create_process_pipeline(
173173
D(
174174
"measure",
175175
f"{view}.{syn_split}.{name}_data",
176-
["synth", "measure", "dataset", view, name, "data"],
176+
['synth', view, syn_split, 'msr', name],
177177
type="pkl",
178178
versioned=True,
179179
),

src/pasteur/kedro/pipelines/synth.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -50,14 +50,14 @@ def create_synth_pipeline(
5050
D(
5151
"synth_models",
5252
f"{view}.{fr.name}.model",
53-
["synth", "models", f"{view}.{fr.name}"],
53+
["synth", view, fr.name, 'model'],
5454
versioned=True,
5555
type="pkl",
5656
),
5757
D(
5858
"synth_output",
5959
f"{view}.{fr.name}.enc",
60-
["synth", "enc", f"{view}.{fr.name}"],
60+
["synth", view, fr.name, 'enc'],
6161
versioned=True,
6262
type="multi",
6363
),

src/pasteur/kedro/pipelines/transform.py

Lines changed: 10 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -135,11 +135,11 @@ def create_fit_pipeline(
135135
return PipelineMeta(
136136
pipeline(trn_fit_nodes + enc_fit_nodes, tags=TAGS_TRANSFORM),
137137
[
138-
D("transformers", f"{view}.trn.{t}", ["views", "trn", view, t], type="pkl")
138+
D("transformers", f"{view}.trn.{t}", ["views", view, "trn", t], type="pkl")
139139
for t in view.tables
140140
]
141141
+ [
142-
D("encoders", f"{view}.enc.{enc}", ["views", "enc", view, enc], type="pkl")
142+
D("encoders", f"{view}.enc.{enc}", ["views", view, 'enc', enc], type="pkl")
143143
for enc in encs
144144
],
145145
)
@@ -177,21 +177,21 @@ def create_transform_pipeline(
177177
D(
178178
"split_transformed",
179179
f"{view}.{split}.ctx_{t}",
180-
["views", "ctx", f"{view}.{split}", t],
180+
["views", view, split, "ctx", t],
181181
)
182182
)
183183
outputs.append(
184184
D(
185185
"split_transformed",
186186
f"{view}.{split}.bst_{t}",
187-
["views", "bst", f"{view}.{split}", t],
187+
["views", view, split, "bst", t],
188188
)
189189
)
190190
outputs.append(
191191
D(
192192
"split_transformed",
193193
f"{view}.{split}.ids_{t}",
194-
["views", "ids", f"{view}.{split}", t],
194+
["views", view, split, "ids", t],
195195
)
196196
)
197197

@@ -218,7 +218,7 @@ def create_transform_pipeline(
218218
# FIXME: Pass proper layer properly, don't infer
219219
"synth_reencoded" if retransform else "split_encoded",
220220
f"{view}.{split}.{enc}",
221-
["synth" if retransform else "views", enc, f"{view}.{split}"],
221+
["synth" if retransform else "views", view, split],
222222
versioned=retransform,
223223
)
224224
)
@@ -272,26 +272,26 @@ def create_reverse_pipeline(view: View, alg: str, enc: str):
272272
D(
273273
"synth_decoded",
274274
f"{view}.{alg}.bst_{t}",
275-
["synth", "bst", f"{view}.{alg}", t],
275+
["synth", view, alg, "bst", t],
276276
versioned=True,
277277
),
278278
D(
279279
"synth_decoded",
280280
f"{view}.{alg}.ids_{t}",
281-
["synth", "ids", f"{view}.{alg}", t],
281+
["synth", view, alg, "ids", t],
282282
versioned=True,
283283
),
284284
D(
285285
"synth_decoded",
286286
f"{view}.{alg}.ctx_{t}",
287-
["synth", "ctx", f"{view}.{alg}", t],
287+
["synth", view, alg, "ctx", t],
288288
versioned=True,
289289
type="multi",
290290
),
291291
D(
292292
"synth_reversed",
293293
f"{view}.{alg}.{t}",
294-
["synth", "dec", f"{view}.{alg}", t],
294+
["synth", view, alg, 'tables', t],
295295
versioned=True,
296296
),
297297
]

src/pasteur/kedro/pipelines/views.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -60,7 +60,7 @@ def create_view_pipeline(view: View):
6060
]
6161
),
6262
[
63-
D("primary", f"{view}.view.{t}", ["views", "primary", view, t], type="pq")
63+
D("primary", f"{view}.view.{t}", ["view", view, "tables", t], type="pq")
6464
for t in view.tables
6565
],
6666
)
@@ -81,7 +81,7 @@ def create_meta_pipeline(view: View):
8181
],
8282
tags=TAGS_VIEW_META,
8383
),
84-
[D("metadata", f"{view}.metadata", ["views", "metadata", view], type="pkl")],
84+
[D("metadata", f"{view}.metadata", ["view", view, "metadata"], type="pkl")],
8585
)
8686

8787

@@ -121,7 +121,7 @@ def create_keys_pipeline(view: View, splits: list[str]):
121121

122122
return PipelineMeta(
123123
pipe,
124-
[D("keys", f"{view}.keys.{s}", ["views", "keys", view, s]) for s in splits],
124+
[D("keys", f"{view}.keys.{s}", ["view", view, "keys", s]) for s in splits],
125125
)
126126

127127

@@ -152,7 +152,7 @@ def create_filter_pipeline(view: View, splits: list[str]):
152152
namespace=view.name,
153153
),
154154
[
155-
D("splits", f"{view}.{s}.{t}", ["views", "primary", f"{view}.{s}", t])
155+
D("splits", f"{view}.{s}.{t}", ["views", view, s, 'tables', t])
156156
for t in tables
157157
for s in splits
158158
],

0 commit comments

Comments
 (0)