File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change 1111.venv /
1212.idea /
1313results /
14- logs /
14+ logs /
15+
16+ # AI rules
17+ CLAUDE.md
18+ AGENTS.md
Original file line number Diff line number Diff line change 66
77import logging
88import pathlib
9- import typing
109from enum import Enum
10+ from typing import Any , NamedTuple
1111
1212import pandas as pd
1313import polars as pl
2525log = logging .getLogger (__name__ )
2626
2727
28- class SizeLabel (typing . NamedTuple ):
28+ class SizeLabel (NamedTuple ):
2929 size : int
3030 label : str
3131 file_count : int
@@ -405,6 +405,17 @@ def __init__(self, dataset: DatasetManager):
405405 self ._cur = None
406406 self ._sub_idx = [0 for i in range (len (self ._ds .train_files ))] # iter num for each file
407407
def __getstate__(self):
    """Return a picklable snapshot of the instance attributes.

    The snapshot is a shallow copy of ``__dict__`` in which ``_cur`` is set
    to ``None``; the live instance itself is left untouched.
    """
    # ``_cur`` may hold the generator produced by ParquetFile.iter_batches(),
    # which cannot be pickled, so it is blanked out in the copy.
    return {**self.__dict__, "_cur": None}
414+
def __setstate__(self, state: Any):
    """Restore the instance attributes from an unpickled ``state`` mapping."""
    # Merge the saved attributes straight into the instance namespace.
    vars(self).update(state)
418+
def __iter__(self):
    """Return this object itself, which serves as its own iterator."""
    return self
410421
You can’t perform that action at this time.
0 commit comments