from torch.utils.data.datapipes.datapipe import DataChunk
from torch.utils.data.datapipes.dataframe import dataframe_wrapper as df_wrapper

__all__ = ["DataChunkDF"]


class DataChunkDF(DataChunk):
    """
    A DataChunk whose stored items are DataFrame containers.

    Iterating over the chunk yields the individual records found inside each
    stored DataFrame rather than the DataFrames themselves. To access the
    DataFrames, use `raw_iterator`.
    """

    def __iter__(self):
        # Walk the stored frames in order and delegate record iteration to
        # the configured dataframe wrapper.
        for frame in self.items:
            yield from df_wrapper.iterate(frame)

    def __len__(self):
        # The chunk length is the combined length of every stored frame,
        # as reported by the dataframe wrapper (0 when there are no frames).
        return sum(df_wrapper.get_len(frame) for frame in self.items)