Diffsplat / src /data /utils /chunk_data_source.py
paulpanwang's picture
Upload folder using huggingface_hub
476e0f0 verified
raw
history blame
170 Bytes
# This is a pseudo class that collects data in chunks from HDFS.
class ParquetChunkDataSource:
    """Placeholder for a data source that collects data in chunks from HDFS.

    No data-loading logic is provided here; users are expected to supply
    their own implementation. Until they do, any attempt to instantiate
    this class fails.

    Raises:
        NotImplementedError: Always, on instantiation.
    """

    def __init__(self, *args, **kwargs) -> None:
        # Raise on instantiation rather than directly in the class body:
        # a class body executes at definition time, so a bare `raise` there
        # would make the module (and everything importing it) fail on import.
        # Accept arbitrary arguments so that every call signature reports
        # this error instead of a misleading TypeError.
        raise NotImplementedError("Please implement your own dataloading logic")