Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 0 additions & 4 deletions fast_llm/data/auto.py
Original file line number Diff line number Diff line change
Expand Up @@ -17,7 +17,3 @@
from fast_llm.data.preparator.dataset_discovery.config import DatasetDiscoveryConfig # isort: skip
from fast_llm.data.preparator.gpt_memmap.config import GPTMemmapDatasetPreparatorConfig # isort: skip
from fast_llm.data.sample.abstract import NullReaderConfig # isort: skip
from fast_llm.data.sample.language_model import LanguageModelReaderConfig # isort: skip
from fast_llm.data.sample.patch import PatchReaderConfig # isort: skip
from fast_llm.data.sample.range import RangeReaderConfig # isort: skip
from fast_llm.data.sample.token import TokenReaderConfig # isort: skip
6 changes: 6 additions & 0 deletions fast_llm/data/dataset/memmap.py
Original file line number Diff line number Diff line change
Expand Up @@ -28,6 +28,12 @@ def read_reader_config(path: pathlib.Path | str) -> MemmapIndexDatasetReaderConf
"""
Read the MemmapIndexDatasetReaderConfig from a memmap file.
"""
# Imported only for their side effect: importing these reader configs registers them in the dynamic class registry (hence the unused-import `noqa: F401` markers).
from fast_llm.data.sample.language_model import LanguageModelReaderConfig # noqa: F401
from fast_llm.data.sample.patch import PatchReaderConfig # noqa: F401
from fast_llm.data.sample.range import RangeReaderConfig # noqa: F401
from fast_llm.data.sample.token import TokenReaderConfig # noqa: F401

path = pathlib.Path(path) if isinstance(path, str) else path
with path.open("rb") as stream:
# Verify file type.
Expand Down
4 changes: 0 additions & 4 deletions fast_llm/data/preparator/dataset_discovery/__init__.py
Original file line number Diff line number Diff line change
@@ -1,4 +0,0 @@
from fast_llm.data.preparator.dataset_discovery.config import DatasetDiscoveryConfig
from fast_llm.data.preparator.dataset_discovery.prepare import DatasetDiscoveryPreparator

__all__ = ["DatasetDiscoveryConfig", "DatasetDiscoveryPreparator"]