mvi-ai-engine / train_language.py
Musombi's picture
Upload folder using huggingface_hub
c1e438c
from data.registry import DatasetRegistry
from data.loaders.language import LanguageTextLoader
# Create the dataset registry and register a language text loader that is
# constructed with the "data/raw/wikipedia" path.
registry = DatasetRegistry()
registry.register(
    LanguageTextLoader("data/raw/wikipedia"),
)

# Collect the "text" entry of every sample the registry returns.
# NOTE(review): presumably each sample is a dict-like record — confirm
# against DatasetRegistry.all_samples().
texts = [
    sample["text"]
    for sample in registry.all_samples()
]