# Settings grouped under the `data` section.
data:
  # Tokenizer selection for this section.
  tokenizer:
    # Which tokenizer implementation to use.
    # NOTE(review): presumably selects a Hugging Face-backed tokenizer;
    # confirm the accepted values against the consuming code.
    name: huggingface
    # Identifier handed to that tokenizer implementation.
    # NOTE(review): looks like a Hugging Face Hub repo id rather than a
    # local filesystem path; confirm.
    path: bigscience/bloom