moPPIt-v2 / configs /data /text8.yaml
AlienChen's picture
Upload 106 files
c4b1fea verified
Raw
History Blame Contribute Delete
260 Bytes
# Data configuration selecting the text8 dataset for both the train and
# validation splits, with the matching text8 tokenizer.
# TODO: When using this dataset, set model.length = 256 to match the D3PM setup.
train: text8
valid: text8
tokenizer_name_or_path: text8
# NOTE(review): absolute path that looks machine/user-specific; presumably it
# has to be overridden when running outside the original environment -- confirm.
cache_dir: /share/kuleshov/ssahoo/textdiffusion/data
# Boolean flags, written in canonical lowercase form (`true` / `false`).
wrap: true
streaming: false
override_cache: false
add_special_tokens: false