mt5-gigatrue-embmodtest / coreconfig.json
Plasmoxy's picture
End of training
8155e6e verified
{
"out_name": "mt5-gigatrue-embmodtest",
"remove_layers": false,
"model_archetype": "mt5",
"model_name": "../embedding_prune/mod",
"tokenizer_name": "../embedding_prune/mod",
"model_torch_dtype": "bfloat16",
"dataset_lang": "en",
"dataset_name": "Plasmoxy/gigatrue",
"cache_tokens": false,
"dataset_tokenized_cache_name": "gigatrue_tokenized_mt5_embmodtest-default_110-35",
"use_half_val_dataset": true,
"vocab_size": 160906,
"max_input_length": 110,
"max_target_length": 35,
"batch_size": 128,
"learning_rate": 0.0003,
"num_train_epochs": 1,
"pkg_versions": {
"optimum": "1.23.3",
"transformers": "4.45.2",
"openvino": "2024.6.0",
"nncf": "2.14.1",
"torch": "2.5.1",
"datasets": "3.2.0",
"peft": "0.13.3.dev0"
}
}