chatdoco_model2_lora / training_log.json
smartrichard's picture
Upload 7 files
02312c0 verified
raw
history blame contribute delete
439 Bytes
{
"base_model_name": "Llama-2-7b-chat-hf",
"base_model_class": "LlamaForCausalLM",
"base_loaded_in_4bit": true,
"base_loaded_in_8bit": false,
"projections": "q, v",
"loss": 1.3806,
"learning_rate": 0.0,
"epoch": 10.0,
"current_steps": 280293,
"train_runtime": 197834.3533,
"train_samples_per_second": 5.67,
"train_steps_per_second": 0.044,
"total_flos": 5.831723715554968e+18,
"train_loss": 1.4700200526681664
}