aicang-22B / training_log.json
Dogge's picture
Upload 6 files
82b71e4
raw
history blame contribute delete
459 Bytes
{
"base_model_name": "grimpep_L2-MythoMax22b-instruct-Falseblock",
"base_model_class": "LlamaForCausalLM",
"base_loaded_in_4bit": true,
"base_loaded_in_8bit": false,
"projections": "q, v",
"loss": 1.3766,
"learning_rate": 0.0,
"epoch": 2.53,
"current_steps": 451,
"train_runtime": 998.8868,
"train_samples_per_second": 2.274,
"train_steps_per_second": 0.015,
"total_flos": 3.2187033092358144e+16,
"train_loss": 1.9135538736979167
}