gemma3-4b-it-qlora / trainer_log.jsonl
enapeace's picture
Upload folder using huggingface_hub
41ba510 verified
{"current_steps": 10, "total_steps": 408, "loss": 3.0445, "lr": 3.461538461538462e-05, "epoch": 0.049170251997541485, "percentage": 2.45, "elapsed_time": "0:01:04", "remaining_time": "0:42:49"}
{"current_steps": 20, "total_steps": 408, "loss": 1.2916, "lr": 4.997153995054481e-05, "epoch": 0.09834050399508297, "percentage": 4.9, "elapsed_time": "0:02:07", "remaining_time": "0:41:19"}
{"current_steps": 30, "total_steps": 408, "loss": 0.7916, "lr": 4.9797852029940475e-05, "epoch": 0.14751075599262448, "percentage": 7.35, "elapsed_time": "0:03:17", "remaining_time": "0:41:23"}
{"current_steps": 40, "total_steps": 408, "loss": 0.6026, "lr": 4.946738410462334e-05, "epoch": 0.19668100799016594, "percentage": 9.8, "elapsed_time": "0:04:27", "remaining_time": "0:41:00"}
{"current_steps": 50, "total_steps": 408, "loss": 0.563, "lr": 4.8982225499218236e-05, "epoch": 0.24585125998770743, "percentage": 12.25, "elapsed_time": "0:05:36", "remaining_time": "0:40:07"}
{"current_steps": 60, "total_steps": 408, "loss": 0.515, "lr": 4.834544354263534e-05, "epoch": 0.29502151198524895, "percentage": 14.71, "elapsed_time": "0:06:43", "remaining_time": "0:39:00"}
{"current_steps": 70, "total_steps": 408, "loss": 0.4954, "lr": 4.756106417542925e-05, "epoch": 0.3441917639827904, "percentage": 17.16, "elapsed_time": "0:07:47", "remaining_time": "0:37:38"}
{"current_steps": 80, "total_steps": 408, "loss": 0.5008, "lr": 4.6634046496506536e-05, "epoch": 0.3933620159803319, "percentage": 19.61, "elapsed_time": "0:08:52", "remaining_time": "0:36:25"}
{"current_steps": 90, "total_steps": 408, "loss": 0.4653, "lr": 4.55702514101058e-05, "epoch": 0.4425322679778734, "percentage": 22.06, "elapsed_time": "0:09:56", "remaining_time": "0:35:06"}
{"current_steps": 100, "total_steps": 408, "loss": 0.4553, "lr": 4.437640457127401e-05, "epoch": 0.49170251997541486, "percentage": 24.51, "elapsed_time": "0:11:05", "remaining_time": "0:34:08"}
{"current_steps": 110, "total_steps": 408, "loss": 0.4598, "lr": 4.306005386410986e-05, "epoch": 0.5408727719729564, "percentage": 26.96, "elapsed_time": "0:12:07", "remaining_time": "0:32:52"}
{"current_steps": 120, "total_steps": 408, "loss": 0.4462, "lr": 4.162952168161028e-05, "epoch": 0.5900430239704979, "percentage": 29.41, "elapsed_time": "0:13:15", "remaining_time": "0:31:48"}
{"current_steps": 130, "total_steps": 408, "loss": 0.4477, "lr": 4.009385230882235e-05, "epoch": 0.6392132759680393, "percentage": 31.86, "elapsed_time": "0:14:24", "remaining_time": "0:30:47"}
{"current_steps": 140, "total_steps": 408, "loss": 0.4339, "lr": 3.846275474196124e-05, "epoch": 0.6883835279655808, "percentage": 34.31, "elapsed_time": "0:15:27", "remaining_time": "0:29:35"}
{"current_steps": 150, "total_steps": 408, "loss": 0.4131, "lr": 3.674654130501011e-05, "epoch": 0.7375537799631223, "percentage": 36.76, "elapsed_time": "0:16:33", "remaining_time": "0:28:28"}
{"current_steps": 160, "total_steps": 408, "loss": 0.4455, "lr": 3.4956062451887664e-05, "epoch": 0.7867240319606638, "percentage": 39.22, "elapsed_time": "0:17:38", "remaining_time": "0:27:21"}
{"current_steps": 170, "total_steps": 408, "loss": 0.4217, "lr": 3.31026381663849e-05, "epoch": 0.8358942839582053, "percentage": 41.67, "elapsed_time": "0:18:46", "remaining_time": "0:26:16"}
{"current_steps": 180, "total_steps": 408, "loss": 0.4357, "lr": 3.119798639358291e-05, "epoch": 0.8850645359557467, "percentage": 44.12, "elapsed_time": "0:19:53", "remaining_time": "0:25:11"}
{"current_steps": 190, "total_steps": 408, "loss": 0.4287, "lr": 2.925414895523123e-05, "epoch": 0.9342347879532883, "percentage": 46.57, "elapsed_time": "0:20:59", "remaining_time": "0:24:04"}
{"current_steps": 200, "total_steps": 408, "loss": 0.4071, "lr": 2.7283415417473657e-05, "epoch": 0.9834050399508297, "percentage": 49.02, "elapsed_time": "0:22:04", "remaining_time": "0:22:57"}
{"current_steps": 210, "total_steps": 408, "loss": 0.3991, "lr": 2.5298245392254172e-05, "epoch": 1.029502151198525, "percentage": 51.47, "elapsed_time": "0:23:10", "remaining_time": "0:21:51"}
{"current_steps": 220, "total_steps": 408, "loss": 0.3927, "lr": 2.3311189763638598e-05, "epoch": 1.0786724031960664, "percentage": 53.92, "elapsed_time": "0:24:18", "remaining_time": "0:20:46"}
{"current_steps": 230, "total_steps": 408, "loss": 0.4027, "lr": 2.1334811337084555e-05, "epoch": 1.1278426551936078, "percentage": 56.37, "elapsed_time": "0:25:26", "remaining_time": "0:19:41"}
{"current_steps": 240, "total_steps": 408, "loss": 0.3817, "lr": 1.938160541334049e-05, "epoch": 1.1770129071911493, "percentage": 58.82, "elapsed_time": "0:26:31", "remaining_time": "0:18:34"}
{"current_steps": 250, "total_steps": 408, "loss": 0.3884, "lr": 1.746392078913122e-05, "epoch": 1.226183159188691, "percentage": 61.27, "elapsed_time": "0:27:38", "remaining_time": "0:17:28"}
{"current_steps": 260, "total_steps": 408, "loss": 0.3922, "lr": 1.559388168408906e-05, "epoch": 1.2753534111862324, "percentage": 63.73, "elapsed_time": "0:28:44", "remaining_time": "0:16:21"}
{"current_steps": 270, "total_steps": 408, "loss": 0.3902, "lr": 1.3783311087533724e-05, "epoch": 1.3245236631837738, "percentage": 66.18, "elapsed_time": "0:29:50", "remaining_time": "0:15:15"}
{"current_steps": 280, "total_steps": 408, "loss": 0.3771, "lr": 1.2043656009727161e-05, "epoch": 1.3736939151813152, "percentage": 68.63, "elapsed_time": "0:30:55", "remaining_time": "0:14:08"}
{"current_steps": 290, "total_steps": 408, "loss": 0.3926, "lr": 1.0385915110189057e-05, "epoch": 1.4228641671788567, "percentage": 71.08, "elapsed_time": "0:32:00", "remaining_time": "0:13:01"}
{"current_steps": 300, "total_steps": 408, "loss": 0.3903, "lr": 8.820569160630129e-06, "epoch": 1.4720344191763983, "percentage": 73.53, "elapsed_time": "0:33:05", "remaining_time": "0:11:54"}
{"current_steps": 310, "total_steps": 408, "loss": 0.3742, "lr": 7.357514782138896e-06, "epoch": 1.5212046711739398, "percentage": 75.98, "elapsed_time": "0:34:14", "remaining_time": "0:10:49"}
{"current_steps": 320, "total_steps": 408, "loss": 0.3701, "lr": 6.006001875556672e-06, "epoch": 1.5703749231714812, "percentage": 78.43, "elapsed_time": "0:35:21", "remaining_time": "0:09:43"}
{"current_steps": 330, "total_steps": 408, "loss": 0.3915, "lr": 4.7745751406263165e-06, "epoch": 1.6195451751690229, "percentage": 80.88, "elapsed_time": "0:36:27", "remaining_time": "0:08:37"}
{"current_steps": 340, "total_steps": 408, "loss": 0.3808, "lr": 3.6710200536492655e-06, "epoch": 1.668715427166564, "percentage": 83.33, "elapsed_time": "0:37:31", "remaining_time": "0:07:30"}
{"current_steps": 350, "total_steps": 408, "loss": 0.389, "lr": 2.702313645197685e-06, "epoch": 1.7178856791641057, "percentage": 85.78, "elapsed_time": "0:38:39", "remaining_time": "0:06:24"}
{"current_steps": 360, "total_steps": 408, "loss": 0.361, "lr": 1.87458038908081e-06, "epoch": 1.7670559311616472, "percentage": 88.24, "elapsed_time": "0:39:45", "remaining_time": "0:05:18"}
{"current_steps": 370, "total_steps": 408, "loss": 0.3957, "lr": 1.1930534814495824e-06, "epoch": 1.8162261831591886, "percentage": 90.69, "elapsed_time": "0:40:50", "remaining_time": "0:04:11"}
{"current_steps": 380, "total_steps": 408, "loss": 0.3894, "lr": 6.620417548456853e-07, "epoch": 1.8653964351567303, "percentage": 93.14, "elapsed_time": "0:41:58", "remaining_time": "0:03:05"}
{"current_steps": 390, "total_steps": 408, "loss": 0.3944, "lr": 2.8490243637487313e-07, "epoch": 1.9145666871542717, "percentage": 95.59, "elapsed_time": "0:43:01", "remaining_time": "0:01:59"}
{"current_steps": 400, "total_steps": 408, "loss": 0.3871, "lr": 6.401992223629694e-08, "epoch": 1.9637369391518131, "percentage": 98.04, "elapsed_time": "0:44:08", "remaining_time": "0:00:52"}
{"current_steps": 408, "total_steps": 408, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "0:45:03", "remaining_time": "0:00:00"}