lillian039 commited on
Commit
b4dbcb3
·
verified ·
1 Parent(s): e2948f0

Training in progress, step 50

Browse files
Files changed (4) hide show
  1. config.json +1 -1
  2. model.safetensors +1 -1
  3. trainer_log.jsonl +44 -12
  4. training_args.bin +2 -2
config.json CHANGED
@@ -30,7 +30,7 @@
30
  "sliding_window": 32768,
31
  "tie_word_embeddings": true,
32
  "torch_dtype": "bfloat16",
33
- "transformers_version": "4.51.3",
34
  "use_cache": false,
35
  "use_sliding_window": false,
36
  "video_token_id": 151656,
 
30
  "sliding_window": 32768,
31
  "tie_word_embeddings": true,
32
  "torch_dtype": "bfloat16",
33
+ "transformers_version": "4.50.0",
34
  "use_cache": false,
35
  "use_sliding_window": false,
36
  "video_token_id": 151656,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2fc866e2d1d97c35473e3ae83853bc884a4bcef89c0077e570496c76de4f9e8b
3
  size 4418050848
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a21ee6c8112d95db7f5afd08444efdc37d75c25235187d0d16f1b73b8d358745
3
  size 4418050848
trainer_log.jsonl CHANGED
@@ -1,12 +1,44 @@
1
- {"current_steps": 110, "total_steps": 1266, "loss": 0.0228, "lr": 8.582677165354332e-06, "epoch": 0.26066350710900477, "percentage": 8.69, "elapsed_time": "0:08:04", "remaining_time": "1:24:51"}
2
- {"current_steps": 120, "total_steps": 1266, "loss": 0.0232, "lr": 9.370078740157481e-06, "epoch": 0.2843601895734597, "percentage": 9.48, "elapsed_time": "0:15:54", "remaining_time": "2:31:51"}
3
- {"current_steps": 130, "total_steps": 1266, "loss": 0.0236, "lr": 9.999923923382317e-06, "epoch": 0.3080568720379147, "percentage": 10.27, "elapsed_time": "0:23:41", "remaining_time": "3:26:59"}
4
- {"current_steps": 140, "total_steps": 1266, "loss": 0.0226, "lr": 9.997261484836916e-06, "epoch": 0.33175355450236965, "percentage": 11.06, "elapsed_time": "0:31:33", "remaining_time": "4:13:46"}
5
- {"current_steps": 150, "total_steps": 1266, "loss": 0.0207, "lr": 9.990797530151441e-06, "epoch": 0.35545023696682465, "percentage": 11.85, "elapsed_time": "0:39:21", "remaining_time": "4:52:46"}
6
- {"current_steps": 160, "total_steps": 1266, "loss": 0.0198, "lr": 9.980536976584711e-06, "epoch": 0.3791469194312796, "percentage": 12.64, "elapsed_time": "0:47:07", "remaining_time": "5:25:48"}
7
- {"current_steps": 170, "total_steps": 1266, "loss": 0.0202, "lr": 9.966487629543766e-06, "epoch": 0.4028436018957346, "percentage": 13.43, "elapsed_time": "0:54:58", "remaining_time": "5:54:26"}
8
- {"current_steps": 180, "total_steps": 1266, "loss": 0.0183, "lr": 9.948660176646152e-06, "epoch": 0.4265402843601896, "percentage": 14.22, "elapsed_time": "1:02:48", "remaining_time": "6:18:53"}
9
- {"current_steps": 190, "total_steps": 1266, "loss": 0.0195, "lr": 9.92706817958964e-06, "epoch": 0.45023696682464454, "percentage": 15.01, "elapsed_time": "1:10:38", "remaining_time": "6:40:03"}
10
- {"current_steps": 200, "total_steps": 1266, "loss": 0.0188, "lr": 9.901728063835561e-06, "epoch": 0.47393364928909953, "percentage": 15.8, "elapsed_time": "1:18:23", "remaining_time": "6:57:52"}
11
- {"current_steps": 200, "total_steps": 1266, "eval_loss": 0.018838880583643913, "epoch": 0.47393364928909953, "percentage": 15.8, "elapsed_time": "1:52:36", "remaining_time": "10:00:12"}
12
- {"current_steps": 210, "total_steps": 1266, "loss": 0.0189, "lr": 9.87265910611365e-06, "epoch": 0.4976303317535545, "percentage": 16.59, "elapsed_time": "2:00:37", "remaining_time": "10:06:33"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"current_steps": 10, "total_steps": 5571, "loss": 2.4399, "lr": 1.7921146953405018e-07, "epoch": 0.005385029617662897, "percentage": 0.18, "elapsed_time": "0:00:22", "remaining_time": "3:28:01"}
2
+ {"current_steps": 20, "total_steps": 5571, "loss": 2.4093, "lr": 3.5842293906810036e-07, "epoch": 0.010770059235325794, "percentage": 0.36, "elapsed_time": "0:00:34", "remaining_time": "2:39:35"}
3
+ {"current_steps": 30, "total_steps": 5571, "loss": 2.1829, "lr": 5.376344086021506e-07, "epoch": 0.01615508885298869, "percentage": 0.54, "elapsed_time": "0:00:46", "remaining_time": "2:23:25"}
4
+ {"current_steps": 40, "total_steps": 5571, "loss": 1.5203, "lr": 7.168458781362007e-07, "epoch": 0.021540118470651588, "percentage": 0.72, "elapsed_time": "0:00:58", "remaining_time": "2:15:20"}
5
+ {"current_steps": 50, "total_steps": 5571, "loss": 0.4885, "lr": 8.96057347670251e-07, "epoch": 0.026925148088314487, "percentage": 0.9, "elapsed_time": "0:01:10", "remaining_time": "2:10:31"}
6
+ {"current_steps": 60, "total_steps": 5571, "loss": 0.1434, "lr": 1.0752688172043011e-06, "epoch": 0.03231017770597738, "percentage": 1.08, "elapsed_time": "0:01:36", "remaining_time": "2:27:56"}
7
+ {"current_steps": 70, "total_steps": 5571, "loss": 0.0447, "lr": 1.2544802867383513e-06, "epoch": 0.03769520732364028, "percentage": 1.26, "elapsed_time": "0:01:48", "remaining_time": "2:22:29"}
8
+ {"current_steps": 80, "total_steps": 5571, "loss": 0.0384, "lr": 1.4336917562724014e-06, "epoch": 0.043080236941303175, "percentage": 1.44, "elapsed_time": "0:02:00", "remaining_time": "2:18:22"}
9
+ {"current_steps": 90, "total_steps": 5571, "loss": 0.0351, "lr": 1.6129032258064516e-06, "epoch": 0.048465266558966075, "percentage": 1.62, "elapsed_time": "0:02:13", "remaining_time": "2:15:08"}
10
+ {"current_steps": 100, "total_steps": 5571, "loss": 0.0316, "lr": 1.792114695340502e-06, "epoch": 0.053850296176628974, "percentage": 1.8, "elapsed_time": "0:02:25", "remaining_time": "2:12:31"}
11
+ {"current_steps": 110, "total_steps": 5571, "loss": 0.028, "lr": 1.9713261648745523e-06, "epoch": 0.05923532579429187, "percentage": 1.97, "elapsed_time": "0:02:46", "remaining_time": "2:17:33"}
12
+ {"current_steps": 120, "total_steps": 5571, "loss": 0.0332, "lr": 2.1505376344086023e-06, "epoch": 0.06462035541195477, "percentage": 2.15, "elapsed_time": "0:02:58", "remaining_time": "2:15:10"}
13
+ {"current_steps": 130, "total_steps": 5571, "loss": 0.0274, "lr": 2.3297491039426526e-06, "epoch": 0.07000538502961766, "percentage": 2.33, "elapsed_time": "0:03:10", "remaining_time": "2:13:03"}
14
+ {"current_steps": 140, "total_steps": 5571, "loss": 0.0285, "lr": 2.5089605734767026e-06, "epoch": 0.07539041464728057, "percentage": 2.51, "elapsed_time": "0:03:22", "remaining_time": "2:11:14"}
15
+ {"current_steps": 150, "total_steps": 5571, "loss": 0.0228, "lr": 2.688172043010753e-06, "epoch": 0.08077544426494346, "percentage": 2.69, "elapsed_time": "0:03:35", "remaining_time": "2:09:37"}
16
+ {"current_steps": 160, "total_steps": 5571, "loss": 0.0279, "lr": 2.867383512544803e-06, "epoch": 0.08616047388260635, "percentage": 2.87, "elapsed_time": "0:03:56", "remaining_time": "2:13:17"}
17
+ {"current_steps": 170, "total_steps": 5571, "loss": 0.0301, "lr": 3.0465949820788532e-06, "epoch": 0.09154550350026926, "percentage": 3.05, "elapsed_time": "0:04:08", "remaining_time": "2:11:40"}
18
+ {"current_steps": 180, "total_steps": 5571, "loss": 0.0209, "lr": 3.225806451612903e-06, "epoch": 0.09693053311793215, "percentage": 3.23, "elapsed_time": "0:04:20", "remaining_time": "2:10:14"}
19
+ {"current_steps": 190, "total_steps": 5571, "loss": 0.0197, "lr": 3.4050179211469536e-06, "epoch": 0.10231556273559504, "percentage": 3.41, "elapsed_time": "0:04:33", "remaining_time": "2:08:55"}
20
+ {"current_steps": 200, "total_steps": 5571, "loss": 0.0234, "lr": 3.584229390681004e-06, "epoch": 0.10770059235325795, "percentage": 3.59, "elapsed_time": "0:04:45", "remaining_time": "2:07:43"}
21
+ {"current_steps": 210, "total_steps": 5571, "loss": 0.0184, "lr": 3.763440860215054e-06, "epoch": 0.11308562197092084, "percentage": 3.77, "elapsed_time": "0:05:07", "remaining_time": "2:10:37"}
22
+ {"current_steps": 220, "total_steps": 5571, "loss": 0.0159, "lr": 3.942652329749105e-06, "epoch": 0.11847065158858373, "percentage": 3.95, "elapsed_time": "0:05:19", "remaining_time": "2:09:24"}
23
+ {"current_steps": 230, "total_steps": 5571, "loss": 0.0192, "lr": 4.121863799283155e-06, "epoch": 0.12385568120624664, "percentage": 4.13, "elapsed_time": "0:05:31", "remaining_time": "2:08:15"}
24
+ {"current_steps": 240, "total_steps": 5571, "loss": 0.0196, "lr": 4.3010752688172045e-06, "epoch": 0.12924071082390953, "percentage": 4.31, "elapsed_time": "0:05:43", "remaining_time": "2:07:12"}
25
+ {"current_steps": 250, "total_steps": 5571, "loss": 0.0199, "lr": 4.480286738351255e-06, "epoch": 0.13462574044157244, "percentage": 4.49, "elapsed_time": "0:05:55", "remaining_time": "2:06:13"}
26
+ {"current_steps": 260, "total_steps": 5571, "loss": 0.0177, "lr": 4.659498207885305e-06, "epoch": 0.14001077005923532, "percentage": 4.67, "elapsed_time": "0:06:17", "remaining_time": "2:08:24"}
27
+ {"current_steps": 270, "total_steps": 5571, "loss": 0.0178, "lr": 4.838709677419355e-06, "epoch": 0.14539579967689822, "percentage": 4.85, "elapsed_time": "0:06:29", "remaining_time": "2:07:24"}
28
+ {"current_steps": 280, "total_steps": 5571, "loss": 0.0157, "lr": 5.017921146953405e-06, "epoch": 0.15078082929456113, "percentage": 5.03, "elapsed_time": "0:06:41", "remaining_time": "2:06:27"}
29
+ {"current_steps": 290, "total_steps": 5571, "loss": 0.0145, "lr": 5.197132616487456e-06, "epoch": 0.156165858912224, "percentage": 5.21, "elapsed_time": "0:06:53", "remaining_time": "2:05:34"}
30
+ {"current_steps": 300, "total_steps": 5571, "loss": 0.0134, "lr": 5.376344086021506e-06, "epoch": 0.16155088852988692, "percentage": 5.39, "elapsed_time": "0:07:05", "remaining_time": "2:04:44"}
31
+ {"current_steps": 300, "total_steps": 5571, "eval_loss": 0.016489772126078606, "epoch": 0.16155088852988692, "percentage": 5.39, "elapsed_time": "0:07:19", "remaining_time": "2:08:42"}
32
+ {"current_steps": 310, "total_steps": 5571, "loss": 0.0137, "lr": 5.555555555555557e-06, "epoch": 0.16693591814754982, "percentage": 5.56, "elapsed_time": "0:07:40", "remaining_time": "2:10:18"}
33
+ {"current_steps": 320, "total_steps": 5571, "loss": 0.0155, "lr": 5.734767025089606e-06, "epoch": 0.1723209477652127, "percentage": 5.74, "elapsed_time": "0:07:52", "remaining_time": "2:09:18"}
34
+ {"current_steps": 330, "total_steps": 5571, "loss": 0.0175, "lr": 5.9139784946236566e-06, "epoch": 0.1777059773828756, "percentage": 5.92, "elapsed_time": "0:08:04", "remaining_time": "2:08:20"}
35
+ {"current_steps": 340, "total_steps": 5571, "loss": 0.0143, "lr": 6.0931899641577065e-06, "epoch": 0.1830910070005385, "percentage": 6.1, "elapsed_time": "0:08:16", "remaining_time": "2:07:25"}
36
+ {"current_steps": 350, "total_steps": 5571, "loss": 0.0145, "lr": 6.272401433691757e-06, "epoch": 0.1884760366182014, "percentage": 6.28, "elapsed_time": "0:08:28", "remaining_time": "2:06:32"}
37
+ {"current_steps": 360, "total_steps": 5571, "loss": 0.0124, "lr": 6.451612903225806e-06, "epoch": 0.1938610662358643, "percentage": 6.46, "elapsed_time": "0:08:50", "remaining_time": "2:07:55"}
38
+ {"current_steps": 370, "total_steps": 5571, "loss": 0.0128, "lr": 6.630824372759857e-06, "epoch": 0.1992460958535272, "percentage": 6.64, "elapsed_time": "0:09:02", "remaining_time": "2:07:03"}
39
+ {"current_steps": 380, "total_steps": 5571, "loss": 0.013, "lr": 6.810035842293907e-06, "epoch": 0.20463112547119008, "percentage": 6.82, "elapsed_time": "0:09:14", "remaining_time": "2:06:13"}
40
+ {"current_steps": 390, "total_steps": 5571, "loss": 0.0125, "lr": 6.989247311827958e-06, "epoch": 0.210016155088853, "percentage": 7.0, "elapsed_time": "0:09:26", "remaining_time": "2:05:25"}
41
+ {"current_steps": 400, "total_steps": 5571, "loss": 0.0136, "lr": 7.168458781362008e-06, "epoch": 0.2154011847065159, "percentage": 7.18, "elapsed_time": "0:09:38", "remaining_time": "2:04:38"}
42
+ {"current_steps": 410, "total_steps": 5571, "loss": 0.0116, "lr": 7.347670250896059e-06, "epoch": 0.22078621432417878, "percentage": 7.36, "elapsed_time": "0:10:00", "remaining_time": "2:05:55"}
43
+ {"current_steps": 420, "total_steps": 5571, "loss": 0.0107, "lr": 7.526881720430108e-06, "epoch": 0.22617124394184168, "percentage": 7.54, "elapsed_time": "0:10:12", "remaining_time": "2:05:08"}
44
+ {"current_steps": 430, "total_steps": 5571, "loss": 0.0117, "lr": 7.706093189964159e-06, "epoch": 0.2315562735595046, "percentage": 7.72, "elapsed_time": "0:10:24", "remaining_time": "2:04:23"}
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:524dbbcfbc78f327015396f99c1bab3f26989726bdfda96be842d9ef64f8cdbc
3
- size 7480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aeaddb2549bffea5cf2713518a74223a1b965d3584290eb56033f2543899c503
3
+ size 7544