penfever commited on
Commit
604bcfb
·
verified ·
1 Parent(s): 3f734ce

Training in progress, step 400

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a8e4be56d38abb98b9d459369d46428853f621d6d093a6a81f32823bc720f83c
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1df44194b32f263dfba9be329058741d708b94cbc88cb1cc7374fe58909d7781
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed2fc04ef24b0a46667cedd919cf34a64e51dcf1c65560a5c4cd1f081bbe36b2
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4635e0d935a82a93b0fe29e2245045b9f217cf10c0525770fe9288ef6277b587
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b98c5a2c02a40dfa661e83efa6741e8ffb344db28c5f6724366a18ddb909b04d
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a471a7dd491963f9a6995dfed0a64b573e7c83e307c354435a8b2bf02896362
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:05efc445e66fc1fc90a6947cd7e7474a4df2906e0f333b4d53ac8b346740c0e1
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc2746917e9269045dbae911a97213dca3a1fa65366972b4eac2c390bdfc2e31
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -51,3 +51,30 @@
51
  {"current_steps": 255, "total_steps": 9128, "loss": 0.2757, "lr": 1.1128148959474261e-05, "epoch": 0.1956271576524741, "percentage": 2.79, "elapsed_time": "2:26:03", "remaining_time": "3 days, 12:42:25"}
52
  {"current_steps": 260, "total_steps": 9128, "loss": 0.2808, "lr": 1.1347207009857613e-05, "epoch": 0.19946298427311085, "percentage": 2.85, "elapsed_time": "2:28:56", "remaining_time": "3 days, 12:40:07"}
53
  {"current_steps": 265, "total_steps": 9128, "loss": 0.2751, "lr": 1.1566265060240964e-05, "epoch": 0.2032988108937476, "percentage": 2.9, "elapsed_time": "2:31:37", "remaining_time": "3 days, 12:31:18"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
51
  {"current_steps": 255, "total_steps": 9128, "loss": 0.2757, "lr": 1.1128148959474261e-05, "epoch": 0.1956271576524741, "percentage": 2.79, "elapsed_time": "2:26:03", "remaining_time": "3 days, 12:42:25"}
52
  {"current_steps": 260, "total_steps": 9128, "loss": 0.2808, "lr": 1.1347207009857613e-05, "epoch": 0.19946298427311085, "percentage": 2.85, "elapsed_time": "2:28:56", "remaining_time": "3 days, 12:40:07"}
53
  {"current_steps": 265, "total_steps": 9128, "loss": 0.2751, "lr": 1.1566265060240964e-05, "epoch": 0.2032988108937476, "percentage": 2.9, "elapsed_time": "2:31:37", "remaining_time": "3 days, 12:31:18"}
54
+ {"current_steps": 270, "total_steps": 9128, "loss": 0.2608, "lr": 1.1785323110624316e-05, "epoch": 0.20713463751438435, "percentage": 2.96, "elapsed_time": "2:34:31", "remaining_time": "3 days, 12:29:30"}
55
+ {"current_steps": 275, "total_steps": 9128, "loss": 0.2757, "lr": 1.2004381161007668e-05, "epoch": 0.2109704641350211, "percentage": 3.01, "elapsed_time": "2:37:27", "remaining_time": "3 days, 12:28:58"}
56
+ {"current_steps": 280, "total_steps": 9128, "loss": 0.3343, "lr": 1.222343921139102e-05, "epoch": 0.21480629075565785, "percentage": 3.07, "elapsed_time": "2:39:41", "remaining_time": "3 days, 12:06:05"}
57
+ {"current_steps": 285, "total_steps": 9128, "loss": 0.4158, "lr": 1.2442497261774372e-05, "epoch": 0.2186421173762946, "percentage": 3.12, "elapsed_time": "2:40:56", "remaining_time": "3 days, 11:13:35"}
58
+ {"current_steps": 290, "total_steps": 9128, "loss": 0.3653, "lr": 1.2661555312157722e-05, "epoch": 0.22247794399693133, "percentage": 3.18, "elapsed_time": "2:42:11", "remaining_time": "3 days, 10:23:07"}
59
+ {"current_steps": 295, "total_steps": 9128, "loss": 0.3475, "lr": 1.2880613362541074e-05, "epoch": 0.22631377061756808, "percentage": 3.23, "elapsed_time": "2:43:26", "remaining_time": "3 days, 9:33:55"}
60
+ {"current_steps": 300, "total_steps": 9128, "loss": 0.337, "lr": 1.3099671412924427e-05, "epoch": 0.23014959723820483, "percentage": 3.29, "elapsed_time": "2:44:45", "remaining_time": "3 days, 8:48:14"}
61
+ {"current_steps": 305, "total_steps": 9128, "loss": 0.3226, "lr": 1.3318729463307779e-05, "epoch": 0.23398542385884158, "percentage": 3.34, "elapsed_time": "2:46:01", "remaining_time": "3 days, 8:02:34"}
62
+ {"current_steps": 310, "total_steps": 9128, "loss": 0.3273, "lr": 1.3537787513691129e-05, "epoch": 0.23782125047947833, "percentage": 3.4, "elapsed_time": "2:47:17", "remaining_time": "3 days, 7:18:27"}
63
+ {"current_steps": 315, "total_steps": 9128, "loss": 0.2963, "lr": 1.3756845564074481e-05, "epoch": 0.24165707710011508, "percentage": 3.45, "elapsed_time": "2:48:32", "remaining_time": "3 days, 6:35:16"}
64
+ {"current_steps": 320, "total_steps": 9128, "loss": 0.3139, "lr": 1.3975903614457833e-05, "epoch": 0.24549290372075183, "percentage": 3.51, "elapsed_time": "2:49:46", "remaining_time": "3 days, 5:53:03"}
65
+ {"current_steps": 325, "total_steps": 9128, "loss": 0.2929, "lr": 1.4194961664841185e-05, "epoch": 0.24932873034138858, "percentage": 3.56, "elapsed_time": "2:51:00", "remaining_time": "3 days, 5:12:02"}
66
+ {"current_steps": 330, "total_steps": 9128, "loss": 0.2917, "lr": 1.4414019715224536e-05, "epoch": 0.25316455696202533, "percentage": 3.62, "elapsed_time": "2:52:17", "remaining_time": "3 days, 4:33:25"}
67
+ {"current_steps": 335, "total_steps": 9128, "loss": 0.3017, "lr": 1.4633077765607888e-05, "epoch": 0.2570003835826621, "percentage": 3.67, "elapsed_time": "2:53:34", "remaining_time": "3 days, 3:55:51"}
68
+ {"current_steps": 340, "total_steps": 9128, "loss": 0.2892, "lr": 1.485213581599124e-05, "epoch": 0.26083621020329883, "percentage": 3.72, "elapsed_time": "2:54:49", "remaining_time": "3 days, 3:18:55"}
69
+ {"current_steps": 345, "total_steps": 9128, "loss": 0.2705, "lr": 1.5071193866374592e-05, "epoch": 0.2646720368239356, "percentage": 3.78, "elapsed_time": "2:56:03", "remaining_time": "3 days, 2:42:09"}
70
+ {"current_steps": 350, "total_steps": 9128, "loss": 0.2785, "lr": 1.5290251916757942e-05, "epoch": 0.2685078634445723, "percentage": 3.83, "elapsed_time": "2:57:17", "remaining_time": "3 days, 2:06:38"}
71
+ {"current_steps": 355, "total_steps": 9128, "loss": 0.2818, "lr": 1.5509309967141293e-05, "epoch": 0.27234369006520903, "percentage": 3.89, "elapsed_time": "2:58:35", "remaining_time": "3 days, 1:33:25"}
72
+ {"current_steps": 360, "total_steps": 9128, "loss": 0.279, "lr": 1.5728368017524643e-05, "epoch": 0.2761795166858458, "percentage": 3.94, "elapsed_time": "2:59:50", "remaining_time": "3 days, 1:00:10"}
73
+ {"current_steps": 365, "total_steps": 9128, "loss": 0.2851, "lr": 1.5947426067907997e-05, "epoch": 0.28001534330648253, "percentage": 4.0, "elapsed_time": "3:01:09", "remaining_time": "3 days, 0:29:19"}
74
+ {"current_steps": 370, "total_steps": 9128, "loss": 0.2818, "lr": 1.6166484118291347e-05, "epoch": 0.2838511699271193, "percentage": 4.05, "elapsed_time": "3:02:23", "remaining_time": "2 days, 23:57:10"}
75
+ {"current_steps": 375, "total_steps": 9128, "loss": 0.2841, "lr": 1.63855421686747e-05, "epoch": 0.28768699654775604, "percentage": 4.11, "elapsed_time": "3:03:40", "remaining_time": "2 days, 23:27:22"}
76
+ {"current_steps": 380, "total_steps": 9128, "loss": 0.2694, "lr": 1.660460021905805e-05, "epoch": 0.2915228231683928, "percentage": 4.16, "elapsed_time": "3:04:58", "remaining_time": "2 days, 22:58:26"}
77
+ {"current_steps": 385, "total_steps": 9128, "loss": 0.2791, "lr": 1.6823658269441402e-05, "epoch": 0.29535864978902954, "percentage": 4.22, "elapsed_time": "3:06:20", "remaining_time": "2 days, 22:31:41"}
78
+ {"current_steps": 390, "total_steps": 9128, "loss": 0.2846, "lr": 1.7042716319824756e-05, "epoch": 0.2991944764096663, "percentage": 4.27, "elapsed_time": "3:07:35", "remaining_time": "2 days, 22:02:57"}
79
+ {"current_steps": 395, "total_steps": 9128, "loss": 0.2566, "lr": 1.7261774370208106e-05, "epoch": 0.30303030303030304, "percentage": 4.33, "elapsed_time": "3:08:49", "remaining_time": "2 days, 21:34:38"}
80
+ {"current_steps": 400, "total_steps": 9128, "loss": 0.2695, "lr": 1.7480832420591457e-05, "epoch": 0.3068661296509398, "percentage": 4.38, "elapsed_time": "3:10:04", "remaining_time": "2 days, 21:07:21"}