Video-Text-to-Text
Transformers
Safetensors
qwen3_vl
image-text-to-text
llama-factory
full
Generated from Trainer
video-language-model
video-captioning
Instructions to use chancharikm/CHAI_SFT_model_8b with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Transformers
How to use chancharikm/CHAI_SFT_model_8b with Transformers:
```python
# Load model directly
from transformers import AutoProcessor, AutoModelForImageTextToText

processor = AutoProcessor.from_pretrained("chancharikm/CHAI_SFT_model_8b")
model = AutoModelForImageTextToText.from_pretrained("chancharikm/CHAI_SFT_model_8b")
```
- Notebooks
- Google Colab
- Kaggle
Training in progress, step 100
Browse files
- model-00001-of-00004.safetensors +1 -1
- model-00002-of-00004.safetensors +1 -1
- model-00003-of-00004.safetensors +1 -1
- model-00004-of-00004.safetensors +1 -1
- tokenizer_config.json +1 -0
- trainer_log.jsonl +50 -0
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4998056552
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0a911539e7f25a28f3ad9780195aaef6f434e1328192c4ec5b377848e723f808
|
| 3 |
size 4998056552
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915962464
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f7e330692c5cd0b1bf9d409dd671819a6fdf8d0b94f867baaddab71c16922d23
|
| 3 |
size 4915962464
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915962496
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1270438dc14e5bebef80bda50d2262cedac8fb28b17a04ee1bf92ccd61144005
|
| 3 |
size 4915962496
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2704357976
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ae5297306f4058b93cd62d5b31ed3c8868e056d884c1336c14cebe8b466e7e14
|
| 3 |
size 2704357976
|
tokenizer_config.json
CHANGED
|
@@ -234,6 +234,7 @@
|
|
| 234 |
"model_max_length": 262144,
|
| 235 |
"pad_token": "<|endoftext|>",
|
| 236 |
"padding_side": "right",
|
|
|
|
| 237 |
"split_special_tokens": false,
|
| 238 |
"tokenizer_class": "Qwen2Tokenizer",
|
| 239 |
"unk_token": null
|
|
|
|
| 234 |
"model_max_length": 262144,
|
| 235 |
"pad_token": "<|endoftext|>",
|
| 236 |
"padding_side": "right",
|
| 237 |
+
"processor_class": "Qwen3VLProcessor",
|
| 238 |
"split_special_tokens": false,
|
| 239 |
"tokenizer_class": "Qwen2Tokenizer",
|
| 240 |
"unk_token": null
|
trainer_log.jsonl
CHANGED
|
@@ -48,3 +48,53 @@
|
|
| 48 |
{"current_steps": 48, "total_steps": 741, "loss": 0.4208, "lr": 2.9987869552193653e-05, "epoch": 0.1947261663286004, "percentage": 6.48, "elapsed_time": "4:22:11", "remaining_time": "2 days, 15:05:16"}
|
| 49 |
{"current_steps": 49, "total_steps": 741, "loss": 0.3992, "lr": 2.9985024612053743e-05, "epoch": 0.19878296146044624, "percentage": 6.61, "elapsed_time": "4:27:35", "remaining_time": "2 days, 14:59:09"}
|
| 50 |
{"current_steps": 50, "total_steps": 741, "loss": 0.3999, "lr": 2.9981880413869707e-05, "epoch": 0.2028397565922921, "percentage": 6.75, "elapsed_time": "4:32:48", "remaining_time": "2 days, 14:50:09"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 48 |
{"current_steps": 48, "total_steps": 741, "loss": 0.4208, "lr": 2.9987869552193653e-05, "epoch": 0.1947261663286004, "percentage": 6.48, "elapsed_time": "4:22:11", "remaining_time": "2 days, 15:05:16"}
|
| 49 |
{"current_steps": 49, "total_steps": 741, "loss": 0.3992, "lr": 2.9985024612053743e-05, "epoch": 0.19878296146044624, "percentage": 6.61, "elapsed_time": "4:27:35", "remaining_time": "2 days, 14:59:09"}
|
| 50 |
{"current_steps": 50, "total_steps": 741, "loss": 0.3999, "lr": 2.9981880413869707e-05, "epoch": 0.2028397565922921, "percentage": 6.75, "elapsed_time": "4:32:48", "remaining_time": "2 days, 14:50:09"}
|
| 51 |
+
{"current_steps": 51, "total_steps": 741, "loss": 0.4206, "lr": 2.9978437020432673e-05, "epoch": 0.20689655172413793, "percentage": 6.88, "elapsed_time": "4:39:09", "remaining_time": "2 days, 14:56:51"}
|
| 52 |
+
{"current_steps": 52, "total_steps": 741, "loss": 0.422, "lr": 2.997469450050883e-05, "epoch": 0.21095334685598377, "percentage": 7.02, "elapsed_time": "4:44:16", "remaining_time": "2 days, 14:46:33"}
|
| 53 |
+
{"current_steps": 53, "total_steps": 741, "loss": 0.4132, "lr": 2.997065292883808e-05, "epoch": 0.2150101419878296, "percentage": 7.15, "elapsed_time": "4:49:38", "remaining_time": "2 days, 14:39:56"}
|
| 54 |
+
{"current_steps": 54, "total_steps": 741, "loss": 0.4014, "lr": 2.9966312386132533e-05, "epoch": 0.21906693711967545, "percentage": 7.29, "elapsed_time": "4:54:29", "remaining_time": "2 days, 14:26:33"}
|
| 55 |
+
{"current_steps": 55, "total_steps": 741, "loss": 0.4125, "lr": 2.9961672959074872e-05, "epoch": 0.2231237322515213, "percentage": 7.42, "elapsed_time": "4:59:53", "remaining_time": "2 days, 14:20:33"}
|
| 56 |
+
{"current_steps": 56, "total_steps": 741, "loss": 0.4394, "lr": 2.995673474031666e-05, "epoch": 0.22718052738336714, "percentage": 7.56, "elapsed_time": "5:05:02", "remaining_time": "2 days, 14:11:18"}
|
| 57 |
+
{"current_steps": 57, "total_steps": 741, "loss": 0.4109, "lr": 2.9951497828476462e-05, "epoch": 0.23123732251521298, "percentage": 7.69, "elapsed_time": "5:10:32", "remaining_time": "2 days, 14:06:30"}
|
| 58 |
+
{"current_steps": 58, "total_steps": 741, "loss": 0.4078, "lr": 2.9945962328137898e-05, "epoch": 0.23529411764705882, "percentage": 7.83, "elapsed_time": "5:15:01", "remaining_time": "2 days, 13:49:43"}
|
| 59 |
+
{"current_steps": 59, "total_steps": 741, "loss": 0.3654, "lr": 2.9940128349847526e-05, "epoch": 0.23935091277890466, "percentage": 7.96, "elapsed_time": "5:20:03", "remaining_time": "2 days, 13:39:45"}
|
| 60 |
+
{"current_steps": 60, "total_steps": 741, "loss": 0.378, "lr": 2.993399601011266e-05, "epoch": 0.2434077079107505, "percentage": 8.1, "elapsed_time": "5:24:53", "remaining_time": "2 days, 13:27:28"}
|
| 61 |
+
{"current_steps": 61, "total_steps": 741, "loss": 0.3977, "lr": 2.992756543139904e-05, "epoch": 0.24746450304259635, "percentage": 8.23, "elapsed_time": "5:29:48", "remaining_time": "2 days, 13:16:29"}
|
| 62 |
+
{"current_steps": 62, "total_steps": 741, "loss": 0.3893, "lr": 2.9920836742128352e-05, "epoch": 0.2515212981744422, "percentage": 8.37, "elapsed_time": "5:35:26", "remaining_time": "2 days, 13:13:34"}
|
| 63 |
+
{"current_steps": 63, "total_steps": 741, "loss": 0.384, "lr": 2.9913810076675722e-05, "epoch": 0.25557809330628806, "percentage": 8.5, "elapsed_time": "5:41:22", "remaining_time": "2 days, 13:13:46"}
|
| 64 |
+
{"current_steps": 64, "total_steps": 741, "loss": 0.3573, "lr": 2.990648557536699e-05, "epoch": 0.25963488843813387, "percentage": 8.64, "elapsed_time": "5:46:35", "remaining_time": "2 days, 13:06:16"}
|
| 65 |
+
{"current_steps": 65, "total_steps": 741, "loss": 0.3329, "lr": 2.9898863384475917e-05, "epoch": 0.26369168356997974, "percentage": 8.77, "elapsed_time": "5:51:40", "remaining_time": "2 days, 12:57:20"}
|
| 66 |
+
{"current_steps": 66, "total_steps": 741, "loss": 0.3359, "lr": 2.9890943656221262e-05, "epoch": 0.26774847870182555, "percentage": 8.91, "elapsed_time": "5:57:10", "remaining_time": "2 days, 12:52:56"}
|
| 67 |
+
{"current_steps": 67, "total_steps": 741, "loss": 0.3707, "lr": 2.9882726548763765e-05, "epoch": 0.2718052738336714, "percentage": 9.04, "elapsed_time": "6:03:11", "remaining_time": "2 days, 12:53:36"}
|
| 68 |
+
{"current_steps": 68, "total_steps": 741, "loss": 0.3975, "lr": 2.9874212226202946e-05, "epoch": 0.27586206896551724, "percentage": 9.18, "elapsed_time": "6:08:27", "remaining_time": "2 days, 12:46:40"}
|
| 69 |
+
{"current_steps": 69, "total_steps": 741, "loss": 0.3639, "lr": 2.9865400858573866e-05, "epoch": 0.2799188640973631, "percentage": 9.31, "elapsed_time": "6:14:32", "remaining_time": "2 days, 12:47:37"}
|
| 70 |
+
{"current_steps": 70, "total_steps": 741, "loss": 0.3945, "lr": 2.985629262184371e-05, "epoch": 0.2839756592292089, "percentage": 9.45, "elapsed_time": "6:20:39", "remaining_time": "2 days, 12:48:55"}
|
| 71 |
+
{"current_steps": 71, "total_steps": 741, "loss": 0.3875, "lr": 2.9846887697908292e-05, "epoch": 0.2880324543610548, "percentage": 9.58, "elapsed_time": "6:26:24", "remaining_time": "2 days, 12:46:24"}
|
| 72 |
+
{"current_steps": 72, "total_steps": 741, "loss": 0.3666, "lr": 2.9837186274588388e-05, "epoch": 0.2920892494929006, "percentage": 9.72, "elapsed_time": "6:31:41", "remaining_time": "2 days, 12:39:31"}
|
| 73 |
+
{"current_steps": 73, "total_steps": 741, "loss": 0.3371, "lr": 2.9827188545626026e-05, "epoch": 0.2961460446247465, "percentage": 9.85, "elapsed_time": "6:36:47", "remaining_time": "2 days, 12:30:57"}
|
| 74 |
+
{"current_steps": 74, "total_steps": 741, "loss": 0.3472, "lr": 2.9816894710680595e-05, "epoch": 0.3002028397565923, "percentage": 9.99, "elapsed_time": "6:42:00", "remaining_time": "2 days, 12:23:29"}
|
| 75 |
+
{"current_steps": 75, "total_steps": 741, "loss": 0.3787, "lr": 2.9806304975324853e-05, "epoch": 0.30425963488843816, "percentage": 10.12, "elapsed_time": "6:47:52", "remaining_time": "2 days, 12:21:52"}
|
| 76 |
+
{"current_steps": 76, "total_steps": 741, "loss": 0.3422, "lr": 2.9795419551040836e-05, "epoch": 0.30831643002028397, "percentage": 10.26, "elapsed_time": "6:53:36", "remaining_time": "2 days, 12:19:07"}
|
| 77 |
+
{"current_steps": 77, "total_steps": 741, "loss": 0.3424, "lr": 2.9784238655215627e-05, "epoch": 0.31237322515212984, "percentage": 10.39, "elapsed_time": "6:58:36", "remaining_time": "2 days, 12:09:45"}
|
| 78 |
+
{"current_steps": 78, "total_steps": 741, "loss": 0.3363, "lr": 2.9772762511137018e-05, "epoch": 0.31643002028397565, "percentage": 10.53, "elapsed_time": "7:04:06", "remaining_time": "2 days, 12:04:55"}
|
| 79 |
+
{"current_steps": 79, "total_steps": 741, "loss": 0.3256, "lr": 2.976099134798904e-05, "epoch": 0.3204868154158215, "percentage": 10.66, "elapsed_time": "7:09:25", "remaining_time": "2 days, 11:58:31"}
|
| 80 |
+
{"current_steps": 80, "total_steps": 741, "loss": 0.3485, "lr": 2.97489254008474e-05, "epoch": 0.32454361054766734, "percentage": 10.8, "elapsed_time": "7:14:58", "remaining_time": "2 days, 11:53:57"}
|
| 81 |
+
{"current_steps": 81, "total_steps": 741, "loss": 0.3706, "lr": 2.973656491067479e-05, "epoch": 0.3286004056795132, "percentage": 10.93, "elapsed_time": "7:21:16", "remaining_time": "2 days, 11:55:31"}
|
| 82 |
+
{"current_steps": 82, "total_steps": 741, "loss": 0.3272, "lr": 2.972391012431605e-05, "epoch": 0.332657200811359, "percentage": 11.07, "elapsed_time": "7:26:10", "remaining_time": "2 days, 11:45:46"}
|
| 83 |
+
{"current_steps": 83, "total_steps": 741, "loss": 0.333, "lr": 2.9710961294493258e-05, "epoch": 0.3367139959432049, "percentage": 11.2, "elapsed_time": "7:30:51", "remaining_time": "2 days, 11:34:13"}
|
| 84 |
+
{"current_steps": 84, "total_steps": 741, "loss": 0.347, "lr": 2.96977186798007e-05, "epoch": 0.3407707910750507, "percentage": 11.34, "elapsed_time": "7:36:13", "remaining_time": "2 days, 11:28:16"}
|
| 85 |
+
{"current_steps": 85, "total_steps": 741, "loss": 0.3006, "lr": 2.9684182544699645e-05, "epoch": 0.3448275862068966, "percentage": 11.47, "elapsed_time": "7:41:48", "remaining_time": "2 days, 11:24:02"}
|
| 86 |
+
{"current_steps": 86, "total_steps": 741, "loss": 0.3158, "lr": 2.9670353159513148e-05, "epoch": 0.3488843813387424, "percentage": 11.61, "elapsed_time": "7:47:53", "remaining_time": "2 days, 11:23:35"}
|
| 87 |
+
{"current_steps": 87, "total_steps": 741, "loss": 0.3582, "lr": 2.965623080042057e-05, "epoch": 0.35294117647058826, "percentage": 11.74, "elapsed_time": "7:53:15", "remaining_time": "2 days, 11:17:36"}
|
| 88 |
+
{"current_steps": 88, "total_steps": 741, "loss": 0.3002, "lr": 2.964181574945213e-05, "epoch": 0.35699797160243407, "percentage": 11.88, "elapsed_time": "7:58:48", "remaining_time": "2 days, 11:12:59"}
|
| 89 |
+
{"current_steps": 89, "total_steps": 741, "loss": 0.3232, "lr": 2.9627108294483213e-05, "epoch": 0.36105476673427994, "percentage": 12.01, "elapsed_time": "8:04:03", "remaining_time": "2 days, 11:06:11"}
|
| 90 |
+
{"current_steps": 90, "total_steps": 741, "loss": 0.3568, "lr": 2.9612108729228678e-05, "epoch": 0.36511156186612576, "percentage": 12.15, "elapsed_time": "8:09:03", "remaining_time": "2 days, 10:57:28"}
|
| 91 |
+
{"current_steps": 91, "total_steps": 741, "loss": 0.3072, "lr": 2.9596817353236945e-05, "epoch": 0.3691683569979716, "percentage": 12.28, "elapsed_time": "8:14:29", "remaining_time": "2 days, 10:52:06"}
|
| 92 |
+
{"current_steps": 92, "total_steps": 741, "loss": 0.3363, "lr": 2.9581234471884047e-05, "epoch": 0.37322515212981744, "percentage": 12.42, "elapsed_time": "8:19:35", "remaining_time": "2 days, 10:44:14"}
|
| 93 |
+
{"current_steps": 93, "total_steps": 741, "loss": 0.2996, "lr": 2.9565360396367506e-05, "epoch": 0.3772819472616633, "percentage": 12.55, "elapsed_time": "8:24:57", "remaining_time": "2 days, 10:38:28"}
|
| 94 |
+
{"current_steps": 94, "total_steps": 741, "loss": 0.347, "lr": 2.954919544370014e-05, "epoch": 0.3813387423935091, "percentage": 12.69, "elapsed_time": "8:30:40", "remaining_time": "2 days, 10:34:59"}
|
| 95 |
+
{"current_steps": 95, "total_steps": 741, "loss": 0.3332, "lr": 2.9532739936703703e-05, "epoch": 0.385395537525355, "percentage": 12.82, "elapsed_time": "8:35:41", "remaining_time": "2 days, 10:26:39"}
|
| 96 |
+
{"current_steps": 96, "total_steps": 741, "loss": 0.2828, "lr": 2.9515994204002485e-05, "epoch": 0.3894523326572008, "percentage": 12.96, "elapsed_time": "8:41:32", "remaining_time": "2 days, 10:24:09"}
|
| 97 |
+
{"current_steps": 97, "total_steps": 741, "loss": 0.3293, "lr": 2.9498958580016692e-05, "epoch": 0.3935091277890467, "percentage": 13.09, "elapsed_time": "8:46:43", "remaining_time": "2 days, 10:17:02"}
|
| 98 |
+
{"current_steps": 98, "total_steps": 741, "loss": 0.3071, "lr": 2.9481633404955816e-05, "epoch": 0.3975659229208925, "percentage": 13.23, "elapsed_time": "8:52:05", "remaining_time": "2 days, 10:11:08"}
|
| 99 |
+
{"current_steps": 99, "total_steps": 741, "loss": 0.293, "lr": 2.9464019024811817e-05, "epoch": 0.40162271805273836, "percentage": 13.36, "elapsed_time": "8:57:10", "remaining_time": "2 days, 10:03:30"}
|
| 100 |
+
{"current_steps": 100, "total_steps": 741, "loss": 0.3201, "lr": 2.9446115791352207e-05, "epoch": 0.4056795131845842, "percentage": 13.5, "elapsed_time": "9:02:08", "remaining_time": "2 days, 9:55:07"}
|