Training in progress, step 50
Browse files- README.md +2 -2
- adapter_model.safetensors +1 -1
- preprocessor_config.json +39 -0
- processor_config.json +0 -39
- training_args.bin +2 -2
README.md
CHANGED
|
@@ -3,8 +3,8 @@ library_name: transformers
|
|
| 3 |
model_name: pakdd_tag_comcts_gemma
|
| 4 |
tags:
|
| 5 |
- generated_from_trainer
|
| 6 |
-
- trl
|
| 7 |
- grpo
|
|
|
|
| 8 |
licence: license
|
| 9 |
---
|
| 10 |
|
|
@@ -26,7 +26,7 @@ print(output["generated_text"])
|
|
| 26 |
|
| 27 |
## Training procedure
|
| 28 |
|
| 29 |
-
[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/jylee18/tag/runs/
|
| 30 |
|
| 31 |
|
| 32 |
This model was trained with GRPO, a method introduced in [DeepSeekMath: Pushing the Limits of Mathematical Reasoning in Open Language Models](https://huggingface.co/papers/2402.03300).
|
|
|
|
| 3 |
model_name: pakdd_tag_comcts_gemma
|
| 4 |
tags:
|
| 5 |
- generated_from_trainer
|
|
|
|
| 6 |
- grpo
|
| 7 |
+
- trl
|
| 8 |
licence: license
|
| 9 |
---
|
| 10 |
|
|
|
|
| 26 |
|
| 27 |
## Training procedure
|
| 28 |
|
| 29 |
+
[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/jylee18/tag/runs/5626hibe)
|
| 30 |
|
| 31 |
|
| 32 |
This model was trained with GRPO, a method introduced in [DeepSeekMath: Pushing the Limits of Mathematical Reasoning in Open Language Models](https://huggingface.co/papers/2402.03300).
|
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 12932216
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bbf625ea0857f9a418b28fc331ab3233953020a699bc53fea0b6a9ca59186324
|
| 3 |
size 12932216
|
preprocessor_config.json
ADDED
|
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"crop_size": null,
|
| 3 |
+
"data_format": "channels_first",
|
| 4 |
+
"default_to_square": true,
|
| 5 |
+
"device": null,
|
| 6 |
+
"disable_grouping": null,
|
| 7 |
+
"do_center_crop": null,
|
| 8 |
+
"do_convert_rgb": null,
|
| 9 |
+
"do_normalize": true,
|
| 10 |
+
"do_pad": null,
|
| 11 |
+
"do_pan_and_scan": null,
|
| 12 |
+
"do_rescale": true,
|
| 13 |
+
"do_resize": true,
|
| 14 |
+
"image_mean": [
|
| 15 |
+
0.5,
|
| 16 |
+
0.5,
|
| 17 |
+
0.5
|
| 18 |
+
],
|
| 19 |
+
"image_processor_type": "Gemma3ImageProcessorFast",
|
| 20 |
+
"image_seq_length": 256,
|
| 21 |
+
"image_std": [
|
| 22 |
+
0.5,
|
| 23 |
+
0.5,
|
| 24 |
+
0.5
|
| 25 |
+
],
|
| 26 |
+
"input_data_format": null,
|
| 27 |
+
"pad_size": null,
|
| 28 |
+
"pan_and_scan_max_num_crops": null,
|
| 29 |
+
"pan_and_scan_min_crop_size": null,
|
| 30 |
+
"pan_and_scan_min_ratio_to_activate": null,
|
| 31 |
+
"processor_class": "Gemma3Processor",
|
| 32 |
+
"resample": 2,
|
| 33 |
+
"rescale_factor": 0.00392156862745098,
|
| 34 |
+
"return_tensors": null,
|
| 35 |
+
"size": {
|
| 36 |
+
"height": 896,
|
| 37 |
+
"width": 896
|
| 38 |
+
}
|
| 39 |
+
}
|
processor_config.json
CHANGED
|
@@ -1,43 +1,4 @@
|
|
| 1 |
{
|
| 2 |
-
"image_processor": {
|
| 3 |
-
"crop_size": null,
|
| 4 |
-
"data_format": "channels_first",
|
| 5 |
-
"default_to_square": true,
|
| 6 |
-
"device": null,
|
| 7 |
-
"disable_grouping": null,
|
| 8 |
-
"do_center_crop": null,
|
| 9 |
-
"do_convert_rgb": null,
|
| 10 |
-
"do_normalize": true,
|
| 11 |
-
"do_pad": null,
|
| 12 |
-
"do_pan_and_scan": null,
|
| 13 |
-
"do_rescale": true,
|
| 14 |
-
"do_resize": true,
|
| 15 |
-
"image_mean": [
|
| 16 |
-
0.5,
|
| 17 |
-
0.5,
|
| 18 |
-
0.5
|
| 19 |
-
],
|
| 20 |
-
"image_processor_type": "Gemma3ImageProcessorFast",
|
| 21 |
-
"image_seq_length": 256,
|
| 22 |
-
"image_std": [
|
| 23 |
-
0.5,
|
| 24 |
-
0.5,
|
| 25 |
-
0.5
|
| 26 |
-
],
|
| 27 |
-
"input_data_format": null,
|
| 28 |
-
"pad_size": null,
|
| 29 |
-
"pan_and_scan_max_num_crops": null,
|
| 30 |
-
"pan_and_scan_min_crop_size": null,
|
| 31 |
-
"pan_and_scan_min_ratio_to_activate": null,
|
| 32 |
-
"processor_class": "Gemma3Processor",
|
| 33 |
-
"resample": 2,
|
| 34 |
-
"rescale_factor": 0.00392156862745098,
|
| 35 |
-
"return_tensors": null,
|
| 36 |
-
"size": {
|
| 37 |
-
"height": 896,
|
| 38 |
-
"width": 896
|
| 39 |
-
}
|
| 40 |
-
},
|
| 41 |
"image_seq_length": 256,
|
| 42 |
"processor_class": "Gemma3Processor"
|
| 43 |
}
|
|
|
|
| 1 |
{
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
"image_seq_length": 256,
|
| 3 |
"processor_class": "Gemma3Processor"
|
| 4 |
}
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c01fdd119e8b2fe6c6f8f32bef79b2e58497a3eabaa6c75c7d51203c168d598c
|
| 3 |
+
size 6904
|