EmiliaLee committed on
Commit
cfc68cf
·
verified ·
1 Parent(s): af3a467

Training in progress, step 50

Browse files
README.md CHANGED
@@ -3,8 +3,8 @@ library_name: transformers
3
  model_name: pakdd_tag_comcts_gemma
4
  tags:
5
  - generated_from_trainer
6
- - trl
7
  - grpo
 
8
  licence: license
9
  ---
10
 
@@ -26,7 +26,7 @@ print(output["generated_text"])
26
 
27
  ## Training procedure
28
 
29
- [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/jylee18/tag/runs/bkwqqhra)
30
 
31
 
32
  This model was trained with GRPO, a method introduced in [DeepSeekMath: Pushing the Limits of Mathematical Reasoning in Open Language Models](https://huggingface.co/papers/2402.03300).
 
3
  model_name: pakdd_tag_comcts_gemma
4
  tags:
5
  - generated_from_trainer
 
6
  - grpo
7
+ - trl
8
  licence: license
9
  ---
10
 
 
26
 
27
  ## Training procedure
28
 
29
+ [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/jylee18/tag/runs/5626hibe)
30
 
31
 
32
  This model was trained with GRPO, a method introduced in [DeepSeekMath: Pushing the Limits of Mathematical Reasoning in Open Language Models](https://huggingface.co/papers/2402.03300).
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f057c762fd61cb9ca14d09d69e123415de6a4812f29de00490a4804026cf4afb
3
  size 12932216
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbf625ea0857f9a418b28fc331ab3233953020a699bc53fea0b6a9ca59186324
3
  size 12932216
preprocessor_config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": null,
3
+ "data_format": "channels_first",
4
+ "default_to_square": true,
5
+ "device": null,
6
+ "disable_grouping": null,
7
+ "do_center_crop": null,
8
+ "do_convert_rgb": null,
9
+ "do_normalize": true,
10
+ "do_pad": null,
11
+ "do_pan_and_scan": null,
12
+ "do_rescale": true,
13
+ "do_resize": true,
14
+ "image_mean": [
15
+ 0.5,
16
+ 0.5,
17
+ 0.5
18
+ ],
19
+ "image_processor_type": "Gemma3ImageProcessorFast",
20
+ "image_seq_length": 256,
21
+ "image_std": [
22
+ 0.5,
23
+ 0.5,
24
+ 0.5
25
+ ],
26
+ "input_data_format": null,
27
+ "pad_size": null,
28
+ "pan_and_scan_max_num_crops": null,
29
+ "pan_and_scan_min_crop_size": null,
30
+ "pan_and_scan_min_ratio_to_activate": null,
31
+ "processor_class": "Gemma3Processor",
32
+ "resample": 2,
33
+ "rescale_factor": 0.00392156862745098,
34
+ "return_tensors": null,
35
+ "size": {
36
+ "height": 896,
37
+ "width": 896
38
+ }
39
+ }
processor_config.json CHANGED
@@ -1,43 +1,4 @@
1
  {
2
- "image_processor": {
3
- "crop_size": null,
4
- "data_format": "channels_first",
5
- "default_to_square": true,
6
- "device": null,
7
- "disable_grouping": null,
8
- "do_center_crop": null,
9
- "do_convert_rgb": null,
10
- "do_normalize": true,
11
- "do_pad": null,
12
- "do_pan_and_scan": null,
13
- "do_rescale": true,
14
- "do_resize": true,
15
- "image_mean": [
16
- 0.5,
17
- 0.5,
18
- 0.5
19
- ],
20
- "image_processor_type": "Gemma3ImageProcessorFast",
21
- "image_seq_length": 256,
22
- "image_std": [
23
- 0.5,
24
- 0.5,
25
- 0.5
26
- ],
27
- "input_data_format": null,
28
- "pad_size": null,
29
- "pan_and_scan_max_num_crops": null,
30
- "pan_and_scan_min_crop_size": null,
31
- "pan_and_scan_min_ratio_to_activate": null,
32
- "processor_class": "Gemma3Processor",
33
- "resample": 2,
34
- "rescale_factor": 0.00392156862745098,
35
- "return_tensors": null,
36
- "size": {
37
- "height": 896,
38
- "width": 896
39
- }
40
- },
41
  "image_seq_length": 256,
42
  "processor_class": "Gemma3Processor"
43
  }
 
1
  {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  "image_seq_length": 256,
3
  "processor_class": "Gemma3Processor"
4
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e2b1931eb8e4acc0b0bac7ca3c7f637f681100fcdcbb1becd527df06588b304
3
- size 6136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c01fdd119e8b2fe6c6f8f32bef79b2e58497a3eabaa6c75c7d51203c168d598c
3
+ size 6904