baloglu321 committed on
Commit
bafbcb2
·
verified ·
1 Parent(s): fa0f274

baloglu321/gemma-2-2B-it-thinking-function_calling-V0

Browse files
README.md CHANGED
@@ -34,11 +34,11 @@ This model was trained with SFT.
34
 
35
  ### Framework versions
36
 
37
- - TRL: 0.15.1
38
- - Transformers: 4.48.3
39
- - Pytorch: 2.5.1+cu124
40
- - Datasets: 3.3.2
41
- - Tokenizers: 0.21.0
42
 
43
  ## Citations
44
 
@@ -49,7 +49,7 @@ Cite TRL as:
49
  ```bibtex
50
  @misc{vonwerra2022trl,
51
  title = {{TRL: Transformer Reinforcement Learning}},
52
- author = {Leandro von Werra and Younes Belkada and Lewis Tunstall and Edward Beeching and Tristan Thrush and Nathan Lambert and Shengyi Huang and Kashif Rasul and Quentin Gallouédec},
53
  year = 2020,
54
  journal = {GitHub repository},
55
  publisher = {GitHub},
 
34
 
35
  ### Framework versions
36
 
37
+ - TRL: 0.17.0
38
+ - Transformers: 4.51.3
39
+ - Pytorch: 2.6.0+cu124
40
+ - Datasets: 3.6.0
41
+ - Tokenizers: 0.21.1
42
 
43
  ## Citations
44
 
 
49
  ```bibtex
50
  @misc{vonwerra2022trl,
51
  title = {{TRL: Transformer Reinforcement Learning}},
52
+ author = {Leandro von Werra and Younes Belkada and Lewis Tunstall and Edward Beeching and Tristan Thrush and Nathan Lambert and Shengyi Huang and Kashif Rasul and Quentin Gallou{\'e}dec},
53
  year = 2020,
54
  journal = {GitHub repository},
55
  publisher = {GitHub},
adapter_config.json CHANGED
@@ -3,6 +3,7 @@
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "google/gemma-2-2b-it",
5
  "bias": "none",
 
6
  "eva_config": null,
7
  "exclude_modules": null,
8
  "fan_in_fan_out": false,
@@ -23,17 +24,18 @@
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
- "k_proj",
27
- "v_proj",
28
  "down_proj",
29
- "gate_proj",
30
  "embed_tokens",
31
- "o_proj",
32
- "q_proj",
33
- "lm_head",
34
- "up_proj"
35
  ],
36
  "task_type": "CAUSAL_LM",
 
37
  "use_dora": false,
38
  "use_rslora": false
39
  }
 
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "google/gemma-2-2b-it",
5
  "bias": "none",
6
+ "corda_config": null,
7
  "eva_config": null,
8
  "exclude_modules": null,
9
  "fan_in_fan_out": false,
 
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
27
+ "lm_head",
28
+ "q_proj",
29
  "down_proj",
30
+ "k_proj",
31
  "embed_tokens",
32
+ "gate_proj",
33
+ "v_proj",
34
+ "up_proj",
35
+ "o_proj"
36
  ],
37
  "task_type": "CAUSAL_LM",
38
+ "trainable_token_indices": null,
39
  "use_dora": false,
40
  "use_rslora": false
41
  }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ac146acd21f54248f045ac12d50e4f1265afeb00901719a4740bcb1c2fc8e68
3
  size 2475549872
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3bdf32ea49d0e5a1c9152d96734629f75611c8a9c95d07067aa94572eb8ea5a
3
  size 2475549872
runs/May11_12-41-58_4dd80c48a4c5/events.out.tfevents.1746967345.4dd80c48a4c5.1808.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fe3c0968162b6b1e59ff1a06323c18e2d5997fd75ce83f6ff087f2e0a7b452f
3
+ size 41400
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:95485e8c267905da6178e167d719e7e47b4ce3c451d64b4e38b719a8ea4e08d8
3
- size 5624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae19ba492176177f25b68ab411b8e2ca1ec69526ad23ca1df12e5faaeb36a253
3
+ size 5752