danijeun committed on
Commit
8d7e632
·
verified ·
1 Parent(s): 6950e83

Jofthomas/gemma-2-2B-it-thinking-function_calling-V0

Browse files
README.md CHANGED
@@ -1,5 +1,5 @@
1
  ---
2
- base_model: google/gemma-2-2b-it
3
  library_name: transformers
4
  model_name: gemma-2-2B-it-thinking-function_calling-V0
5
  tags:
@@ -11,7 +11,7 @@ licence: license
11
 
12
  # Model Card for gemma-2-2B-it-thinking-function_calling-V0
13
 
14
- This model is a fine-tuned version of [google/gemma-2-2b-it](https://huggingface.co/google/gemma-2-2b-it).
15
  It has been trained using [TRL](https://github.com/huggingface/trl).
16
 
17
  ## Quick start
@@ -34,9 +34,9 @@ This model was trained with SFT.
34
 
35
  ### Framework versions
36
 
37
- - TRL: 0.18.0
38
- - Transformers: 4.52.3
39
- - Pytorch: 2.7.0
40
  - Datasets: 3.6.0
41
  - Tokenizers: 0.21.1
42
 
 
1
  ---
2
+ base_model: QCRI/Fanar-1-9B-Instruct
3
  library_name: transformers
4
  model_name: gemma-2-2B-it-thinking-function_calling-V0
5
  tags:
 
11
 
12
  # Model Card for gemma-2-2B-it-thinking-function_calling-V0
13
 
14
+ This model is a fine-tuned version of [QCRI/Fanar-1-9B-Instruct](https://huggingface.co/QCRI/Fanar-1-9B-Instruct).
15
  It has been trained using [TRL](https://github.com/huggingface/trl).
16
 
17
  ## Quick start
 
34
 
35
  ### Framework versions
36
 
37
+ - TRL: 0.18.1
38
+ - Transformers: 4.52.4
39
+ - Pytorch: 2.7.1
40
  - Datasets: 3.6.0
41
  - Tokenizers: 0.21.1
42
 
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "google/gemma-2-2b-it",
5
  "bias": "none",
6
  "corda_config": null,
7
  "eva_config": null,
@@ -24,15 +24,15 @@
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
27
- "down_proj",
28
- "embed_tokens",
29
- "gate_proj",
30
  "k_proj",
 
 
 
31
  "q_proj",
 
32
  "v_proj",
33
- "lm_head",
34
- "up_proj",
35
- "o_proj"
36
  ],
37
  "task_type": "CAUSAL_LM",
38
  "trainable_token_indices": null,
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "QCRI/Fanar-1-9B-Instruct",
5
  "bias": "none",
6
  "corda_config": null,
7
  "eva_config": null,
 
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
27
+ "lm_head",
 
 
28
  "k_proj",
29
+ "embed_tokens",
30
+ "down_proj",
31
+ "o_proj",
32
  "q_proj",
33
+ "gate_proj",
34
  "v_proj",
35
+ "up_proj"
 
 
36
  ],
37
  "task_type": "CAUSAL_LM",
38
  "trainable_token_indices": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4ace2d0713c369b1111a51dbe8b907ca893c3884ad908f5c5bfc94ed9633e59
3
- size 2475549872
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1dd592f48b190b9262a4cac71e0c38d219d3b7ee90d3c7b0f8750227d79549a3
3
+ size 2071821368
added_tokens.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "</think>": 256003,
3
- "</tool_call>": 256005,
4
- "</tool_response>": 256007,
5
- "</tools>": 256001,
6
- "<think>": 256002,
7
- "<tool_call>": 256004,
8
- "<tool_response>": 256006,
9
- "<tools>": 256000
10
  }
 
1
  {
2
+ "</think>": 128259,
3
+ "</tool_call>": 128261,
4
+ "</tool_response>": 128263,
5
+ "</tools>": 128257,
6
+ "<think>": 128258,
7
+ "<tool_call>": 128260,
8
+ "<tool_response>": 128262,
9
+ "<tools>": 128256
10
  }
runs/Jun11_05-56-03_c410f4ca4dc9/events.out.tfevents.1749621366.c410f4ca4dc9.704.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50cbfa539478b1b3b7aa78f606c00e3839df86277e8094fee87cd56aff51c1f6
3
+ size 7312
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1cd8f004969d7a7c0b0d9b1c0d3335171bf05fd2e2bcf3066f780c9ad5b3fe99
3
- size 34364373
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b0fce840be951700b72e7a32fc69f6fd9e7c801029b8a0277918f8151e51ce4
3
+ size 18069535
tokenizer.model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:61a7b147390c64585d6c3543dd6fc636906c9af3865a5548f27f31aee1d4c8e2
3
- size 4241003
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c689fef08039792f515e5bcd67759b3bd73f845d8e7f0fda75471c6a103aad41
3
+ size 2124704
tokenizer_config.json CHANGED
@@ -1738,7 +1738,7 @@
1738
  "single_word": false,
1739
  "special": false
1740
  },
1741
- "255968": {
1742
  "content": "[toxicity=0]",
1743
  "lstrip": false,
1744
  "normalized": false,
@@ -1746,7 +1746,7 @@
1746
  "single_word": false,
1747
  "special": false
1748
  },
1749
- "255969": {
1750
  "content": "\t\t",
1751
  "lstrip": false,
1752
  "normalized": false,
@@ -1754,7 +1754,7 @@
1754
  "single_word": false,
1755
  "special": false
1756
  },
1757
- "255970": {
1758
  "content": "\t\t\t",
1759
  "lstrip": false,
1760
  "normalized": false,
@@ -1762,7 +1762,7 @@
1762
  "single_word": false,
1763
  "special": false
1764
  },
1765
- "255971": {
1766
  "content": "\t\t\t\t",
1767
  "lstrip": false,
1768
  "normalized": false,
@@ -1770,7 +1770,7 @@
1770
  "single_word": false,
1771
  "special": false
1772
  },
1773
- "255972": {
1774
  "content": "\t\t\t\t\t",
1775
  "lstrip": false,
1776
  "normalized": false,
@@ -1778,7 +1778,7 @@
1778
  "single_word": false,
1779
  "special": false
1780
  },
1781
- "255973": {
1782
  "content": "\t\t\t\t\t\t",
1783
  "lstrip": false,
1784
  "normalized": false,
@@ -1786,7 +1786,7 @@
1786
  "single_word": false,
1787
  "special": false
1788
  },
1789
- "255974": {
1790
  "content": "\t\t\t\t\t\t\t",
1791
  "lstrip": false,
1792
  "normalized": false,
@@ -1794,7 +1794,7 @@
1794
  "single_word": false,
1795
  "special": false
1796
  },
1797
- "255975": {
1798
  "content": "\t\t\t\t\t\t\t\t",
1799
  "lstrip": false,
1800
  "normalized": false,
@@ -1802,7 +1802,7 @@
1802
  "single_word": false,
1803
  "special": false
1804
  },
1805
- "255976": {
1806
  "content": "\t\t\t\t\t\t\t\t\t",
1807
  "lstrip": false,
1808
  "normalized": false,
@@ -1810,7 +1810,7 @@
1810
  "single_word": false,
1811
  "special": false
1812
  },
1813
- "255977": {
1814
  "content": "\t\t\t\t\t\t\t\t\t\t",
1815
  "lstrip": false,
1816
  "normalized": false,
@@ -1818,7 +1818,7 @@
1818
  "single_word": false,
1819
  "special": false
1820
  },
1821
- "255978": {
1822
  "content": "\t\t\t\t\t\t\t\t\t\t\t",
1823
  "lstrip": false,
1824
  "normalized": false,
@@ -1826,7 +1826,7 @@
1826
  "single_word": false,
1827
  "special": false
1828
  },
1829
- "255979": {
1830
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t",
1831
  "lstrip": false,
1832
  "normalized": false,
@@ -1834,7 +1834,7 @@
1834
  "single_word": false,
1835
  "special": false
1836
  },
1837
- "255980": {
1838
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t",
1839
  "lstrip": false,
1840
  "normalized": false,
@@ -1842,7 +1842,7 @@
1842
  "single_word": false,
1843
  "special": false
1844
  },
1845
- "255981": {
1846
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1847
  "lstrip": false,
1848
  "normalized": false,
@@ -1850,7 +1850,7 @@
1850
  "single_word": false,
1851
  "special": false
1852
  },
1853
- "255982": {
1854
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1855
  "lstrip": false,
1856
  "normalized": false,
@@ -1858,7 +1858,7 @@
1858
  "single_word": false,
1859
  "special": false
1860
  },
1861
- "255983": {
1862
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1863
  "lstrip": false,
1864
  "normalized": false,
@@ -1866,7 +1866,7 @@
1866
  "single_word": false,
1867
  "special": false
1868
  },
1869
- "255984": {
1870
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1871
  "lstrip": false,
1872
  "normalized": false,
@@ -1874,7 +1874,7 @@
1874
  "single_word": false,
1875
  "special": false
1876
  },
1877
- "255985": {
1878
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1879
  "lstrip": false,
1880
  "normalized": false,
@@ -1882,7 +1882,7 @@
1882
  "single_word": false,
1883
  "special": false
1884
  },
1885
- "255986": {
1886
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1887
  "lstrip": false,
1888
  "normalized": false,
@@ -1890,7 +1890,7 @@
1890
  "single_word": false,
1891
  "special": false
1892
  },
1893
- "255987": {
1894
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1895
  "lstrip": false,
1896
  "normalized": false,
@@ -1898,7 +1898,7 @@
1898
  "single_word": false,
1899
  "special": false
1900
  },
1901
- "255988": {
1902
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1903
  "lstrip": false,
1904
  "normalized": false,
@@ -1906,7 +1906,7 @@
1906
  "single_word": false,
1907
  "special": false
1908
  },
1909
- "255989": {
1910
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1911
  "lstrip": false,
1912
  "normalized": false,
@@ -1914,7 +1914,7 @@
1914
  "single_word": false,
1915
  "special": false
1916
  },
1917
- "255990": {
1918
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1919
  "lstrip": false,
1920
  "normalized": false,
@@ -1922,7 +1922,7 @@
1922
  "single_word": false,
1923
  "special": false
1924
  },
1925
- "255991": {
1926
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1927
  "lstrip": false,
1928
  "normalized": false,
@@ -1930,7 +1930,7 @@
1930
  "single_word": false,
1931
  "special": false
1932
  },
1933
- "255992": {
1934
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1935
  "lstrip": false,
1936
  "normalized": false,
@@ -1938,7 +1938,7 @@
1938
  "single_word": false,
1939
  "special": false
1940
  },
1941
- "255993": {
1942
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1943
  "lstrip": false,
1944
  "normalized": false,
@@ -1946,7 +1946,7 @@
1946
  "single_word": false,
1947
  "special": false
1948
  },
1949
- "255994": {
1950
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1951
  "lstrip": false,
1952
  "normalized": false,
@@ -1954,7 +1954,7 @@
1954
  "single_word": false,
1955
  "special": false
1956
  },
1957
- "255995": {
1958
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1959
  "lstrip": false,
1960
  "normalized": false,
@@ -1962,7 +1962,7 @@
1962
  "single_word": false,
1963
  "special": false
1964
  },
1965
- "255996": {
1966
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1967
  "lstrip": false,
1968
  "normalized": false,
@@ -1970,7 +1970,7 @@
1970
  "single_word": false,
1971
  "special": false
1972
  },
1973
- "255997": {
1974
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1975
  "lstrip": false,
1976
  "normalized": false,
@@ -1978,7 +1978,7 @@
1978
  "single_word": false,
1979
  "special": false
1980
  },
1981
- "255998": {
1982
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1983
  "lstrip": false,
1984
  "normalized": false,
@@ -1986,7 +1986,7 @@
1986
  "single_word": false,
1987
  "special": false
1988
  },
1989
- "255999": {
1990
  "content": "<unused99>",
1991
  "lstrip": false,
1992
  "normalized": false,
@@ -1994,7 +1994,7 @@
1994
  "single_word": false,
1995
  "special": false
1996
  },
1997
- "256000": {
1998
  "content": "<tools>",
1999
  "lstrip": false,
2000
  "normalized": false,
@@ -2002,7 +2002,7 @@
2002
  "single_word": false,
2003
  "special": true
2004
  },
2005
- "256001": {
2006
  "content": "</tools>",
2007
  "lstrip": false,
2008
  "normalized": false,
@@ -2010,7 +2010,7 @@
2010
  "single_word": false,
2011
  "special": true
2012
  },
2013
- "256002": {
2014
  "content": "<think>",
2015
  "lstrip": false,
2016
  "normalized": false,
@@ -2018,7 +2018,7 @@
2018
  "single_word": false,
2019
  "special": true
2020
  },
2021
- "256003": {
2022
  "content": "</think>",
2023
  "lstrip": false,
2024
  "normalized": false,
@@ -2026,7 +2026,7 @@
2026
  "single_word": false,
2027
  "special": true
2028
  },
2029
- "256004": {
2030
  "content": "<tool_call>",
2031
  "lstrip": false,
2032
  "normalized": false,
@@ -2034,7 +2034,7 @@
2034
  "single_word": false,
2035
  "special": true
2036
  },
2037
- "256005": {
2038
  "content": "</tool_call>",
2039
  "lstrip": false,
2040
  "normalized": false,
@@ -2042,7 +2042,7 @@
2042
  "single_word": false,
2043
  "special": true
2044
  },
2045
- "256006": {
2046
  "content": "<tool_response>",
2047
  "lstrip": false,
2048
  "normalized": false,
@@ -2050,7 +2050,7 @@
2050
  "single_word": false,
2051
  "special": true
2052
  },
2053
- "256007": {
2054
  "content": "</tool_response>",
2055
  "lstrip": false,
2056
  "normalized": false,
@@ -2077,8 +2077,10 @@
2077
  "extra_special_tokens": {},
2078
  "model_max_length": 1000000000000000019884624838656,
2079
  "pad_token": "<pad>",
 
2080
  "sp_model_kwargs": {},
2081
  "spaces_between_special_tokens": false,
 
2082
  "tokenizer_class": "GemmaTokenizer",
2083
  "unk_token": "<unk>",
2084
  "use_default_system_prompt": false
 
1738
  "single_word": false,
1739
  "special": false
1740
  },
1741
+ "128224": {
1742
  "content": "[toxicity=0]",
1743
  "lstrip": false,
1744
  "normalized": false,
 
1746
  "single_word": false,
1747
  "special": false
1748
  },
1749
+ "128225": {
1750
  "content": "\t\t",
1751
  "lstrip": false,
1752
  "normalized": false,
 
1754
  "single_word": false,
1755
  "special": false
1756
  },
1757
+ "128226": {
1758
  "content": "\t\t\t",
1759
  "lstrip": false,
1760
  "normalized": false,
 
1762
  "single_word": false,
1763
  "special": false
1764
  },
1765
+ "128227": {
1766
  "content": "\t\t\t\t",
1767
  "lstrip": false,
1768
  "normalized": false,
 
1770
  "single_word": false,
1771
  "special": false
1772
  },
1773
+ "128228": {
1774
  "content": "\t\t\t\t\t",
1775
  "lstrip": false,
1776
  "normalized": false,
 
1778
  "single_word": false,
1779
  "special": false
1780
  },
1781
+ "128229": {
1782
  "content": "\t\t\t\t\t\t",
1783
  "lstrip": false,
1784
  "normalized": false,
 
1786
  "single_word": false,
1787
  "special": false
1788
  },
1789
+ "128230": {
1790
  "content": "\t\t\t\t\t\t\t",
1791
  "lstrip": false,
1792
  "normalized": false,
 
1794
  "single_word": false,
1795
  "special": false
1796
  },
1797
+ "128231": {
1798
  "content": "\t\t\t\t\t\t\t\t",
1799
  "lstrip": false,
1800
  "normalized": false,
 
1802
  "single_word": false,
1803
  "special": false
1804
  },
1805
+ "128232": {
1806
  "content": "\t\t\t\t\t\t\t\t\t",
1807
  "lstrip": false,
1808
  "normalized": false,
 
1810
  "single_word": false,
1811
  "special": false
1812
  },
1813
+ "128233": {
1814
  "content": "\t\t\t\t\t\t\t\t\t\t",
1815
  "lstrip": false,
1816
  "normalized": false,
 
1818
  "single_word": false,
1819
  "special": false
1820
  },
1821
+ "128234": {
1822
  "content": "\t\t\t\t\t\t\t\t\t\t\t",
1823
  "lstrip": false,
1824
  "normalized": false,
 
1826
  "single_word": false,
1827
  "special": false
1828
  },
1829
+ "128235": {
1830
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t",
1831
  "lstrip": false,
1832
  "normalized": false,
 
1834
  "single_word": false,
1835
  "special": false
1836
  },
1837
+ "128236": {
1838
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t",
1839
  "lstrip": false,
1840
  "normalized": false,
 
1842
  "single_word": false,
1843
  "special": false
1844
  },
1845
+ "128237": {
1846
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1847
  "lstrip": false,
1848
  "normalized": false,
 
1850
  "single_word": false,
1851
  "special": false
1852
  },
1853
+ "128238": {
1854
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1855
  "lstrip": false,
1856
  "normalized": false,
 
1858
  "single_word": false,
1859
  "special": false
1860
  },
1861
+ "128239": {
1862
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1863
  "lstrip": false,
1864
  "normalized": false,
 
1866
  "single_word": false,
1867
  "special": false
1868
  },
1869
+ "128240": {
1870
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1871
  "lstrip": false,
1872
  "normalized": false,
 
1874
  "single_word": false,
1875
  "special": false
1876
  },
1877
+ "128241": {
1878
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1879
  "lstrip": false,
1880
  "normalized": false,
 
1882
  "single_word": false,
1883
  "special": false
1884
  },
1885
+ "128242": {
1886
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1887
  "lstrip": false,
1888
  "normalized": false,
 
1890
  "single_word": false,
1891
  "special": false
1892
  },
1893
+ "128243": {
1894
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1895
  "lstrip": false,
1896
  "normalized": false,
 
1898
  "single_word": false,
1899
  "special": false
1900
  },
1901
+ "128244": {
1902
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1903
  "lstrip": false,
1904
  "normalized": false,
 
1906
  "single_word": false,
1907
  "special": false
1908
  },
1909
+ "128245": {
1910
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1911
  "lstrip": false,
1912
  "normalized": false,
 
1914
  "single_word": false,
1915
  "special": false
1916
  },
1917
+ "128246": {
1918
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1919
  "lstrip": false,
1920
  "normalized": false,
 
1922
  "single_word": false,
1923
  "special": false
1924
  },
1925
+ "128247": {
1926
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1927
  "lstrip": false,
1928
  "normalized": false,
 
1930
  "single_word": false,
1931
  "special": false
1932
  },
1933
+ "128248": {
1934
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1935
  "lstrip": false,
1936
  "normalized": false,
 
1938
  "single_word": false,
1939
  "special": false
1940
  },
1941
+ "128249": {
1942
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1943
  "lstrip": false,
1944
  "normalized": false,
 
1946
  "single_word": false,
1947
  "special": false
1948
  },
1949
+ "128250": {
1950
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1951
  "lstrip": false,
1952
  "normalized": false,
 
1954
  "single_word": false,
1955
  "special": false
1956
  },
1957
+ "128251": {
1958
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1959
  "lstrip": false,
1960
  "normalized": false,
 
1962
  "single_word": false,
1963
  "special": false
1964
  },
1965
+ "128252": {
1966
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1967
  "lstrip": false,
1968
  "normalized": false,
 
1970
  "single_word": false,
1971
  "special": false
1972
  },
1973
+ "128253": {
1974
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1975
  "lstrip": false,
1976
  "normalized": false,
 
1978
  "single_word": false,
1979
  "special": false
1980
  },
1981
+ "128254": {
1982
  "content": "\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t",
1983
  "lstrip": false,
1984
  "normalized": false,
 
1986
  "single_word": false,
1987
  "special": false
1988
  },
1989
+ "128255": {
1990
  "content": "<unused99>",
1991
  "lstrip": false,
1992
  "normalized": false,
 
1994
  "single_word": false,
1995
  "special": false
1996
  },
1997
+ "128256": {
1998
  "content": "<tools>",
1999
  "lstrip": false,
2000
  "normalized": false,
 
2002
  "single_word": false,
2003
  "special": true
2004
  },
2005
+ "128257": {
2006
  "content": "</tools>",
2007
  "lstrip": false,
2008
  "normalized": false,
 
2010
  "single_word": false,
2011
  "special": true
2012
  },
2013
+ "128258": {
2014
  "content": "<think>",
2015
  "lstrip": false,
2016
  "normalized": false,
 
2018
  "single_word": false,
2019
  "special": true
2020
  },
2021
+ "128259": {
2022
  "content": "</think>",
2023
  "lstrip": false,
2024
  "normalized": false,
 
2026
  "single_word": false,
2027
  "special": true
2028
  },
2029
+ "128260": {
2030
  "content": "<tool_call>",
2031
  "lstrip": false,
2032
  "normalized": false,
 
2034
  "single_word": false,
2035
  "special": true
2036
  },
2037
+ "128261": {
2038
  "content": "</tool_call>",
2039
  "lstrip": false,
2040
  "normalized": false,
 
2042
  "single_word": false,
2043
  "special": true
2044
  },
2045
+ "128262": {
2046
  "content": "<tool_response>",
2047
  "lstrip": false,
2048
  "normalized": false,
 
2050
  "single_word": false,
2051
  "special": true
2052
  },
2053
+ "128263": {
2054
  "content": "</tool_response>",
2055
  "lstrip": false,
2056
  "normalized": false,
 
2077
  "extra_special_tokens": {},
2078
  "model_max_length": 1000000000000000019884624838656,
2079
  "pad_token": "<pad>",
2080
+ "padding_side": "right",
2081
  "sp_model_kwargs": {},
2082
  "spaces_between_special_tokens": false,
2083
+ "split_special_tokens": false,
2084
  "tokenizer_class": "GemmaTokenizer",
2085
  "unk_token": "<unk>",
2086
  "use_default_system_prompt": false
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b68d94d3a198c58b76d2e6e69908cc405b4ff886116c10e586f704d7017c4792
3
  size 6097
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16f56f0696e1d1888e4ec399da4ea04d2ee0d1af7779f1570a80a942d614ec4e
3
  size 6097