rubenz-org committed on
Commit
751eaf5
·
verified ·
1 Parent(s): 7c6529c

Training in progress, epoch 2

Browse files
README.md CHANGED
@@ -4,8 +4,8 @@ library_name: transformers
4
  model_name: gemma3_google
5
  tags:
6
  - generated_from_trainer
7
- - sft
8
  - trl
 
9
  licence: license
10
  ---
11
 
@@ -20,7 +20,7 @@ It has been trained using [TRL](https://github.com/huggingface/trl).
20
  from transformers import pipeline
21
 
22
  question = "If you had a time machine, but could only go to the past or the future once and never return, which would you choose and why?"
23
- generator = pipeline("text-generation", model="rubengerad/gemma3_google", device="cuda")
24
  output = generator([{"role": "user", "content": question}], max_new_tokens=128, return_full_text=False)[0]
25
  print(output["generated_text"])
26
  ```
 
4
  model_name: gemma3_google
5
  tags:
6
  - generated_from_trainer
 
7
  - trl
8
+ - sft
9
  licence: license
10
  ---
11
 
 
20
  from transformers import pipeline
21
 
22
  question = "If you had a time machine, but could only go to the past or the future once and never return, which would you choose and why?"
23
+ generator = pipeline("text-generation", model="rubenz-org/gemma3_google", device="cuda")
24
  output = generator([{"role": "user", "content": question}], max_new_tokens=128, return_full_text=False)[0]
25
  print(output["generated_text"])
26
  ```
config.json CHANGED
@@ -49,6 +49,6 @@
49
  "torch_dtype": "bfloat16",
50
  "transformers_version": "4.55.4",
51
  "use_bidirectional_attention": false,
52
- "use_cache": true,
53
  "vocab_size": 262144
54
  }
 
49
  "torch_dtype": "bfloat16",
50
  "transformers_version": "4.55.4",
51
  "use_bidirectional_attention": false,
52
+ "use_cache": false,
53
  "vocab_size": 262144
54
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:933ea103a5881db9afd88aeccbb3d07e2b39b88ce6911e780e25c2acf4ad90d3
3
  size 536223056
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1a675457af0c9c535cd22e1cc40239e0d81a0b614177efd1db75f9474afdfba
3
  size 536223056
runs/Oct17_03-02-21_llmsvr/events.out.tfevents.1760650345.llmsvr.220029.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa14b96086f7d297ae10600e8e8c931d5ce0d40cec11fe61e60c91baa6518036
3
+ size 9850
runs/Oct17_03-30-34_llmsvr/events.out.tfevents.1760652038.llmsvr.299567.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:839f47fcfea1f40b00ddc4c0c09180041d52d2f746f12d854e6626617b9868a8
3
+ size 87695
runs/Oct18_06-31-10_llmsvr/events.out.tfevents.1760749274.llmsvr.126427.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e378a7f05d22e65a219feeaf531cf123479f7fd0db6ec5feae0412edc0884da
3
+ size 87695
special_tokens_map.json CHANGED
@@ -8,13 +8,7 @@
8
  "single_word": false
9
  },
10
  "eoi_token": "<end_of_image>",
11
- "eos_token": {
12
- "content": "<eos>",
13
- "lstrip": false,
14
- "normalized": false,
15
- "rstrip": false,
16
- "single_word": false
17
- },
18
  "image_token": "<image_soft_token>",
19
  "pad_token": {
20
  "content": "<pad>",
 
8
  "single_word": false
9
  },
10
  "eoi_token": "<end_of_image>",
11
+ "eos_token": "<unk>",
 
 
 
 
 
 
12
  "image_token": "<image_soft_token>",
13
  "pad_token": {
14
  "content": "<pad>",
tokenizer_config.json CHANGED
@@ -51327,7 +51327,7 @@
51327
  "bos_token": "<bos>",
51328
  "clean_up_tokenization_spaces": false,
51329
  "eoi_token": "<end_of_image>",
51330
- "eos_token": "<eos>",
51331
  "extra_special_tokens": {
51332
  "boi_token": "<start_of_image>",
51333
  "eoi_token": "<end_of_image>",
 
51327
  "bos_token": "<bos>",
51328
  "clean_up_tokenization_spaces": false,
51329
  "eoi_token": "<end_of_image>",
51330
+ "eos_token": "<unk>",
51331
  "extra_special_tokens": {
51332
  "boi_token": "<start_of_image>",
51333
  "eoi_token": "<end_of_image>",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:59dcce217a2c9e923d1c7e4f7c7795e517f92a7237b7b86540aa83f176d29a2d
3
- size 6161
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be0f85e2e45442c7078bda0ad3aabc844f478387f9434edd7819c06714edf056
3
+ size 6289