Training in progress, epoch 2

Files changed (9) hide show

README.md CHANGED Viewed

@@ -4,8 +4,8 @@ library_name: transformers
 model_name: gemma3_google
 tags:
 - generated_from_trainer
-- sft
 - trl
 licence: license
 ---
@@ -20,7 +20,7 @@ It has been trained using [TRL](https://github.com/huggingface/trl).
 from transformers import pipeline
 question = "If you had a time machine, but could only go to the past or the future once and never return, which would you choose and why?"
-generator = pipeline("text-generation", model="rubengerad/gemma3_google", device="cuda")
 output = generator([{"role": "user", "content": question}], max_new_tokens=128, return_full_text=False)[0]
 print(output["generated_text"])
 ```

 model_name: gemma3_google
 tags:
 - generated_from_trainer
 - trl
+- sft
 licence: license
 ---
 from transformers import pipeline
 question = "If you had a time machine, but could only go to the past or the future once and never return, which would you choose and why?"
+generator = pipeline("text-generation", model="rubenz-org/gemma3_google", device="cuda")
 output = generator([{"role": "user", "content": question}], max_new_tokens=128, return_full_text=False)[0]
 print(output["generated_text"])
 ```

config.json CHANGED Viewed

@@ -49,6 +49,6 @@
   "torch_dtype": "bfloat16",
   "transformers_version": "4.55.4",
   "use_bidirectional_attention": false,
-  "use_cache": true,
   "vocab_size": 262144
 }

   "torch_dtype": "bfloat16",
   "transformers_version": "4.55.4",
   "use_bidirectional_attention": false,
+  "use_cache": false,
   "vocab_size": 262144
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:933ea103a5881db9afd88aeccbb3d07e2b39b88ce6911e780e25c2acf4ad90d3
 size 536223056

 version https://git-lfs.github.com/spec/v1
+oid sha256:d1a675457af0c9c535cd22e1cc40239e0d81a0b614177efd1db75f9474afdfba
 size 536223056

runs/Oct17_03-02-21_llmsvr/events.out.tfevents.1760650345.llmsvr.220029.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:aa14b96086f7d297ae10600e8e8c931d5ce0d40cec11fe61e60c91baa6518036
+size 9850

runs/Oct17_03-30-34_llmsvr/events.out.tfevents.1760652038.llmsvr.299567.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:839f47fcfea1f40b00ddc4c0c09180041d52d2f746f12d854e6626617b9868a8
+size 87695

runs/Oct18_06-31-10_llmsvr/events.out.tfevents.1760749274.llmsvr.126427.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:7e378a7f05d22e65a219feeaf531cf123479f7fd0db6ec5feae0412edc0884da
+size 87695

special_tokens_map.json CHANGED Viewed

@@ -8,13 +8,7 @@
     "single_word": false
   },
   "eoi_token": "<end_of_image>",
-  "eos_token": {
-    "content": "<eos>",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
   "image_token": "<image_soft_token>",
   "pad_token": {
     "content": "<pad>",

     "single_word": false
   },
   "eoi_token": "<end_of_image>",
+  "eos_token": "<unk>",
   "image_token": "<image_soft_token>",
   "pad_token": {
     "content": "<pad>",

tokenizer_config.json CHANGED Viewed

@@ -51327,7 +51327,7 @@
   "bos_token": "<bos>",
   "clean_up_tokenization_spaces": false,
   "eoi_token": "<end_of_image>",
-  "eos_token": "<eos>",
   "extra_special_tokens": {
     "boi_token": "<start_of_image>",
     "eoi_token": "<end_of_image>",

   "bos_token": "<bos>",
   "clean_up_tokenization_spaces": false,
   "eoi_token": "<end_of_image>",
+  "eos_token": "<unk>",
   "extra_special_tokens": {
     "boi_token": "<start_of_image>",
     "eoi_token": "<end_of_image>",

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:59dcce217a2c9e923d1c7e4f7c7795e517f92a7237b7b86540aa83f176d29a2d
-size 6161

 version https://git-lfs.github.com/spec/v1
+oid sha256:be0f85e2e45442c7078bda0ad3aabc844f478387f9434edd7819c06714edf056
+size 6289