TessWOfficial committed on
Commit
8c5f05e
·
verified ·
1 Parent(s): ef059a8

Training in progress, epoch 1

Browse files
adapter_config.json CHANGED
@@ -3,6 +3,7 @@
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "google/gemma-3-4b-pt",
5
  "bias": "none",
 
6
  "eva_config": null,
7
  "exclude_modules": null,
8
  "fan_in_fan_out": false,
@@ -27,18 +28,18 @@
27
  "revision": null,
28
  "target_modules": [
29
  "o_proj",
30
- "up_proj",
31
- "fc1",
32
  "v_proj",
33
- "out_proj",
34
- "gate_proj",
35
  "k_proj",
 
36
  "fc2",
37
- "lm_head",
38
- "q_proj",
39
- "down_proj"
 
 
40
  ],
41
  "task_type": "CAUSAL_LM",
 
42
  "use_dora": false,
43
  "use_rslora": false
44
  }
 
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "google/gemma-3-4b-pt",
5
  "bias": "none",
6
+ "corda_config": null,
7
  "eva_config": null,
8
  "exclude_modules": null,
9
  "fan_in_fan_out": false,
 
28
  "revision": null,
29
  "target_modules": [
30
  "o_proj",
 
 
31
  "v_proj",
 
 
32
  "k_proj",
33
+ "up_proj",
34
  "fc2",
35
+ "down_proj",
36
+ "gate_proj",
37
+ "fc1",
38
+ "out_proj",
39
+ "q_proj"
40
  ],
41
  "task_type": "CAUSAL_LM",
42
+ "trainable_token_indices": null,
43
  "use_dora": false,
44
  "use_rslora": false
45
  }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f41253ec07583eab99a0583d49f36af16125c31d7090941b28e0c70ab216df8a
3
- size 2839124552
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c271c0068f609e88d5d65c862cbe875d741308348edbacd3fd423ed46ba88241
3
+ size 2839126480
chat_template.jinja ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {{ bos_token }}
2
+ {%- if messages[0]['role'] == 'system' -%}
3
+ {%- if messages[0]['content'] is string -%}
4
+ {%- set first_user_prefix = messages[0]['content'] + '
5
+
6
+ ' -%}
7
+ {%- else -%}
8
+ {%- set first_user_prefix = messages[0]['content'][0]['text'] + '
9
+
10
+ ' -%}
11
+ {%- endif -%}
12
+ {%- set loop_messages = messages[1:] -%}
13
+ {%- else -%}
14
+ {%- set first_user_prefix = "" -%}
15
+ {%- set loop_messages = messages -%}
16
+ {%- endif -%}
17
+ {%- for message in loop_messages -%}
18
+ {%- if (message['role'] == 'user') != (loop.index0 % 2 == 0) -%}
19
+ {{ raise_exception("Conversation roles must alternate user/assistant/user/assistant/...") }}
20
+ {%- endif -%}
21
+ {%- if (message['role'] == 'assistant') -%}
22
+ {%- set role = "model" -%}
23
+ {%- else -%}
24
+ {%- set role = message['role'] -%}
25
+ {%- endif -%}
26
+ {{ '<start_of_turn>' + role + '
27
+ ' + (first_user_prefix if loop.first else "") }}
28
+ {%- if message['content'] is string -%}
29
+ {{ message['content'] | trim }}
30
+ {%- elif message['content'] is iterable -%}
31
+ {%- for item in message['content'] -%}
32
+ {%- if item['type'] == 'image' -%}
33
+ {{ '<start_of_image>' }}
34
+ {%- elif item['type'] == 'text' -%}
35
+ {{ item['text'] | trim }}
36
+ {%- endif -%}
37
+ {%- endfor -%}
38
+ {%- else -%}
39
+ {{ raise_exception("Invalid content type") }}
40
+ {%- endif -%}
41
+ {{ '<end_of_turn>
42
+ ' }}
43
+ {%- endfor -%}
44
+ {%- if add_generation_prompt -%}
45
+ {{'<start_of_turn>model
46
+ '}}
47
+ {%- endif -%}
runs/May22_14-24-06_verb-workspace/events.out.tfevents.1747923915.verb-workspace.4814.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c5cfa8a84666b6c0aa0d0c5a6d7712843095ba2f86967ebf8e4dfd116d7c3bf
3
+ size 20494
runs/May22_14-29-40_verb-workspace/events.out.tfevents.1747924203.verb-workspace.6545.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62f0d95d449d5e03330ffb7efbfef5d662ab40be90d62e50a372197850bce458
3
+ size 6890
runs/May22_14-31-34_verb-workspace/events.out.tfevents.1747924310.verb-workspace.6545.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:667f710228cbcdf642dd41c8123f547dd81c8d05c90f195a7bc80785a969a0ed
3
+ size 6889
runs/May22_14-33-24_verb-workspace/events.out.tfevents.1747924408.verb-workspace.7730.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26537ba55e212de6202ce460751145721594404ed751e122918c23c7005c0637
3
+ size 8185
tokenizer_config.json CHANGED
@@ -51325,7 +51325,6 @@
51325
  },
51326
  "boi_token": "<start_of_image>",
51327
  "bos_token": "<bos>",
51328
- "chat_template": "{{ bos_token }}\n{%- if messages[0]['role'] == 'system' -%}\n {%- if messages[0]['content'] is string -%}\n {%- set first_user_prefix = messages[0]['content'] + '\n\n' -%}\n {%- else -%}\n {%- set first_user_prefix = messages[0]['content'][0]['text'] + '\n\n' -%}\n {%- endif -%}\n {%- set loop_messages = messages[1:] -%}\n{%- else -%}\n {%- set first_user_prefix = \"\" -%}\n {%- set loop_messages = messages -%}\n{%- endif -%}\n{%- for message in loop_messages -%}\n {%- if (message['role'] == 'user') != (loop.index0 % 2 == 0) -%}\n {{ raise_exception(\"Conversation roles must alternate user/assistant/user/assistant/...\") }}\n {%- endif -%}\n {%- if (message['role'] == 'assistant') -%}\n {%- set role = \"model\" -%}\n {%- else -%}\n {%- set role = message['role'] -%}\n {%- endif -%}\n {{ '<start_of_turn>' + role + '\n' + (first_user_prefix if loop.first else \"\") }}\n {%- if message['content'] is string -%}\n {{ message['content'] | trim }}\n {%- elif message['content'] is iterable -%}\n {%- for item in message['content'] -%}\n {%- if item['type'] == 'image' -%}\n {{ '<start_of_image>' }}\n {%- elif item['type'] == 'text' -%}\n {{ item['text'] | trim }}\n {%- endif -%}\n {%- endfor -%}\n {%- else -%}\n {{ raise_exception(\"Invalid content type\") }}\n {%- endif -%}\n {{ '<end_of_turn>\n' }}\n{%- endfor -%}\n{%- if add_generation_prompt -%}\n {{'<start_of_turn>model\n'}}\n{%- endif -%}\n",
51329
  "clean_up_tokenization_spaces": false,
51330
  "eoi_token": "<end_of_image>",
51331
  "eos_token": "<eos>",
 
51325
  },
51326
  "boi_token": "<start_of_image>",
51327
  "bos_token": "<bos>",
 
51328
  "clean_up_tokenization_spaces": false,
51329
  "eoi_token": "<end_of_image>",
51330
  "eos_token": "<eos>",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96096c19fe23082a1d6d724880bedd9775db1008175d7759442208c7832475ad
3
- size 6097
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e72bd333eae003f26a166608024131db03306aafb5ea416bd35d48a72859f3f4
3
+ size 6161