Training in progress, epoch 0
Browse files
adapter_config.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
{
|
| 2 |
"alpha_pattern": {},
|
| 3 |
"auto_mapping": null,
|
| 4 |
-
"base_model_name_or_path": "
|
| 5 |
"bias": "none",
|
| 6 |
"fan_in_fan_out": false,
|
| 7 |
"inference_mode": true,
|
|
|
|
| 1 |
{
|
| 2 |
"alpha_pattern": {},
|
| 3 |
"auto_mapping": null,
|
| 4 |
+
"base_model_name_or_path": "hishab/titulm-llama-3.2-1b-v1.0",
|
| 5 |
"bias": "none",
|
| 6 |
"fan_in_fan_out": false,
|
| 7 |
"inference_mode": true,
|
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1772140424
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4ae5d9cc5e7137165e092f5b5121d894718e2869a6a668eb595137a8ac47b5e1
|
| 3 |
size 1772140424
|
runs/Mar06_09-46-31_cc3e83913ab1/events.out.tfevents.1741254436.cc3e83913ab1.320.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:55c12557db9e897f1504e22275a02cc4c5aa69d6dcbd121af2a64754d9f520a5
|
| 3 |
+
size 6050
|
tokenizer_config.json
CHANGED
|
@@ -2073,15 +2073,13 @@
|
|
| 2073 |
"chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
|
| 2074 |
"clean_up_tokenization_spaces": true,
|
| 2075 |
"eos_token": "<|im_end|>",
|
| 2076 |
-
"max_length": 131072,
|
| 2077 |
"model_input_names": [
|
| 2078 |
"input_ids",
|
| 2079 |
"attention_mask"
|
| 2080 |
],
|
| 2081 |
"model_max_length": 131072,
|
| 2082 |
"pad_token": "<|im_end|>",
|
| 2083 |
-
"
|
| 2084 |
-
"
|
| 2085 |
-
"
|
| 2086 |
-
"truncation_strategy": "longest_first"
|
| 2087 |
}
|
|
|
|
| 2073 |
"chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
|
| 2074 |
"clean_up_tokenization_spaces": true,
|
| 2075 |
"eos_token": "<|im_end|>",
|
|
|
|
| 2076 |
"model_input_names": [
|
| 2077 |
"input_ids",
|
| 2078 |
"attention_mask"
|
| 2079 |
],
|
| 2080 |
"model_max_length": 131072,
|
| 2081 |
"pad_token": "<|im_end|>",
|
| 2082 |
+
"padding_side": "right",
|
| 2083 |
+
"split_special_tokens": false,
|
| 2084 |
+
"tokenizer_class": "PreTrainedTokenizerFast"
|
|
|
|
| 2085 |
}
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5496
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8784e38c64949757b034e8b037e4ee5882214ce066778485b79d7d471c2be322
|
| 3 |
size 5496
|