IoakeimE committed on
Commit
9802694
·
verified ·
1 Parent(s): 44262bc

Training in progress, epoch 1

Browse files
README.md CHANGED
@@ -1,18 +1,18 @@
1
  ---
2
- base_model: unsloth/mistral-7b-instruct-v0.3-bnb-4bit
3
  library_name: transformers
4
  model_name: sft_best_simplification
5
  tags:
6
  - generated_from_trainer
7
- - unsloth
8
  - trl
 
9
  - sft
10
  licence: license
11
  ---
12
 
13
  # Model Card for sft_best_simplification
14
 
15
- This model is a fine-tuned version of [unsloth/mistral-7b-instruct-v0.3-bnb-4bit](https://huggingface.co/unsloth/mistral-7b-instruct-v0.3-bnb-4bit).
16
  It has been trained using [TRL](https://github.com/huggingface/trl).
17
 
18
  ## Quick start
@@ -28,7 +28,7 @@ print(output["generated_text"])
28
 
29
  ## Training procedure
30
 
31
- [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/ioakeime-aristotle-university-of-thessaloniki/sft_best_simplification/runs/9amgp9pe)
32
 
33
 
34
  This model was trained with SFT.
 
1
  ---
2
+ base_model: unsloth/mistral-7b-v0.3-bnb-4bit
3
  library_name: transformers
4
  model_name: sft_best_simplification
5
  tags:
6
  - generated_from_trainer
 
7
  - trl
8
+ - unsloth
9
  - sft
10
  licence: license
11
  ---
12
 
13
  # Model Card for sft_best_simplification
14
 
15
+ This model is a fine-tuned version of [unsloth/mistral-7b-v0.3-bnb-4bit](https://huggingface.co/unsloth/mistral-7b-v0.3-bnb-4bit).
16
  It has been trained using [TRL](https://github.com/huggingface/trl).
17
 
18
  ## Quick start
 
28
 
29
  ## Training procedure
30
 
31
+ [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/ioakeime-aristotle-university-of-thessaloniki/sft_best_simplification/runs/kc6lw27s)
32
 
33
 
34
  This model was trained with SFT.
adapter_config.json CHANGED
@@ -7,7 +7,7 @@
7
  "parent_library": "transformers.models.mistral.modeling_mistral",
8
  "unsloth_fixed": true
9
  },
10
- "base_model_name_or_path": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
11
  "bias": "none",
12
  "corda_config": null,
13
  "ensure_weight_tying": false,
@@ -33,13 +33,13 @@
33
  "rank_pattern": {},
34
  "revision": null,
35
  "target_modules": [
36
- "o_proj",
 
37
  "down_proj",
38
  "v_proj",
39
  "k_proj",
40
- "q_proj",
41
  "gate_proj",
42
- "up_proj"
43
  ],
44
  "target_parameters": null,
45
  "task_type": "CAUSAL_LM",
 
7
  "parent_library": "transformers.models.mistral.modeling_mistral",
8
  "unsloth_fixed": true
9
  },
10
+ "base_model_name_or_path": "unsloth/mistral-7b-v0.3-bnb-4bit",
11
  "bias": "none",
12
  "corda_config": null,
13
  "ensure_weight_tying": false,
 
33
  "rank_pattern": {},
34
  "revision": null,
35
  "target_modules": [
36
+ "up_proj",
37
+ "q_proj",
38
  "down_proj",
39
  "v_proj",
40
  "k_proj",
 
41
  "gate_proj",
42
+ "o_proj"
43
  ],
44
  "target_parameters": null,
45
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d8264ef51349540391c8791d34755db267ace4ed3577d90965629495a6ee8544
3
  size 167832240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c191500666a73afc7b36b3ae7277329f9cf35396f5c021a71ed8f7acd8aa3ba
3
  size 167832240
tokenizer_config.json CHANGED
@@ -6179,7 +6179,7 @@
6179
  "legacy": false,
6180
  "model_max_length": 32768,
6181
  "pad_token": "[control_768]",
6182
- "padding_side": "left",
6183
  "sp_model_kwargs": {},
6184
  "spaces_between_special_tokens": false,
6185
  "tokenizer_class": "LlamaTokenizer",
 
6179
  "legacy": false,
6180
  "model_max_length": 32768,
6181
  "pad_token": "[control_768]",
6182
+ "padding_side": "right",
6183
  "sp_model_kwargs": {},
6184
  "spaces_between_special_tokens": false,
6185
  "tokenizer_class": "LlamaTokenizer",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91b195bbee031377a98da390b75c70b5f638541cb5f65dfa6119007797723266
3
  size 6353
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c40cf0f3fb04a0ff90a766e83b9ee7fcc9800df8b0bf374934d3bf32257ed7ff
3
  size 6353