Striker-7 committed on
Commit
e89435b
·
verified ·
1 Parent(s): 63cb577
README.md CHANGED
@@ -7,14 +7,14 @@ tags:
7
  - generated_from_trainer
8
  base_model: microsoft/Phi-3-mini-4k-instruct
9
  model-index:
10
- - name: phi3
11
  results: []
12
  ---
13
 
14
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
15
  should probably proofread and complete it, then remove this comment. -->
16
 
17
- # phi3
18
 
19
  This model is a fine-tuned version of [microsoft/Phi-3-mini-4k-instruct](https://huggingface.co/microsoft/Phi-3-mini-4k-instruct) on an unknown dataset.
20
 
@@ -52,7 +52,7 @@ The following hyperparameters were used during training:
52
  ### Framework versions
53
 
54
  - PEFT 0.11.1
55
- - Transformers 4.42.3
56
  - Pytorch 2.1.2
57
  - Datasets 2.20.0
58
  - Tokenizers 0.19.1
 
7
  - generated_from_trainer
8
  base_model: microsoft/Phi-3-mini-4k-instruct
9
  model-index:
10
+ - name: elephi3
11
  results: []
12
  ---
13
 
14
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
15
  should probably proofread and complete it, then remove this comment. -->
16
 
17
+ # elephi3
18
 
19
  This model is a fine-tuned version of [microsoft/Phi-3-mini-4k-instruct](https://huggingface.co/microsoft/Phi-3-mini-4k-instruct) on an unknown dataset.
20
 
 
52
  ### Framework versions
53
 
54
  - PEFT 0.11.1
55
+ - Transformers 4.42.4
56
  - Pytorch 2.1.2
57
  - Datasets 2.20.0
58
  - Tokenizers 0.19.1
adapter_config.json CHANGED
@@ -20,11 +20,11 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "o_proj",
24
  "down_proj",
25
  "gate_up_proj",
26
- "embed_tokens",
27
- "qkv_proj"
28
  ],
29
  "task_type": "CAUSAL_LM",
30
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "qkv_proj",
24
  "down_proj",
25
  "gate_up_proj",
26
+ "o_proj",
27
+ "embed_tokens"
28
  ],
29
  "task_type": "CAUSAL_LM",
30
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:005ddc8a510ec0191faa1cd3876b22d6f921c0ecd1a7086cdae20fbd4779050c
3
  size 496949808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:728420ba06e737e9a69c8b7511479aaa75ac3b6365d487f99d61b6e8d5ea5fa9
3
  size 496949808
tokenizer.json CHANGED
@@ -2,7 +2,7 @@
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
- "max_length": 2048,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
 
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
+ "max_length": 200,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1080a01b32f3081a6496eb343a90ca037ebaeedb38fa916277a702a4fdf21d9e
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d25b21726b13a6ee7654f7d33cbe9fd05fc7899c90b5176ec974878adeab89e
3
  size 5368