TinyPixel committed on
Commit
e2ab2de
·
1 Parent(s): cd48d59

Upload folder using huggingface_hub

Browse files
README.md CHANGED
@@ -12,9 +12,21 @@ The following `bitsandbytes` quantization config was used during training:
12
  - llm_int8_enable_fp32_cpu_offload: False
13
  - llm_int8_has_fp16_weight: False
14
  - bnb_4bit_quant_type: nf4
15
- - bnb_4bit_use_double_quant: True
16
- - bnb_4bit_compute_dtype: float32
 
 
 
 
 
 
 
 
 
 
 
17
  ### Framework versions
18
 
 
19
 
20
- - PEFT 0.4.0
 
12
  - llm_int8_enable_fp32_cpu_offload: False
13
  - llm_int8_has_fp16_weight: False
14
  - bnb_4bit_quant_type: nf4
15
+ - bnb_4bit_use_double_quant: False
16
+ - bnb_4bit_compute_dtype: float16
17
+
18
+ The following `bitsandbytes` quantization config was used during training:
19
+ - load_in_8bit: False
20
+ - load_in_4bit: True
21
+ - llm_int8_threshold: 6.0
22
+ - llm_int8_skip_modules: None
23
+ - llm_int8_enable_fp32_cpu_offload: False
24
+ - llm_int8_has_fp16_weight: False
25
+ - bnb_4bit_quant_type: nf4
26
+ - bnb_4bit_use_double_quant: False
27
+ - bnb_4bit_compute_dtype: float16
28
  ### Framework versions
29
 
30
+ - PEFT 0.5.0.dev0
31
 
32
+ - PEFT 0.5.0.dev0
adapter_config.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "auto_mapping": null,
3
- "base_model_name_or_path": "EleutherAI/pythia-1.4b-deduped",
4
  "bias": "none",
5
  "fan_in_fan_out": false,
6
  "inference_mode": true,
7
  "init_lora_weights": true,
8
  "layers_pattern": null,
9
  "layers_to_transform": null,
10
- "lora_alpha": 16.0,
11
- "lora_dropout": 0.05,
12
  "modules_to_save": null,
13
  "peft_type": "LORA",
14
  "r": 64,
@@ -16,8 +16,8 @@
16
  "target_modules": [
17
  "query_key_value",
18
  "dense",
19
- "dense_4h_to_h",
20
- "dense_h_to_4h"
21
  ],
22
  "task_type": "CAUSAL_LM"
23
  }
 
1
  {
2
  "auto_mapping": null,
3
+ "base_model_name_or_path": "EleutherAI/pythia-1b-deduped",
4
  "bias": "none",
5
  "fan_in_fan_out": false,
6
  "inference_mode": true,
7
  "init_lora_weights": true,
8
  "layers_pattern": null,
9
  "layers_to_transform": null,
10
+ "lora_alpha": 16,
11
+ "lora_dropout": 0.1,
12
  "modules_to_save": null,
13
  "peft_type": "LORA",
14
  "r": 64,
 
16
  "target_modules": [
17
  "query_key_value",
18
  "dense",
19
+ "dense_h_to_4h",
20
+ "dense_4h_to_h"
21
  ],
22
  "task_type": "CAUSAL_LM"
23
  }
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c131d7ef0152ba05901fcc4d00eb8d3989c4ab25884d85967b687a68fe837221
3
- size 201396877
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:852b986d81ea036484e87906f30a6cd3b723f35bff5b93a8f032563db86255de
3
+ size 134264397
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0451a20c28f34735ef7dfa777a68b2a3a923bed7fac096edb2ac3b648829c015
3
- size 2050282373
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a771516865e4eb4fbb5c0c99154ed9baa398cfb231b36a1e6e77594bdd307ac9
3
+ size 268514565
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d266ddecfade7ae12d89d853bf0985517cf37a6a52c274d08548cfff0d913c51
3
- size 14511
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4dd5eab74cb3dd3f340372d749261e9eb25431fffa35a03d95317e82166525d6
3
+ size 14575
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f4880f3f40e7ab04d8efce4fc909327351c41d3ccafff780222b4189f527a9a0
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6a57ca5387433ab2e0c3edbde111c8e94d32be99ea44e5cb4defa29c730fedb
3
  size 627
special_tokens_map.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "bos_token": "<|endoftext|>",
3
  "eos_token": "<|endoftext|>",
4
- "pad_token": "[PAD]",
5
  "unk_token": "<|endoftext|>"
6
  }
 
1
  {
2
  "bos_token": "<|endoftext|>",
3
  "eos_token": "<|endoftext|>",
4
+ "pad_token": "<|endoftext|>",
5
  "unk_token": "<|endoftext|>"
6
  }
tokenizer.json CHANGED
@@ -1,6 +1,11 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
 
 
 
 
 
4
  "padding": null,
5
  "added_tokens": [
6
  {
@@ -227,15 +232,6 @@
227
  "rstrip": false,
228
  "normalized": true,
229
  "special": false
230
- },
231
- {
232
- "id": 50277,
233
- "content": "[PAD]",
234
- "single_word": false,
235
- "lstrip": false,
236
- "rstrip": false,
237
- "normalized": false,
238
- "special": true
239
  }
240
  ],
241
  "normalizer": {
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 1024,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
  "padding": null,
10
  "added_tokens": [
11
  {
 
232
  "rstrip": false,
233
  "normalized": true,
234
  "special": false
 
 
 
 
 
 
 
 
 
235
  }
236
  ],
237
  "normalizer": {
tokenizer_config.json CHANGED
@@ -4,7 +4,6 @@
4
  "clean_up_tokenization_spaces": true,
5
  "eos_token": "<|endoftext|>",
6
  "model_max_length": 1000000000000000019884624838656,
7
- "padding_side": "right",
8
  "tokenizer_class": "GPTNeoXTokenizer",
9
  "unk_token": "<|endoftext|>"
10
  }
 
4
  "clean_up_tokenization_spaces": true,
5
  "eos_token": "<|endoftext|>",
6
  "model_max_length": 1000000000000000019884624838656,
 
7
  "tokenizer_class": "GPTNeoXTokenizer",
8
  "unk_token": "<|endoftext|>"
9
  }
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:643cd8215538899410f2288daee01465ee05e777a4971bf0fec462ea7d279181
3
- size 5691
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0ff256d9d1b37b1b9f76875037fc6d6258489dcce2955aa6051fa2f9fa464ef
3
+ size 3963