jkgl committed on
Commit
a220365
·
verified ·
1 Parent(s): 958425a

Initial Bitnet-SFT run

Browse files
Files changed (4) hide show
  1. config.json +0 -1
  2. generation_config.json +2 -5
  3. model.safetensors +1 -1
  4. tokenizer.json +2 -16
config.json CHANGED
@@ -16,7 +16,6 @@
16
  "max_position_embeddings": 1024,
17
  "mlp_bias": false,
18
  "model_type": "llama",
19
- "n_ctx": 1024,
20
  "num_attention_heads": 2,
21
  "num_hidden_layers": 1,
22
  "num_key_value_heads": 1,
 
16
  "max_position_embeddings": 1024,
17
  "mlp_bias": false,
18
  "model_type": "llama",
 
19
  "num_attention_heads": 2,
20
  "num_hidden_layers": 1,
21
  "num_key_value_heads": 1,
generation_config.json CHANGED
@@ -1,10 +1,7 @@
1
  {
2
  "_from_model_config": true,
3
  "bos_token_id": 1,
4
- "do_sample": true,
5
  "eos_token_id": 2,
6
- "max_length": 1000000000000,
7
- "temperature": 0.8,
8
- "top_p": 0.95,
9
- "transformers_version": "4.52.2"
10
  }
 
1
  {
2
  "_from_model_config": true,
3
  "bos_token_id": 1,
 
4
  "eos_token_id": 2,
5
+ "transformers_version": "4.52.2",
6
+ "use_cache": false
 
 
7
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9c0b12eaec6d240985dec3bb2a056758ef34b2b16e4304e366832266a783c55
3
  size 51977872
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3de4db08c1b06b8d5402ca3c5b92bf8d9f953b7f3a75ea21a30f46c5f682ae94
3
  size 51977872
tokenizer.json CHANGED
@@ -1,21 +1,7 @@
1
  {
2
  "version": "1.0",
3
- "truncation": {
4
- "direction": "Right",
5
- "max_length": 1024,
6
- "strategy": "LongestFirst",
7
- "stride": 0
8
- },
9
- "padding": {
10
- "strategy": {
11
- "Fixed": 1024
12
- },
13
- "direction": "Left",
14
- "pad_to_multiple_of": null,
15
- "pad_id": 2,
16
- "pad_type_id": 0,
17
- "pad_token": "</s>"
18
- },
19
  "added_tokens": [
20
  {
21
  "id": 0,
 
1
  {
2
  "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 0,