ASTRALK committed on
Commit
73701ee
·
verified ·
1 Parent(s): b99a90c

sft merged

Browse files
Files changed (4) hide show
  1. README.md +3 -1
  2. config.json +2 -2
  3. generation_config.json +6 -2
  4. model.safetensors +2 -2
README.md CHANGED
@@ -1,6 +1,8 @@
1
  ---
2
  library_name: transformers
3
- tags: []
 
 
4
  ---
5
 
6
  # Model Card for Model ID
 
1
  ---
2
  library_name: transformers
3
+ tags:
4
+ - trl
5
+ - sft
6
  ---
7
 
8
  # Model Card for Model ID
config.json CHANGED
@@ -7,7 +7,7 @@
7
  "attn_output_gate": true,
8
  "bos_token_id": null,
9
  "dtype": "bfloat16",
10
- "eos_token_id": 248044,
11
  "full_attention_interval": 4,
12
  "head_dim": 256,
13
  "hidden_act": "silu",
@@ -84,7 +84,7 @@
84
  "rope_type": "default"
85
  },
86
  "tie_word_embeddings": true,
87
- "transformers_version": "5.5.0",
88
  "use_cache": false,
89
  "vocab_size": 248320
90
  }
 
7
  "attn_output_gate": true,
8
  "bos_token_id": null,
9
  "dtype": "bfloat16",
10
+ "eos_token_id": 248046,
11
  "full_attention_interval": 4,
12
  "head_dim": 256,
13
  "hidden_act": "silu",
 
84
  "rope_type": "default"
85
  },
86
  "tie_word_embeddings": true,
87
+ "transformers_version": "5.5.2",
88
  "use_cache": false,
89
  "vocab_size": 248320
90
  }
generation_config.json CHANGED
@@ -1,6 +1,10 @@
1
  {
2
  "_from_model_config": true,
3
- "eos_token_id": 248044,
4
- "transformers_version": "5.5.0",
 
 
 
 
5
  "use_cache": true
6
  }
 
1
  {
2
  "_from_model_config": true,
3
+ "eos_token_id": [
4
+ 248046,
5
+ 248044
6
+ ],
7
+ "pad_token_id": 248044,
8
+ "transformers_version": "5.5.2",
9
  "use_cache": true
10
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0a9b2f88ebc5a2588421a7ec100701bcbaf8dfef1cac782961a2e4ecdd41b029
3
- size 1726761609
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5049f505114b491760684e36accb9edecb37d739170002b00f99c57392536ed
3
+ size 1726761639