DariaaaS committed on
Commit
7757096
·
verified ·
1 Parent(s): 137931a

Training in progress, step 10

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "mistralai/Mistral-7B-Instruct-v0.1",
3
  "architectures": [
4
  "MistralForCausalLM"
5
  ],
@@ -17,11 +17,11 @@
17
  "num_hidden_layers": 32,
18
  "num_key_value_heads": 8,
19
  "rms_norm_eps": 1e-05,
20
- "rope_theta": 10000.0,
21
- "sliding_window": 4096,
22
  "tie_word_embeddings": false,
23
  "torch_dtype": "float32",
24
  "transformers_version": "4.49.0",
25
  "use_cache": true,
26
- "vocab_size": 32000
27
  }
 
1
  {
2
+ "_name_or_path": "mistralai/Mistral-7B-Instruct-v0.3",
3
  "architectures": [
4
  "MistralForCausalLM"
5
  ],
 
17
  "num_hidden_layers": 32,
18
  "num_key_value_heads": 8,
19
  "rms_norm_eps": 1e-05,
20
+ "rope_theta": 1000000.0,
21
+ "sliding_window": null,
22
  "tie_word_embeddings": false,
23
  "torch_dtype": "float32",
24
  "transformers_version": "4.49.0",
25
  "use_cache": true,
26
+ "vocab_size": 32768
27
  }
model-00001-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2edfc4667afc0bd69d37eeea36075303589b67c106632e80f1ae3961e5796e54
3
- size 4987196936
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11e1c04d69a35a4a33bf0b3d8a0432ec642b1e1ba76c9c555cc0c3b60ec80246
3
+ size 4999779856
model-00002-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d2203390edfb38ef618e66d0d556676c426d4f02a48d82267a211fa252635c31
3
  size 4899116440
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4160266844d5050bc9de13dc5c303d1cb52a8339ae480592355636ac6abf4d89
3
  size 4899116440
model-00003-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c59f37f090d3a219fb897ff58ecd0eee0eb53527350cfebf17cbb2a94bd7796d
3
  size 4999813120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e03df78cd63e2bc788bc4d2bb9bdb86877ba4b9c4b00b95585bc2bc3faefe2c
3
  size 4999813120
model-00004-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0ae65b450d36a5143e0ccec93d2838f372c4e6df3c600ad0d531b07819859f35
3
  size 4999813128
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:681a3fe1af5ca8941ccedc816af9e69004e3ea28f7aadb6eeae7878713033016
3
  size 4999813128
model-00005-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1295692670156e06e61af502b326bfba49f5b98c778ecf52c446b639ddc2c308
3
  size 4832007496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62f8d7e77e5a356d66534a4e28fcb2bf355f8f173d94619eecc103feec6f8236
3
  size 4832007496
model-00006-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f4e388769618badcbd053411a991d5cb9918bea8603a691e8879850c30492128
3
- size 4249014896
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:937928e6ef4fbd9b2c9a628b18a6485ef165890232a6b7d56b7b75a2f246f137
3
+ size 4261597808
model.safetensors.index.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "metadata": {
3
- "total_size": 28966928384
4
  },
5
  "weight_map": {
6
  "lm_head.weight": "model-00006-of-00006.safetensors",
 
1
  {
2
  "metadata": {
3
+ "total_size": 28992094208
4
  },
5
  "weight_map": {
6
  "lm_head.weight": "model-00006-of-00006.safetensors",
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer.model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dadfd56d766715c61d2ef780a525ab43b8e6da4de6865bda3d95fdef5e134055
3
- size 493443
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37f00374dea48658ee8f5d0f21895b9bc55cb0103939607c8185bfd1c6ca1f89
3
+ size 587404
tokenizer_config.json CHANGED
The diff for this file is too large to render. See raw diff
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a159a2cf6abdb90e18161c6b45f24b006ec2eb2623664ffef18ace0deb326e20
3
  size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc4e1de7bf877d06d8b499c9a257b16871c71fe7c27379c12dbc64644d9216c5
3
  size 5496