Training in progress, step 10

Files changed (12) hide show

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "mistralai/Mistral-7B-Instruct-v0.1",
   "architectures": [
     "MistralForCausalLM"
   ],
@@ -17,11 +17,11 @@
   "num_hidden_layers": 32,
   "num_key_value_heads": 8,
   "rms_norm_eps": 1e-05,
-  "rope_theta": 10000.0,
-  "sliding_window": 4096,
   "tie_word_embeddings": false,
   "torch_dtype": "float32",
   "transformers_version": "4.49.0",
   "use_cache": true,
-  "vocab_size": 32000
 }

 {
+  "_name_or_path": "mistralai/Mistral-7B-Instruct-v0.3",
   "architectures": [
     "MistralForCausalLM"
   ],
   "num_hidden_layers": 32,
   "num_key_value_heads": 8,
   "rms_norm_eps": 1e-05,
+  "rope_theta": 1000000.0,
+  "sliding_window": null,
   "tie_word_embeddings": false,
   "torch_dtype": "float32",
   "transformers_version": "4.49.0",
   "use_cache": true,
+  "vocab_size": 32768
 }

model-00001-of-00006.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2edfc4667afc0bd69d37eeea36075303589b67c106632e80f1ae3961e5796e54
-size 4987196936

 version https://git-lfs.github.com/spec/v1
+oid sha256:11e1c04d69a35a4a33bf0b3d8a0432ec642b1e1ba76c9c555cc0c3b60ec80246
+size 4999779856

model-00002-of-00006.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d2203390edfb38ef618e66d0d556676c426d4f02a48d82267a211fa252635c31
 size 4899116440

 version https://git-lfs.github.com/spec/v1
+oid sha256:4160266844d5050bc9de13dc5c303d1cb52a8339ae480592355636ac6abf4d89
 size 4899116440

model-00003-of-00006.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c59f37f090d3a219fb897ff58ecd0eee0eb53527350cfebf17cbb2a94bd7796d
 size 4999813120

 version https://git-lfs.github.com/spec/v1
+oid sha256:6e03df78cd63e2bc788bc4d2bb9bdb86877ba4b9c4b00b95585bc2bc3faefe2c
 size 4999813120

model-00004-of-00006.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0ae65b450d36a5143e0ccec93d2838f372c4e6df3c600ad0d531b07819859f35
 size 4999813128

 version https://git-lfs.github.com/spec/v1
+oid sha256:681a3fe1af5ca8941ccedc816af9e69004e3ea28f7aadb6eeae7878713033016
 size 4999813128

model-00005-of-00006.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1295692670156e06e61af502b326bfba49f5b98c778ecf52c446b639ddc2c308
 size 4832007496

 version https://git-lfs.github.com/spec/v1
+oid sha256:62f8d7e77e5a356d66534a4e28fcb2bf355f8f173d94619eecc103feec6f8236
 size 4832007496

model-00006-of-00006.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f4e388769618badcbd053411a991d5cb9918bea8603a691e8879850c30492128
-size 4249014896

 version https://git-lfs.github.com/spec/v1
+oid sha256:937928e6ef4fbd9b2c9a628b18a6485ef165890232a6b7d56b7b75a2f246f137
+size 4261597808

model.safetensors.index.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "metadata": {
-    "total_size": 28966928384
   },
   "weight_map": {
     "lm_head.weight": "model-00006-of-00006.safetensors",

 {
   "metadata": {
+    "total_size": 28992094208
   },
   "weight_map": {
     "lm_head.weight": "model-00006-of-00006.safetensors",

tokenizer.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

tokenizer.model CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dadfd56d766715c61d2ef780a525ab43b8e6da4de6865bda3d95fdef5e134055
-size 493443

 version https://git-lfs.github.com/spec/v1
+oid sha256:37f00374dea48658ee8f5d0f21895b9bc55cb0103939607c8185bfd1c6ca1f89
+size 587404

tokenizer_config.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a159a2cf6abdb90e18161c6b45f24b006ec2eb2623664ffef18ace0deb326e20
 size 5496

 version https://git-lfs.github.com/spec/v1
+oid sha256:fc4e1de7bf877d06d8b499c9a257b16871c71fe7c27379c12dbc64644d9216c5
 size 5496