aerner
/

lm-v2

@@ -1,7 +1,7 @@
 {
-  "_name_or_path": "/mnt/n/ml/models/aerner/lm-v2/checkpoint-76000",
   "architectures": [
-    "LlamaForCausalLM"
   ],
   "attention_dropout_prob": 0.1,
   "bos_token_id": 1,
@@ -12,7 +12,7 @@
   "initializer_range": 0.02,
   "intermediate_size": 11008,
   "max_position_embeddings": 2048,
-  "model_type": "llama",
   "num_attention_heads": 32,
   "num_hidden_layers": 8,
   "pad_token_id": 0,

 {
+  "_name_or_path": "/mnt/n/ml/models/aerner/lm-v2/checkpoint-76200",
   "architectures": [
+    "OpenLlamaForCausalLM"
   ],
   "attention_dropout_prob": 0.1,
   "bos_token_id": 1,
   "initializer_range": 0.02,
   "intermediate_size": 11008,
   "max_position_embeddings": 2048,
+  "model_type": "open-llama",
   "num_attention_heads": 32,
   "num_hidden_layers": 8,
   "pad_token_id": 0,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9af5ea94b7d6af2b5c99464086434f26ae3a681d767bd29674ded3b51f22336a
-size 2169864106

 version https://git-lfs.github.com/spec/v1
+oid sha256:a8c5dd165b8fc67f0aac39e7162adde3a7aae9c039b5a2d92100dfb2fd91d90d
+size 1760272621