Text Generation
Transformers
PyTorch
TensorBoard
Safetensors
bloom
Eval Results (legacy)
text-generation-inference
Instructions to use bigscience/bloomz with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Transformers
How to use bigscience/bloomz with Transformers:
# Use a pipeline as a high-level helper
from transformers import pipeline

pipe = pipeline("text-generation", model="bigscience/bloomz")

# Load model directly
from transformers import AutoTokenizer, AutoModelForCausalLM

tokenizer = AutoTokenizer.from_pretrained("bigscience/bloomz")
model = AutoModelForCausalLM.from_pretrained("bigscience/bloomz")
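Continuing from the snippet above, a minimal generation sketch; the prompt and generation settings here are illustrative assumptions, not values from the model card:

# Generate with the pipeline loaded above (illustrative prompt and settings).
result = pipe("Translate to English: Je t'aime.", max_new_tokens=20)
print(result[0]["generated_text"])

# Equivalent call with the tokenizer/model pair loaded above.
inputs = tokenizer("Translate to English: Je t'aime.", return_tensors="pt")
outputs = model.generate(**inputs, max_new_tokens=20)
print(tokenizer.decode(outputs[0]))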
- Notebooks
- Google Colab
- Kaggle
- Local Apps
- vLLM
How to use bigscience/bloomz with vLLM:
Install from pip and serve the model:
# Install vLLM from pip:
pip install vllm

# Start the vLLM server:
vllm serve "bigscience/bloomz"

# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:8000/v1/completions" \
    -H "Content-Type: application/json" \
    --data '{
        "model": "bigscience/bloomz",
        "prompt": "Once upon a time,",
        "max_tokens": 512,
        "temperature": 0.5
    }'
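Because the server exposes an OpenAI-compatible API, it can also be queried from Python. A minimal sketch using the openai client, assuming the server started above is listening on localhost:8000 (the api_key value is a placeholder; vLLM does not require one by default):

# Query the local vLLM server via its OpenAI-compatible API (sketch).
from openai import OpenAI

client = OpenAI(base_url="http://localhost:8000/v1", api_key="EMPTY")

completion = client.completions.create(
    model="bigscience/bloomz",
    prompt="Once upon a time,",
    max_tokens=512,
    temperature=0.5,
)
print(completion.choices[0].text)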
Use Docker

docker model run hf.co/bigscience/bloomz
- SGLang
How to use bigscience/bloomz with SGLang:
Install from pip and serve the model:
# Install SGLang from pip:
pip install sglang

# Start the SGLang server:
python3 -m sglang.launch_server \
    --model-path "bigscience/bloomz" \
    --host 0.0.0.0 \
    --port 30000

# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:30000/v1/completions" \
    -H "Content-Type: application/json" \
    --data '{
        "model": "bigscience/bloomz",
        "prompt": "Once upon a time,",
        "max_tokens": 512,
        "temperature": 0.5
    }'
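The SGLang server exposes the same OpenAI-compatible completions endpoint, so a plain HTTP call works too. A minimal sketch with the requests library, assuming the server started above is listening on localhost:30000:

# Query the local SGLang server over HTTP (sketch; OpenAI-compatible endpoint).
import requests

response = requests.post(
    "http://localhost:30000/v1/completions",
    json={
        "model": "bigscience/bloomz",
        "prompt": "Once upon a time,",
        "max_tokens": 512,
        "temperature": 0.5,
    },
)
print(response.json()["choices"][0]["text"])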
Use Docker images

docker run --gpus all \
    --shm-size 32g \
    -p 30000:30000 \
    -v ~/.cache/huggingface:/root/.cache/huggingface \
    --env "HF_TOKEN=<secret>" \
    --ipc=host \
    lmsysorg/sglang:latest \
    python3 -m sglang.launch_server \
    --model-path "bigscience/bloomz" \
    --host 0.0.0.0 \
    --port 30000

# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:30000/v1/completions" \
    -H "Content-Type: application/json" \
    --data '{
        "model": "bigscience/bloomz",
        "prompt": "Once upon a time,",
        "max_tokens": 512,
        "temperature": 0.5
    }'

- Docker Model Runner
How to use bigscience/bloomz with Docker Model Runner:
docker model run hf.co/bigscience/bloomz
Fix architecture (#34)
opened by lewtun (HF Staff)
- config.json +2 -2
config.json
CHANGED
@@ -2,7 +2,7 @@
   "apply_residual_connection_post_layernorm": false,
   "attention_dropout": 0.0,
   "architectures": [
-    "
+    "BloomForCausalLM"
   ],
   "attention_softmax_in_fp32": true,
   "seq_length": 2048,
@@ -22,4 +22,4 @@
   "transformers_version": "4.21.0",
   "use_cache": true,
   "vocab_size": 250880
-}
+}
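For reference, the "architectures" field in config.json is what the Transformers Auto classes and the text-generation pipeline use to pick the model class, which is why this one-line fix matters. A minimal sketch to check the published config after the change (assumes Hub access; the expected value is the one added in this PR):

# Inspect the architectures field of the published config (sketch; needs Hub access).
from transformers import AutoConfig

config = AutoConfig.from_pretrained("bigscience/bloomz")
print(config.architectures)  # expected after this fix: ['BloomForCausalLM']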