Update README.md
Browse files
README.md
CHANGED
|
@@ -10,8 +10,6 @@ Here is a code to create this tiny model:
|
|
| 10 |
import os
|
| 11 |
import torch
|
| 12 |
|
| 13 |
-
torch.set_default_dtype(torch.bfloat16)
|
| 14 |
-
|
| 15 |
from transformers import AutoTokenizer, AutoConfig, Lfm2MoeForCausalLM
|
| 16 |
|
| 17 |
# # === Step 1: Define tiny model config ===
|
|
@@ -29,6 +27,7 @@ config.num_key_value_heads = 4
|
|
| 29 |
config.hidden_size = 16
|
| 30 |
config.num_dense_layers = 1
|
| 31 |
config.moe_intermediate_size = 16
|
|
|
|
| 32 |
|
| 33 |
# === Step 2: Create model from config ===
|
| 34 |
model = Lfm2MoeForCausalLM(config)
|
|
|
|
| 10 |
import os
|
| 11 |
import torch
|
| 12 |
|
|
|
|
|
|
|
| 13 |
from transformers import AutoTokenizer, AutoConfig, Lfm2MoeForCausalLM
|
| 14 |
|
| 15 |
# # === Step 1: Define tiny model config ===
|
|
|
|
| 27 |
config.hidden_size = 16
|
| 28 |
config.num_dense_layers = 1
|
| 29 |
config.moe_intermediate_size = 16
|
| 30 |
+
config.intermediate_size = 16
|
| 31 |
|
| 32 |
# === Step 2: Create model from config ===
|
| 33 |
model = Lfm2MoeForCausalLM(config)
|