pnevskaiaan commited on
Commit
e26ddf8
·
verified ·
1 Parent(s): 98e8a7f

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +60 -3
README.md CHANGED
@@ -1,3 +1,60 @@
1
- ---
2
- license: apache-2.0
3
- ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ ---
4
+
5
+ import torch
6
+ from transformers import AutoConfig, AutoModelForCausalLM, AutoTokenizer
7
+ import os
8
+
9
+ # Create a tiny config for testing
10
+ from transformers.models.hunyuan_v1_dense.configuration_hunyuan_v1_dense import HunYuanDenseV1Config
11
+
12
+ tiny_config = HunYuanDenseV1Config(
13
+ vocab_size=300,
14
+ hidden_size=64,
15
+ intermediate_size=128,
16
+ num_hidden_layers=2,
17
+ num_attention_heads=4,
18
+ head_dim=16,
19
+ num_key_value_heads=2,
20
+ hidden_act="silu",
21
+ max_position_embeddings=128,
22
+ rms_norm_eps=1e-05,
23
+ use_cache=True,
24
+ tie_word_embeddings=False,
25
+ rope_theta=10000.0,
26
+ attention_bias=False,
27
+ attention_dropout=0.0,
28
+ use_qk_norm=True,
29
+ bos_token_id=1,
30
+ eos_token_id=2,
31
+ pad_token_id=0,
32
+ )
33
+
34
+ print("Config created:", tiny_config.model_type)
35
+
36
+ # Create model from config
37
+ model = AutoModelForCausalLM.from_config(tiny_config)
38
+ model.eval()
39
+ print("Model created, params:", sum(p.numel() for p in model.parameters()))
40
+
41
+ # Save model
42
+ save_dir = "/home/panas/git/optimum-intel/tiny-random-hunyuan-v1-dense"
43
+ model.save_pretrained(save_dir)
44
+ tiny_config.save_pretrained(save_dir)
45
+
46
+ # Create a simple tokenizer config for testing
47
+ from transformers import PreTrainedTokenizerFast
48
+ tokenizer = PreTrainedTokenizerFast(
49
+ tokenizer_object=None,
50
+ bos_token="<s>",
51
+ eos_token="</s>",
52
+ unk_token="<unk>",
53
+ pad_token="<pad>",
54
+ )
55
+ # Just save a minimal tokenizer
56
+ # Actually, for tests, we can use the AutoTokenizer approach or skip tokenizer
57
+
58
+ print(f"Saved tiny model to {save_dir}")
59
+ print("Files:", os.listdir(save_dir))
60
+