pnevskaiaan committed on
Commit
d60719c
·
verified ·
1 Parent(s): 58d21f9

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +39 -3
README.md CHANGED
@@ -1,3 +1,39 @@
1
- ---
2
- license: apache-2.0
3
- ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ ---
4
+
5
+ ```python
6
+ import os
7
+ from transformers import (
8
+ AutoConfig,
9
+ AutoModelForImageTextToText,
10
+ AutoProcessor,
11
+ AutoTokenizer,
12
+ )
13
+
14
+ model_id = "mistralai/Mistral-Small-3.1-24B-Instruct-2503"
15
+ config = AutoConfig.from_pretrained(model_id)
16
+
17
+ config.text_config.num_hidden_layers = 2
18
+ config.text_config.hidden_size = 8
19
+ config.text_config.intermediate_size = 64
20
+ config.text_config.num_attention_heads = 8
21
+ config.text_config.num_key_value_heads = 4
22
+ config.text_config.head_dim = 32
23
+
24
+ config.vision_config.num_hidden_layers = 2
25
+ config.vision_config.hidden_size = 128
26
+ config.vision_config.intermediate_size = 64
27
+ config.vision_config.num_attention_heads = 4
28
+ config.vision_config.head_dim = 32
29
+
30
+ model = AutoModelForImageTextToText.from_config(config)
31
+ tokenizer = AutoTokenizer.from_pretrained(model_id)
32
+ processor = AutoProcessor.from_pretrained(model_id)
33
+
34
+ output_dir = "./tiny-random-mistral3"
35
+ os.makedirs(output_dir, exist_ok=True)
36
+ model.save_pretrained(output_dir)
37
+ tokenizer.save_pretrained(output_dir)
38
+ processor.save_pretrained(output_dir)
39
+ ```