preductor committed on
Commit
ef89f0a
·
verified ·
1 Parent(s): 25dd07c

Upload README.md with huggingface_hub

Browse files
Files changed (1) hide show
  1. README.md +17 -3
README.md CHANGED
@@ -1,6 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ## Description
2
 
3
- **MetalGPT-1** is a model built upon the Qwen3-32b and incorporates both continual pre-training and supervised fine-tuning.
4
 
5
  ---
6
 
@@ -43,7 +57,7 @@ model_inputs = tokenizer([text], return_tensors="pt").to(model.device)
43
 
44
  generated_ids = model.generate(
45
  **model_inputs,
46
- max_new_tokens=1024,
47
  )
48
 
49
  # Обрезаем префикс промпта
@@ -132,7 +146,7 @@ sampling_params = SamplingParams(
132
  repetition_penalty=1.05,
133
  top_p=0.8,
134
  top_k=70,
135
- max_tokens=512,
136
  )
137
 
138
  prompt = (
 
1
+ ---
2
+ pipeline_tag: text-generation
3
+ library_name: transformers
4
+ tags:
5
+ - mining
6
+ - russian
7
+ license: apache-2.0
8
+ datasets:
9
+ - nn-tech/Alloy-Bench
10
+ language:
11
+ - ru
12
+ base_model: Qwen/Qwen3-32B
13
+ ---
14
+
15
  ## Description
16
 
17
+ **MetalGPT-1** is a model built upon the Qwen/Qwen3-32B base model and incorporates both continual pre-training and supervised fine-tuning.
18
 
19
  ---
20
 
 
57
 
58
  generated_ids = model.generate(
59
  **model_inputs,
60
+ max_new_tokens=2048,
61
  )
62
 
63
  # Обрезаем префикс промпта
 
146
  repetition_penalty=1.05,
147
  top_p=0.8,
148
  top_k=70,
149
+ max_tokens=2048,
150
  )
151
 
152
  prompt = (