# File size: 249 Bytes
# Revision (presumably a commit hash from the file viewer): 8730f5f
---
# Run configuration for "micro-llama-3b".
# NOTE(review): the per-key descriptions below are inferred from the key
# names only; confirm them against the code that loads this file.

# Run title and model name; both currently carry the same value.
run-title: micro-llama-3b
model: micro-llama-3b

# Presumably Hugging Face Hub repo IDs.
# NOTE(review): the tokenizer is taken from the "-Instruct" repo while the
# base model is the non-instruct checkpoint; confirm this is intentional.
base-model: meta-llama/Llama-3.2-3B
tokenizer: meta-llama/Llama-3.2-3B-Instruct
# Presumably mixture-of-experts routing settings (expert count, experts
# selected per token, router jitter); verify against the consumer.
num-experts: 4
top-k-experts: 1
jitter-noise: 0
# Booleans are written in canonical lowercase so every YAML 1.1/1.2 loader
# reads them as booleans.
use-router: true
mask-input: true
# Presumably the maximum sequence length in tokens; TODO confirm.
max-length: 8192

# Names of the components to train (a single entry: "model").
trainable:
  - model