hell0ks's picture
Upload folder using huggingface_hub
1ff9e4b verified
# Model Configuration
model:
name: "MiniMaxAI/MiniMax-M2.1" # Target model to modify
output_path: "./output" # Path to save the modified model
dtype: "bfloat16" # Data type for model weights (e.g. "bfloat16")
# Analysis Configuration
analysis:
method: "ngram" # Token analysis method (e.g., "ngram")
window_size: 4 # Size of the n-gram window (e.g. 2 for bigrams)
sample_size: 1000 # Number of samples per token for analysis
ngram_weights: [0.5, 0.3, 0.2] # Use the first weight for window_size 2, fisrt two for 3, all three for 4.
# Weight Smoothing Configuration
adjustment:
min_scale: 0.9 # Minimum scaling factor for target token weights (0.0–1.0)
smoothness: 3.0 # Smoothing intensity (>1). Higher = more aggressive down-weighting
# Target Unicode Ranges
unicode_targets:
- name: CJK Unified Ideographs
range: [0x4E00, 0x9FFF]
- name: CJK Unified Ideographs Extension A
range: [0x3400, 0x4DBF]
- name: CJK Unified Ideographs Extension B
range: [0x20000, 0x2A6DF]
- name: CJK Compatibility Ideographs
range: [0xF900, 0xFAFF]
- name: CJK Radicals Supplement
range: [0x2E80, 0x2EFF]
- name: Kangxi Radicals
range: [0x2F00, 0x2FDF]
- name: Ideographic Description Characters
range: [0x2FF0, 0x2FFF]
- name: CJK Symbols and Punctuation
range: [0x3000, 0x303F]
- name: CJK Strokes
range: [0x31C0, 0x31EF]
- name: Enclosed CJK Letters and Months
range: [0x3200, 0x32FF]
- name: CJK Compatibility
range: [0x3300, 0x33FF]