---
# mergekit configuration: passthrough merge built from a single source model.
# One slice is defined, taking layer_range [0, 12] of
# Qwen/Qwen2.5-7B-Instruct-1M; the tokenizer comes from the same model and
# the output dtype is float16.
#
# NOTE(review): this config was recovered from a table-formatted copy in which
# every line carried `|` cell delimiters, all indentation was lost, and the
# whole document appeared twice. The nesting below follows the usual mergekit
# layout (slices -> sources -> model/layer_range, with tokenizer_source and
# dtype at top level) - confirm against the original config.
base_model: Qwen/Qwen2.5-7B-Instruct-1M
merge_method: passthrough

slices:
  - sources:
      - model: Qwen/Qwen2.5-7B-Instruct-1M
        layer_range: [0, 12]  # Base model layers

tokenizer_source: Qwen/Qwen2.5-7B-Instruct-1M
dtype: float16