"""
Knowledge Tracing inference with Qwen3-Next-80B-A3B-Instruct model.
This is the standard instruction-following model (no thinking blocks).
Recommended sampling: temperature=0.7, top_p=0.8, top_k=20, min_p=0
Usage:
    CUDA_VISIBLE_DEVICES=0,1,2,3 python qwen3next80bvllm_instruct.py \
        --data-dir foundationalktdataset/ \
        --num-gpus 4 \
        --batch-size 10 \
        --cache-dir /data1/ \
        --num-students 500 \
        --bin-size 50 \
        --min-history 50
"""
| from kt_inference_base import run_inference | |
# Settings for the Qwen3-Next-80B-A3B-Instruct run. This dict is passed
# unchanged to run_inference() when the file is executed as a script; how each
# key is consumed is defined in kt_inference_base, which is not visible here.
MODEL_CONFIG = {
    "model_id": "Qwen/Qwen3-Next-80B-A3B-Instruct",
    # Sampling values mirror the "Recommended sampling" line of the module
    # docstring (temperature=0.7, top_p=0.8, top_k=20, min_p=0).
    "gen_configs": {
        "temperature": 0.7,
        "top_p": 0.8,
        "top_k": 20,
        "min_p": 0.0,
        "max_tokens": 32768,
        # NOTE(review): 1.0 presumably means "no repetition penalty" in the
        # generation backend - confirm against the backend's documentation.
        "repetition_penalty": 1.0,
    },
    "output_prefix": "qwen3next80binstruct",
    "system_prompt_prefix": "",  # No prefix - standard instruct model
}
# Script entry point: start inference with this model's configuration only
# when the file is executed directly, so importing the module (e.g. to read
# MODEL_CONFIG) does not start a run.
if __name__ == "__main__":
    run_inference(MODEL_CONFIG)