""" Knowledge Tracing inference with Qwen3-Next-80B-A3B-Instruct model. This is the standard instruction-following model (no thinking blocks). Recommended sampling: temperature=0.7, top_p=0.8, top_k=20, min_p=0 Usage: CUDA_VISIBLE_DEVICES=0,1,2,3 python qwen3next80bvllm_instruct.py \ --data-dir foundationalktdataset/ \ --num-gpus 4 \ --batch-size 10 \ --cache-dir /data1/ \ --num-students 500 \ --bin-size 50 \ --min-history 50 """ from kt_inference_base import run_inference MODEL_CONFIG = { "model_id": "Qwen/Qwen3-Next-80B-A3B-Instruct", "gen_configs": { "temperature": 0.7, "top_p": 0.8, "top_k": 20, "min_p": 0.0, "max_tokens": 32768, "repetition_penalty": 1.0, }, "output_prefix": "qwen3next80binstruct", "system_prompt_prefix": "", # No prefix - standard instruct model } if __name__ == "__main__": run_inference(MODEL_CONFIG)