FoundationalASSIST / Code /qwen3next80bvllm_instruct.py

Upload folder using huggingface_hub

6256eb9 verified about 1 month ago

974 Bytes

	"""
	Knowledge Tracing inference with Qwen3-Next-80B-A3B-Instruct model.

	This is the standard instruction-following model (no thinking blocks).
	Recommended sampling: temperature=0.7, top_p=0.8, top_k=20, min_p=0

	Usage:
	    CUDA_VISIBLE_DEVICES=0,1,2,3 python qwen3next80bvllm_instruct.py \
	        --data-dir foundationalktdataset/ \
	        --num-gpus 4 \
	        --batch-size 10 \
	        --cache-dir /data1/ \
	        --num-students 500 \
	        --bin-size 50 \
	        --min-history 50
	"""

	from kt_inference_base import run_inference

	# Settings handed to run_inference() for the Qwen3-Next-80B-A3B-Instruct run.
	# NOTE(review): how each key is consumed is decided in kt_inference_base,
	# which is not visible from this file - confirm there before renaming keys.
	MODEL_CONFIG = {
	    "model_id": "Qwen/Qwen3-Next-80B-A3B-Instruct",
	    # The four sampling values below mirror the "Recommended sampling" line
	    # in the module docstring.
	    "gen_configs": {
	        "temperature": 0.7,
	        "top_p": 0.8,
	        "top_k": 20,
	        "min_p": 0.0,
	        "max_tokens": 32768,
	        "repetition_penalty": 1.0,
	    },
	    "output_prefix": "qwen3next80binstruct",
	    # Standard instruct model, so the system prompt prefix is left empty.
	    "system_prompt_prefix": "",
	}

	# Script entry point: start inference with this file's MODEL_CONFIG only when
	# the module is executed directly, so importing it has no side effects.
	if __name__ == "__main__":
	    run_inference(MODEL_CONFIG)