cafe3310 committed on
Commit
a074dc6
·
1 Parent(s): cb25b17

fix: 推理前将输入张量移动到模型设备

Browse files
Files changed (1) hide show
  1. comp.py +2 -2
comp.py CHANGED
@@ -46,8 +46,8 @@ def completion_node(state: GraphState) -> dict:
46
  prompt += "Assistant:"
47
 
48
  # --- 模型调用 ---
49
- # 使用 device_map="auto" 时,我们无需手动将张量移动到特定设备
50
- input_ids = tokenizer(prompt, return_tensors="pt").input_ids
51
  output_ids = model.generate(
52
  input_ids,
53
  max_new_tokens=512, # 暂时硬编码
 
46
  prompt += "Assistant:"
47
 
48
  # --- 模型调用 ---
49
+ # 虽然模型设备是自动映射的,但输入张量仍需显式移动到模型所在的设备
50
+ input_ids = tokenizer(prompt, return_tensors="pt").input_ids.to(model.device)
51
  output_ids = model.generate(
52
  input_ids,
53
  max_new_tokens=512, # 暂时硬编码