wlabchoi
/

training-scripts

wlabchoi committed on Dec 11, 2025

Commit

80fd90a

verified ·

1 Parent(s): dc45fe9

Upload train_qwen3_distillation.py with huggingface_hub

Files changed (1) hide show

train_qwen3_distillation.py CHANGED Viewed

@@ -191,7 +191,7 @@ class MiniLLMTrainer(Trainer):
             teacher_logits = teacher_outputs.logits
             # Teacher token sampling (key part of MiniLLM)
-            if self.use_teacher_sampling and self.training:
                 # Sample from teacher's softmax distribution
                 teacher_probs = F.softmax(teacher_logits / self.temperature, dim=-1)
                 # Sample tokens: [batch, seq_len]

             teacher_logits = teacher_outputs.logits
             # Teacher token sampling (key part of MiniLLM)
+            if self.use_teacher_sampling and model.training:
                 # Sample from teacher's softmax distribution
                 teacher_probs = F.softmax(teacher_logits / self.temperature, dim=-1)
                 # Sample tokens: [batch, seq_len]