diff --git a/src/axolotl/integrations/kd/kernels/liger.py b/src/axolotl/integrations/kd/kernels/liger.py index 75fe718f6..787740bcf 100644 --- a/src/axolotl/integrations/kd/kernels/liger.py +++ b/src/axolotl/integrations/kd/kernels/liger.py @@ -125,7 +125,6 @@ class LigerFusedLinearKLTopKLogprobFunction(LigerFusedLinearDistillationBase): target_token_ids_chunk, target_logprobs_chunk, target_mask_chunk, - temperature=temperature, ) loss = weight_hard_loss * ce_loss + weight_soft_loss * soft_loss