From a928d9c12892fce8422448a132a106a2c0def4f9 Mon Sep 17 00:00:00 2001 From: Arthur <48595927+ArthurZucker@users.noreply.github.com> Date: Thu, 5 Dec 2024 21:07:46 +0530 Subject: [PATCH] [`trainer`] fix the GA `model_accepts_loss_kwargs` (#34915) * fix * style * values * fix --- src/transformers/trainer.py | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/src/transformers/trainer.py b/src/transformers/trainer.py index 13d9d45f19a..af908e48e4b 100755 --- a/src/transformers/trainer.py +++ b/src/transformers/trainer.py @@ -623,9 +623,7 @@ def __init__( else unwrapped_model.get_base_model().forward ) forward_params = inspect.signature(model_forward).parameters - self.model_accepts_loss_kwargs = ( - "loss_kwargs" in forward_params and forward_params["loss_kwargs"].kind == inspect.Parameter.VAR_KEYWORD - ) + self.model_accepts_loss_kwargs = any(k.kind == inspect.Parameter.VAR_KEYWORD for k in forward_params.values()) self.neftune_noise_alpha = args.neftune_noise_alpha @@ -3651,7 +3649,10 @@ def training_step( return loss_mb.reduce_mean().detach().to(self.args.device) with self.compute_loss_context_manager(): - loss = self.compute_loss(model, inputs, num_items_in_batch=num_items_in_batch) + if self.model_accepts_loss_kwargs: + loss = self.compute_loss(model, inputs) + else: + loss = self.compute_loss(model, inputs, num_items_in_batch=num_items_in_batch) del inputs if (