From b0a4ce9ac816e24935a73065baa9d100e5df99fe Mon Sep 17 00:00:00 2001 From: songsenand Date: Thu, 26 Feb 2026 01:00:16 +0800 Subject: [PATCH] =?UTF-8?q?fix(model):=20=E4=BF=AE=E6=AD=A3=E8=AF=84?= =?UTF-8?q?=E4=BC=B0=E6=8D=9F=E5=A4=B1=E8=AE=A1=E7=AE=97=E4=BB=A5=E9=81=BF?= =?UTF-8?q?=E5=85=8D=E9=99=A4=E9=9B=B6=E9=94=99=E8=AF=AF?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- src/trainer/model.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/trainer/model.py b/src/trainer/model.py index 49fb424..b48ad4c 100644 --- a/src/trainer/model.py +++ b/src/trainer/model.py @@ -517,7 +517,7 @@ class MoEModel(nn.Module): if monitor: # 使用 eval_loss 作为监控指标 monitor.add_step( - global_step, {"loss": batch_loss_sum, "acc": acc} + global_step, {"loss": batch_loss_sum / (eval_frequency if global_step > 0 else 1), "acc": acc} ) logger.info( f"step: {global_step}, eval_loss: {eval_loss:.4f}, acc: {acc:.4f}, 'batch_loss_sum': {batch_loss_sum / (eval_frequency if global_step > 0 else 1):.4f}, current_lr: {current_lr}"