修复初始步骤损失计算逻辑
This commit is contained in:
parent
4560a9ed06
commit
17324ffa10
|
|
@@ -579,6 +579,8 @@ class MoEModel(nn.Module):
|
||||||
):
|
):
|
||||||
avg_loss = batch_loss_sum / eval_frequency
|
avg_loss = batch_loss_sum / eval_frequency
|
||||||
acc, eval_loss = self.model_eval(eval_dataloader, criterion)
|
acc, eval_loss = self.model_eval(eval_dataloader, criterion)
|
||||||
|
if global_step == 0:
|
||||||
|
avg_loss = eval_loss
|
||||||
super().train()
|
super().train()
|
||||||
if monitor is not None:
|
if monitor is not None:
|
||||||
monitor.add_step(
|
monitor.add_step(
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue