调整学习率阈值并优化日志输出精度

This commit is contained in:
songsenand 2026-02-13 12:12:12 +08:00
parent 02f851205f
commit 335540d8c2
1 changed file with 2 additions and 2 deletions

View File

@@ -399,7 +399,7 @@ class MoEModel(nn.Module):
# ---------- 学习率调度(仅当使用默认优化器且未传入自定义调度函数时)----------
if created_optimizer and lr_schedule is None:
- if processed_batches <= 1000:
+ if processed_batches <= 8000:
new_lr = 1e-4
else:
new_lr = 6e-6
@@ -451,7 +451,7 @@ class MoEModel(nn.Module):
{"loss": avg_loss, "acc": acc},
)
logger.info(
- f"step: {global_step}, loss: {avg_loss:.4f}, acc: {acc}"
+ f"step: {global_step}, loss: {avg_loss:.4f}, acc: {acc:.4f}"
)
batch_loss_sum = 0.0