调整学习率切换的批次阈值(processed_batches:1000 → 8000),并将日志中的 acc 输出统一为四位小数
This commit is contained in:
parent
02f851205f
commit
335540d8c2
|
|
@ -399,7 +399,7 @@ class MoEModel(nn.Module):
|
||||||
|
|
||||||
# ---------- 学习率调度(仅当使用默认优化器且未传入自定义调度函数时)----------
|
# ---------- 学习率调度(仅当使用默认优化器且未传入自定义调度函数时)----------
|
||||||
if created_optimizer and lr_schedule is None:
|
if created_optimizer and lr_schedule is None:
|
||||||
if processed_batches <= 1000:
|
if processed_batches <= 8000:
|
||||||
new_lr = 1e-4
|
new_lr = 1e-4
|
||||||
else:
|
else:
|
||||||
new_lr = 6e-6
|
new_lr = 6e-6
|
||||||
|
|
@ -451,7 +451,7 @@ class MoEModel(nn.Module):
|
||||||
{"loss": avg_loss, "acc": acc},
|
{"loss": avg_loss, "acc": acc},
|
||||||
)
|
)
|
||||||
logger.info(
|
logger.info(
|
||||||
f"step: {global_step}, loss: {avg_loss:.4f}, acc: {acc}"
|
f"step: {global_step}, loss: {avg_loss:.4f}, acc: {acc:.4f}"
|
||||||
)
|
)
|
||||||
batch_loss_sum = 0.0
|
batch_loss_sum = 0.0
|
||||||
|
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue