From 5061cbe8738a258a5ffcedc1c72ba3d16dd28933 Mon Sep 17 00:00:00 2001 From: songsenand Date: Thu, 2 Apr 2026 21:31:40 +0800 Subject: [PATCH] =?UTF-8?q?=E4=BF=AE=E5=A4=8D=20README=20=E4=B8=AD?= =?UTF-8?q?=E5=AD=A6=E4=B9=A0=E7=8E=87=E9=85=8D=E7=BD=AE=E6=B3=A8=E9=87=8A?= =?UTF-8?q?=E6=A0=BC=E5=BC=8F=E9=97=AE=E9=A2=98=E5=B9=B6=E6=9B=B4=E6=96=B0?= =?UTF-8?q?=E8=AF=B4=E6=98=8E?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .README.md.kate-swp | Bin 118 -> 0 bytes README.md | 6 +----- 2 files changed, 1 insertion(+), 5 deletions(-) delete mode 100644 .README.md.kate-swp diff --git a/.README.md.kate-swp b/.README.md.kate-swp deleted file mode 100644 index d61619f614720467706cd864fd513e1dc6b247b7..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 118 zcmZQzU=Z?7EJ;-eE>A2_aLdd|RWQ;sU|?Vn>Dl{b>9jo$QWs{#h4TJ3R4^3|QVk9Q s$|M0X2-t!+2_O~_Foyz(WDt=AA`)GLK~w^SigyKTj01`&0|-ivR!s diff --git a/README.md b/README.md index 99c26c0..8549d90 100644 --- a/README.md +++ b/README.md @@ -92,8 +92,4 @@ - 注意力头数:4 - 专家数量:20 - 束宽:5 -- 学习率:待调(建议 1e-4 ~ 5e-4,带warmup) - ---- - -此方案结构完整,模块间接口清晰,可立即进入原型实现阶段。建议先在小规模数据上验证前向与训练流程,再逐步扩展至全量数据调优。 +- 学习率:待调(建议 1e-4 ~ 5e-4,带warmup)