From 69238701715c720ad8f25b5107b76bf1a45cff93 Mon Sep 17 00:00:00 2001 From: songsenand Date: Fri, 13 Feb 2026 14:15:25 +0800 Subject: [PATCH] =?UTF-8?q?=E4=BF=AE=E5=A4=8D=E8=BE=93=E5=87=BA=E7=BB=B4?= =?UTF-8?q?=E5=BA=A6=E8=AE=A1=E7=AE=97=E9=94=99=E8=AF=AF=EF=BC=8C=E4=BD=BF?= =?UTF-8?q?=E7=94=A8=20d=5Fmodel=20=E4=BB=A3=E6=9B=BF=20input=5Fdim?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- src/trainer/model.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/trainer/model.py b/src/trainer/model.py index 9f7b64e..cb3e8cf 100644 --- a/src/trainer/model.py +++ b/src/trainer/model.py @@ -59,7 +59,7 @@ class Expert(nn.Module): super().__init__() self.input_dim = input_dim self.d_model = d_model - self.output_dim = input_dim * output_multiplier + self.output_dim = d_model * output_multiplier # 输入映射:input_dim -> d_model self.linear_in = nn.Linear(input_dim, d_model)