From db90516fcf6a12678a7f54f20f5dc8e8bd777c03 Mon Sep 17 00:00:00 2001 From: songsenand Date: Tue, 24 Feb 2026 01:05:57 +0800 Subject: [PATCH] =?UTF-8?q?fix(encoder):=20=E4=BF=AE=E5=A4=8D=20encoder=20?= =?UTF-8?q?=E8=B0=83=E7=94=A8=E6=97=B6=E7=BC=BA=E5=B0=91=20src=5Fkey=5Fpad?= =?UTF-8?q?ding=5Fmask=20=E5=8F=82=E6=95=B0?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- src/trainer/model.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/trainer/model.py b/src/trainer/model.py index 660d74f..07c301c 100644 --- a/src/trainer/model.py +++ b/src/trainer/model.py @@ -180,9 +180,9 @@ class MoEModel(nn.Module): # ----- 2. Transformer Encoder ----- # padding mask: True 表示忽略该位置 - # padding_mask = attention_mask == 0 + padding_mask = attention_mask == 0 encoded = self.encoder( - embeddings #, src_key_padding_mask=padding_mask + embeddings , src_key_padding_mask=padding_mask ) # [B, S, H] # ----- 3. 池化量 -----