diff --git a/src/trainer/model.py b/src/trainer/model.py index cabfb6a..fcffcca 100644 --- a/src/trainer/model.py +++ b/src/trainer/model.py @@ -181,9 +181,9 @@ class MoEModel(nn.Module): # ----- 2. Transformer Encoder ----- # padding mask: True 表示忽略该位置 # padding_mask = attention_mask == 0 - # encoded = self.encoder( - # embeddings, src_key_padding_mask=padding_mask - # ) # [B, S, H] + encoded = self.encoder( + embeddings #, src_key_padding_mask=padding_mask + ) # [B, S, H] # ----- 3. 池化量 ----- # for block in self.shared_resblocks: