From b68f75b09d82ea9b676fa8b8dd539fe2b8890abf Mon Sep 17 00:00:00 2001 From: songsenand Date: Sat, 14 Feb 2026 15:29:25 +0800 Subject: [PATCH] =?UTF-8?q?=E4=BF=AE=E5=A4=8D=20char=5Finfo.pinyin=20?= =?UTF-8?q?=E8=AE=BF=E9=97=AE=E6=96=B9=E5=BC=8F=EF=BC=8C=E4=BD=BF=E7=94=A8?= =?UTF-8?q?=E5=AD=97=E5=85=B8=E5=BD=A2=E5=BC=8F=E7=A1=AE=E4=BF=9D=E5=85=BC?= =?UTF-8?q?=E5=AE=B9=E6=80=A7?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- src/suinput/dataset.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/suinput/dataset.py b/src/suinput/dataset.py index 5833121..b7223d3 100644 --- a/src/suinput/dataset.py +++ b/src/suinput/dataset.py @@ -440,7 +440,7 @@ class PinyinInputDataset(IterableDataset): "char_id": torch.tensor([char_info["id"]]), "char": char, "freq": char_info["freq"], - "pg": torch.tensor([self.pg_groups[char_info.pinyin[0]]]), + "pg": torch.tensor([self.pg_groups[char_info["pinyin"][0]]]), } # 根据调整因子重复样本