From fa9a6cdb1eade68c258eed7297f5a8a8a5329ac6 Mon Sep 17 00:00:00 2001
From: Flute <41096447+fluteink@users.noreply.github.com>
Date: Wed, 1 Oct 2025 14:44:28 +0800
Subject: [PATCH] 更新文档和运行脚本,修复文档拼写错误 (#2688)
---
runtime/tools/fst/generate_lexicon.py | 16 ++++++++--------
1 files changed, 8 insertions(+), 8 deletions(-)
diff --git a/runtime/tools/fst/generate_lexicon.py b/runtime/tools/fst/generate_lexicon.py
index a5a47ec..f8c7443 100755
--- a/runtime/tools/fst/generate_lexicon.py
+++ b/runtime/tools/fst/generate_lexicon.py
@@ -8,18 +8,19 @@
# sys.argv[3]: lexicon file for corpus.dict
lex_dict = {}
-with open(sys.argv[2], 'r', encoding='utf8') as fin:
+with open(sys.argv[2], "r", encoding="utf8") as fin:
for line in fin:
- words = line.strip().split('\t')
+ words = line.strip().split("\t")
if len(words) != 2:
continue
lex_dict[words[0]] = words[1]
-with open(sys.argv[1], 'r', encoding='utf8') as fin, \
- open(sys.argv[3], 'w', encoding='utf8') as fout:
+with open(sys.argv[1], "r", encoding="utf8") as fin, open(
+ sys.argv[3], "w", encoding="utf8"
+) as fout:
for line in fin:
word = line.strip()
- if word == '<s>' or word == '</s>':
+ if word == "<s>" or word == "</s>":
continue
word_lex = ""
if word in lex_dict:
@@ -29,7 +30,6 @@
if word[i] in lex_dict:
word_lex += " " + lex_dict[word[i]]
else:
- word_lex += " <unk>"
-
- fout.write('{}\t{}\n'.format(word, word_lex.strip()))
+ word_lex += " <unk>"
+ fout.write("{}\t{}\n".format(word, word_lex.strip()))
--
Gitblit v1.9.1