From 12e1849c6ddc228d6f62dedc7f95c22038498236 Mon Sep 17 00:00:00 2001
From: chenmengzheAAA <123789350+chenmengzheAAA@users.noreply.github.com>
Date: Tue, 06 Jun 2023 19:16:36 +0800
Subject: [PATCH] fix eng word space (#598)

---
 funasr/datasets/small_datasets/preprocessor.py |    2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/funasr/datasets/small_datasets/preprocessor.py b/funasr/datasets/small_datasets/preprocessor.py
index 7ec6929..d80f48a 100644
--- a/funasr/datasets/small_datasets/preprocessor.py
+++ b/funasr/datasets/small_datasets/preprocessor.py
@@ -828,7 +828,7 @@
             token_type=args.token_type,
             token_list=args.token_list,
             bpemodel=args.bpemodel,
-            non_linguistic_symbols=args.non_linguistic_symbols,
+            non_linguistic_symbols=args.non_linguistic_symbols if hasattr(args, "non_linguistic_symbols") else None,
             text_cleaner=args.cleaner,
             g2p_type=args.g2p,
             split_with_space=args.split_with_space if hasattr(args, "split_with_space") else False,

--
Gitblit v1.9.1