| | |
| | | |
| | | |
def isChinese(ch: str) -> bool:
    """Return True if *ch* is a CJK Unified Ideograph or an ASCII digit.

    Accepted ranges:
      * U+4E00..U+9FFF -- the basic CJK Unified Ideographs block
      * U+0030..U+0039 -- the ASCII digits '0'..'9'

    The check is a plain string comparison, which Python evaluates
    lexicographically, so callers should pass a single character; an empty
    string yields False.
    """
    # The earlier CJK-only condition is subsumed by this combined test, so
    # only the widened (CJK or digit) check is kept.
    return '\u4e00' <= ch <= '\u9fff' or '\u0030' <= ch <= '\u0039'
| | | |
| | | |
| | | def isAllChinese(word: Union[List[Any], str]): |
| | | word_lists = [] |
| | | table = str.maketrans('', '', string.punctuation) |
| | | for i in word: |
| | | cur = i.translate(table) |
| | | cur = cur.replace(' ', '') |
| | | cur = i.replace(' ', '') |
| | | cur = cur.replace('</s>', '') |
| | | cur = cur.replace('<s>', '') |
| | | word_lists.append(cur) |
| | |
| | | |
| | | def isAllAlpha(word: Union[List[Any], str]): |
| | | word_lists = [] |
| | | table = str.maketrans('', '', string.punctuation) |
| | | for i in word: |
| | | cur = i.translate(table) |
| | | cur = cur.replace(' ', '') |
| | | cur = i.replace(' ', '') |
| | | cur = cur.replace('</s>', '') |
| | | cur = cur.replace('<s>', '') |
| | | word_lists.append(cur) |
| | |
| | | return False |
| | | |
| | | for ch in word_lists: |
| | | if ch.isalpha() is False: |
| | | if ch.isalpha() is False and ch != "'": |
| | | return False |
| | | elif ch.isalpha() is True and isChinese(ch) is True: |
| | | return False |