Spaces:
Sleeping
Sleeping
| # Copyright (c) 2024 Amphion. | |
| # | |
| # This source code is licensed under the MIT license found in the | |
| # LICENSE file in the root directory of this source tree. | |
| import os | |
| def generate_poly_lexicon(file_path: str): | |
| """Generate poly char lexicon for Mandarin Chinese.""" | |
| poly_dict = {} | |
| with open(file_path, "r", encoding="utf-8") as readf: | |
| txt_list = readf.readlines() | |
| for txt in txt_list: | |
| word = txt.strip("\n") | |
| if word not in poly_dict: | |
| poly_dict[word] = 1 | |
| readf.close() | |
| return poly_dict | |