diff --git a/text/cleaners.py b/text/cleaners.py index eb9db06..2524e20 100644 --- a/text/cleaners.py +++ b/text/cleaners.py @@ -12,7 +12,7 @@ the symbols in symbols.py to match your data). ''' -import re +import os, sys, re from unidecode import unidecode import pyopenjtalk from jamo import h2j, j2hcj @@ -21,6 +21,8 @@ import logging logging.getLogger('jieba').setLevel(logging.WARNING) +jieba.set_dictionary(os.path.join(os.path.dirname(os.path.abspath(sys.argv[0])), 'jieba', 'dict.txt')) +jieba.initialize() # This is a list of Korean classifiers preceded by pure Korean numerals.