def just_number(string, resymbol=""):
    """Return *string* with every character other than ASCII 0-9 replaced.

    Args:
        string: Text to filter.
        resymbol: Replacement substituted for each removed character. The
            default empty string simply deletes them.

    Returns:
        The filtered text. Decimal points and signs are not digits, so
        ``"1.5"`` becomes ``"15"`` and ``"-3"`` becomes ``"3"``.
    """
    # Imported locally because no module-level ``import re`` is visible here.
    import re

    # The capture group is kept so a ``resymbol`` that refers to group 1
    # keeps working exactly as before.
    return re.sub(r"([^0-9])", resymbol, string)
def filter_dict(words, numbers):
    """Map each word to the reciprocal of the number paired with it.

    Args:
        words: Iterable of dictionary keys.
        numbers: Iterable of strings paired positionally with ``words``.
            Each one is reduced to its digits by ``just_number`` before
            being converted to ``float``.

    Returns:
        dict of ``word -> 1 / number``. Pairs whose number field contains
        no digits or evaluates to zero are skipped. When a word occurs more
        than once, the last valid pair wins.
    """
    word_dict = {}
    for word, num in zip(words, numbers):
        try:
            weight = 1 / float(just_number(num))
        except (TypeError, ValueError, ZeroDivisionError):
            # Non-text field, no digits at all, or a zero count: there is no
            # usable weight, so skip the pair instead of storing a stale or
            # undefined value.
            continue
        word_dict[word] = weight
    return word_dict
def location_dict(dir_path):
    """Build a ``word -> weight`` dictionary from the files in *dir_path*.

    Every directory entry is read as a tab-separated table. The first column
    supplies the words and the second column the number strings, which are
    passed together to ``filter_dict``.

    Args:
        dir_path: Directory whose entries are loaded.

    Returns:
        The dictionary produced by ``filter_dict`` for all collected rows.

    Raises:
        OSError: If ``dir_path`` itself cannot be listed.
    """
    # Imported locally because no module-level imports are visible here.
    import os

    import numpy as np

    words, numbers = [], []
    for path in os.listdir(dir_path):
        # os.path.join supplies the separator when dir_path lacks a trailing one.
        file_path = os.path.join(dir_path, path)
        try:
            # ndmin=2 keeps a one-line file as a single row instead of a
            # flat 1-D array.
            rows = np.loadtxt(
                file_path, delimiter='\t', dtype=str, ndmin=2
            ).tolist()
            print("ok:", path)
        except Exception as error:
            print("error:", path, error)
            # Fall back to a plain line-by-line split, which tolerates rows
            # with differing column counts.
            try:
                with open(file_path, 'r') as handle:
                    rows = [line.rstrip("\n").split("\t") for line in handle]
            except (OSError, UnicodeError) as fallback_error:
                # Unreadable entry (e.g. a sub-directory): report and move on
                # rather than reusing data from a previous file.
                print("error:", path, fallback_error)
                continue
        for row in rows:
            # Only rows that actually have a word and a number column count.
            if len(row) >= 2:
                words.append(row[0])
                numbers.append(row[1])
    return filter_dict(words, numbers)
# Directory containing the tab-separated dictionary files; fill in before running.
dir_path = ""

if __name__ == "__main__":
    # Run the loader only when executed as a script, so importing this module
    # does not list directories or read files as a side effect.
    location_dict(dir_path)
# Load the local dictionary.
# Latest recommended article published on 2022-02-16 15:54:17.