随笔分类 - python工具之路
摘要:import numpy as np import json import codecs # 计算编辑距离 def edit_distance(word1, word2): len1 = len(word1) len2 = len(word2) dp = np.zeros((len1 + 1, len2 + 1)) for i in range(len1 + 1): dp[i][0] = i fo
阅读全文
摘要:import re import codecs operation_list = [] operation_list_sort = [] with codecs.open(r'C:\Users\Administrator.SC-201812211013\PycharmProjects\untitled29\
阅读全文
摘要:import re import jieba.analyse import codecs import pandas as pd def word_replace(xianbingshi,hospital1): """替换词表""" data = [] hospital = [] """去重""" with codecs.open(hospital1,'r...
阅读全文
摘要:import codecs import requests from bs4 import BeautifulSoup import re from lxml import etree url = 'https://jbk.jiankang.com/zhengzhuang/pinyin-z/?p=5' r = requests.get(url).text sym = re.findall(')'...
阅读全文
摘要:import codecs def word_replace(word): """替换词表""" word_list = [] """去重""" with codecs.open(word,'r','utf8') as f: for line in f: line = line.strip() if...
阅读全文
摘要:import re import jieba.analyse import codecs import pandas as pd def simplification_text(xianbingshi): """提取文本""" xianbingshi_simplification = [] with codecs.open(xianbingshi,'r','utf8')...
阅读全文
摘要:import re import codecs word_a = r'症状.txt' word_b = r'C:\Users\Administrator.SC-201812211013\PycharmProjects\词表工作代码\yiwoqu\TXT\disease_0903.txt' list_a = [] list_b = [] with codecs.open(word_a,'r','ut
阅读全文
摘要:import codecs file = r'C:\Users\Administrator.SC-201812211013\PycharmProjects\untitled29\yiwoqu\symptom1.txt' data = [] with codecs.open(file,'r','utf8') as f: for line in f: line = line.strip() line
阅读全文
摘要:import re import codecs def joint_list(xianbingshi,xianbingshi_sub,list_write): xianbingshi_list_x =[] xianbingshi_list_y =[] xianbingshi_list_xy = [] with codecs.open(xianbingshi,'r...
阅读全文
摘要:import codecs def word_replace(word): """替换词表""" word_list = [] """去重""" with codecs.open(word,'r','utf8') as f: for line in f: line = line.strip() if...
阅读全文


浙公网安备 33010602011771号