'''
1.读取本地网页
2.匹配页面中的中文
3.转换为繁体
'''
import re
from Fan_Jian.langconv import *
import Fan_Jian.zh_wiki
import multiprocessing
import os


class Fan_jian_change(object):
    """Convert locally saved web pages from Simplified to Traditional Chinese.

    Pages are read from a source directory, converted with
    ``Converter('zh-hant')`` and appended to numbered ``.txt`` files in an
    output directory.
    """

    def read_local_web(self, dir_name='../file'):
        """Read every regular file in ``dir_name`` as UTF-8 text.

        Args:
            dir_name: Directory holding the saved page sources. Defaults to
                the location the script has always used.

        Returns:
            A list with one string per file (the whole file content), ordered
            by file name. The list is empty when the directory has no files.
        """
        pages = []
        # Sort so that the page -> output index mapping is stable across runs;
        # os.listdir() returns entries in arbitrary order.
        for name in sorted(os.listdir(dir_name)):
            # listdir() yields bare names, so they must be joined with the
            # directory before opening.
            path = os.path.join(dir_name, name)
            if not os.path.isfile(path):
                continue  # sub-directories cannot be opened as pages
            with open(path, 'r', encoding='utf-8') as f:
                pages.append(f.read())
        return pages

    def re_change(self, web_data, index=0, out_dir='../end'):
        """Convert one page to Traditional Chinese and append it to a file.

        Args:
            web_data: Page source as a string. A sequence of strings (for
                example the result of ``readlines()``) is also accepted and
                is concatenated first.
            index: Number used for the output file name, ``<index>.txt``.
            out_dir: Directory that receives the converted files; it is
                created when missing.
        """
        if not isinstance(web_data, str):
            # Converter.convert() works on text, so join a list of lines.
            web_data = ''.join(web_data)
        sentence = Converter('zh-hant').convert(web_data)
        os.makedirs(out_dir, exist_ok=True)
        out_path = os.path.join(out_dir, '{}.txt'.format(index))
        # Append mode is kept from the original script: re-running adds to
        # any existing output instead of replacing it.
        with open(out_path, 'a+', encoding='utf-8') as f:
            f.write(sentence)
        print('网站转换成功..')

    def main(self):
        """Read all local pages and convert them in a pool of worker processes.

        Blocks until every page has been written. An exception raised in a
        worker is re-raised here instead of being silently dropped.
        """
        pages = self.read_local_web()
        if not pages:
            return  # nothing to convert; avoid starting a pool for no work
        with multiprocessing.Pool(min(10, len(pages))) as pool:
            pending = [
                pool.apply_async(self.re_change, args=(page, i))
                for i, page in enumerate(pages)
            ]
            # Leaving the ``with`` block terminates the pool, so wait for
            # every task first; get() also surfaces worker exceptions.
            for task in pending:
                task.get()


# Script entry point: build the converter and run the whole pipeline.
# The guard also keeps worker processes from re-running this on import.
if __name__ == '__main__':
    Fan_jian_change().main()
# Source: blog post by Yihan_07, posted on 2019-08-28 19:02 (page footer: 453 views, 0 comments; edit / bookmark / report links).