# @Time : 2021/11/1 22:47
# @Author :wenkaic
# @File : 002文件处理
# @Project : python爬虫
"""Strip non-Chinese text from a scraped file and write the cleaned result.

Run as a script, this reads ``003斗破苍穹.json`` as UTF-8 text, filters it
with :func:`find_chinese`, and writes the result to ``004斗破苍穹.txt``.
"""
import re

# Matches every character that should be REMOVED: anything that is not a CJK
# ideograph in U+4E00..U+9FA5, a newline, a backslash, or one of , : 。 !
# NOTE(review): the doubled backslashes inside this raw-string character class
# mean a literal backslash is kept in the output as well; that looks
# unintended, but the pattern is left unchanged to preserve existing output.
_UNWANTED_CHARS = re.compile(r'[^\u4e00-\u9fa5\n\\,\\:\\。\\!]')

# Matches a run of one or more consecutive newlines.
_NEWLINE_RUN = re.compile(r'\n+')

SOURCE_PATH = '003斗破苍穹.json'
TARGET_PATH = '004斗破苍穹.txt'


def find_chinese(file: str) -> str:
    """Return *file* reduced to its Chinese text, and print the result.

    Despite its name, ``file`` is the text content to filter, not a path or
    a file object.

    Processing steps, in order:

    1. Delete every character matched by ``_UNWANTED_CHARS``.
    2. Collapse each run of newlines into a single newline.
    3. Append a space after every ``章``.
    4. Prepend a space before every ``第``.

    Args:
        file: The raw text to filter.

    Returns:
        The filtered text. The same text is also printed to stdout.
    """
    chinese = _UNWANTED_CHARS.sub('', file)
    chinese = _NEWLINE_RUN.sub('\n', chinese)
    # Plain literal replacements; no regex needed for single fixed characters.
    chinese = chinese.replace('章', '章 ')
    chinese = chinese.replace('第', ' 第')
    print(chinese)
    return chinese


def main() -> None:
    """Read the source file, filter it, and write the cleaned text."""
    # Context managers guarantee both handles are closed, even on error.
    with open(SOURCE_PATH, 'r', encoding='utf-8') as source:
        content = source.read()

    cleaned = find_chinese(content)

    with open(TARGET_PATH, 'w', encoding='utf-8') as target:
        target.write(cleaned)


if __name__ == '__main__':
    main()