|
|
|
@ -25,6 +25,7 @@ for root, dirs, files in os.walk(working_dir):
|
|
|
|
|
file_path = os.path.join(county_dir, file)
|
|
|
|
|
# Only process Word documents (.docx) whose file name does not start with '~'
|
|
|
|
|
if file_path.endswith('.docx') and not file.startswith('~'):
|
|
|
|
|
cityName=file_path.replace(working_dir,'')[1:].split("各县")[0]
|
|
|
|
|
areaName = file
|
|
|
|
|
areaName = re.sub(r'[^\u4e00-\u9fa5]', '', areaName)
|
|
|
|
|
if '市' not in areaName and '县' not in areaName and '区' not in areaName:
|
|
|
|
@ -44,6 +45,6 @@ for root, dirs, files in os.walk(working_dir):
|
|
|
|
|
# Replace the keyword (first space-separated field of `line`) in areaName with the second field of `line`
|
|
|
|
|
areaName = areaName.replace(line.split(' ')[0], line.split(' ')[1])
|
|
|
|
|
#
|
|
|
|
|
print(f"正在处理文件:{areaName}")
|
|
|
|
|
print(f"正在处理县区:{cityName}{areaName}")
|
|
|
|
|
|
|
|
|
|
print("恭喜,所有县区数据整理工作成功完成!")
|
|
|
|
|