from docx import Document
import os
# Directory that is scanned for .docx files; the generated .txt files are
# written into this same directory.
cur_path = r"D:\Document\生产\VR\auto_video\2-Vedios"
def get_paragraphs(docx_path):
    """Return the text of every paragraph in a Word document.

    Args:
        docx_path: Path of the .docx file; passed unchanged to ``Document``.

    Returns:
        A list with one string per entry of ``document.paragraphs``, in the
        order that attribute yields them. Paragraphs with no text are kept
        as empty strings.
    """
    # Open the Word document and collect the text of each paragraph.
    doc = Document(docx_path)
    return [para.text for para in doc.paragraphs]
# Convert every Word document in cur_path into a UTF-8 text file with the
# same base name, writing one non-empty paragraph per line.
for file_name in os.listdir(cur_path):
    # Compare the extension case-insensitively so "X.DOCX" is converted too.
    if not file_name.lower().endswith(".docx"):
        continue
    # Word keeps a "~$"-prefixed owner/lock file beside a document that is
    # currently open; it is not a valid .docx package, so skip it instead of
    # letting Document() fail and abort the whole run.
    if file_name.startswith("~$"):
        continue

    cur_texts = get_paragraphs(os.path.join(cur_path, file_name))

    # Swap the 5-character ".docx" suffix for ".txt".
    txt_path = os.path.join(cur_path, file_name[:-5] + ".txt")

    # The with-block closes the file on exit, so no explicit close() is
    # needed. A separate name is used for the handle so it no longer
    # overwrites the loop variable holding the file name.
    with open(txt_path, "w", encoding="utf-8") as out_file:
        for item in cur_texts:
            if not item:
                continue
            # Drop embedded line breaks so each paragraph stays on one line.
            out_file.write(item.replace("\n", "") + "\n")