I have a script that copies the text of Word documents into an Excel sheet. However, I am having trouble carrying over the numbering format (what "Match Destination Formatting" gives when pasting), which I need. My code is below; if anyone can help me, that would be great 🙂
<code>import os
from docx import Document
import openpyxl
from openpyxl.utils.dataframe import dataframe_to_rows
def read_word_doc(file_path):
    """Return the text of the paragraphs in a Word document.

    Args:
        file_path: Path of the ``.docx`` file to open.

    Returns:
        The text of each paragraph in ``doc.paragraphs``, in order, each
        followed by a newline. A document without paragraphs yields ``""``.

    Note:
        ``paragraph.text`` only contains the text stored in the paragraph's
        runs. Automatic list numbers ("1.", "a)", ...) are rendered by Word
        from the numbering definitions and are not part of that text, so
        they do not appear in the returned string.
    """
    doc = Document(file_path)
    # Terminate every paragraph with a real newline: a bare "n" separator
    # cannot be told apart from the letter n when the text is split again.
    return "".join(paragraph.text + "\n" for paragraph in doc.paragraphs)
def copy_to_excel(ws, content, row):
    """Write newline-separated text into column 1, one line per row.

    Args:
        ws: Worksheet-like object exposing ``cell(row=, column=, value=)``.
        content: Text whose lines are separated by ``"\\n"``.
        row: 1-based index of the first row to write.

    Returns:
        The index of the first row after the last one written.
    """
    # Split on the newline character, not on the letter "n", so words that
    # contain an n stay in one cell. A trailing newline yields one final
    # empty cell, which leaves a blank row after the text.
    for paragraph in content.split("\n"):
        ws.cell(row=row, column=1, value=paragraph)
        row += 1
    return row
def create_excel_file(folder_path, excel_file_name):
    """Copy the text of every Word document in a folder into one workbook.

    Each ``.docx`` file found directly in ``folder_path`` is read with
    ``read_word_doc`` and appended to column 1 of the active sheet with
    ``copy_to_excel``.

    Args:
        folder_path: Directory that is scanned for ``.docx`` files.
        excel_file_name: File name of the workbook to write. It is joined
            onto ``folder_path``; an absolute path is used unchanged.
    """
    wb = openpyxl.Workbook()
    ws = wb.active
    row = 1
    # Scan the folder the caller asked for (not a hard-coded one); sorting
    # makes the row order reproducible because os.listdir order is arbitrary.
    for file_name in sorted(os.listdir(folder_path)):
        # Accept the extension in any letter case.
        if not file_name.lower().endswith(".docx"):
            continue
        # "~$name.docx" is the lock file Word keeps next to an open
        # document; it is not a readable document.
        if file_name.startswith("~$"):
            continue
        file_path = os.path.join(folder_path, file_name)
        content = read_word_doc(file_path)
        row = copy_to_excel(ws, content, row)
    # Save once, after all documents were copied, under the requested name.
    path = os.path.join(folder_path, excel_file_name)
    wb.save(path)
</code>
<code>import os
from docx import Document
import openpyxl
from openpyxl.utils.dataframe import dataframe_to_rows
def read_word_doc(file_path):
    """Return the text of the paragraphs in a Word document.

    Args:
        file_path: Path of the ``.docx`` file to open.

    Returns:
        The text of each paragraph in ``doc.paragraphs``, in order, each
        followed by a newline. A document without paragraphs yields ``""``.

    Note:
        ``paragraph.text`` only contains the text stored in the paragraph's
        runs. Automatic list numbers ("1.", "a)", ...) are rendered by Word
        from the numbering definitions and are not part of that text, so
        they do not appear in the returned string.
    """
    doc = Document(file_path)
    # Terminate every paragraph with a real newline: a bare "n" separator
    # cannot be told apart from the letter n when the text is split again.
    return "".join(paragraph.text + "\n" for paragraph in doc.paragraphs)
def copy_to_excel(ws, content, row):
    """Write newline-separated text into column 1, one line per row.

    Args:
        ws: Worksheet-like object exposing ``cell(row=, column=, value=)``.
        content: Text whose lines are separated by ``"\\n"``.
        row: 1-based index of the first row to write.

    Returns:
        The index of the first row after the last one written.
    """
    # Split on the newline character, not on the letter "n", so words that
    # contain an n stay in one cell. A trailing newline yields one final
    # empty cell, which leaves a blank row after the text.
    for paragraph in content.split("\n"):
        ws.cell(row=row, column=1, value=paragraph)
        row += 1
    return row
def create_excel_file(folder_path, excel_file_name):
    """Copy the text of every Word document in a folder into one workbook.

    Each ``.docx`` file found directly in ``folder_path`` is read with
    ``read_word_doc`` and appended to column 1 of the active sheet with
    ``copy_to_excel``.

    Args:
        folder_path: Directory that is scanned for ``.docx`` files.
        excel_file_name: File name of the workbook to write. It is joined
            onto ``folder_path``; an absolute path is used unchanged.
    """
    wb = openpyxl.Workbook()
    ws = wb.active
    row = 1
    # Scan the folder the caller asked for (not a hard-coded one); sorting
    # makes the row order reproducible because os.listdir order is arbitrary.
    for file_name in sorted(os.listdir(folder_path)):
        # Accept the extension in any letter case.
        if not file_name.lower().endswith(".docx"):
            continue
        # "~$name.docx" is the lock file Word keeps next to an open
        # document; it is not a readable document.
        if file_name.startswith("~$"):
            continue
        file_path = os.path.join(folder_path, file_name)
        content = read_word_doc(file_path)
        row = copy_to_excel(ws, content, row)
    # Save once, after all documents were copied, under the requested name.
    path = os.path.join(folder_path, excel_file_name)
    wb.save(path)
</code>
import os
from docx import Document
import openpyxl
from openpyxl.utils.dataframe import dataframe_to_rows
def read_word_doc(file_path):
    """Return the text of the paragraphs in a Word document.

    Args:
        file_path: Path of the ``.docx`` file to open.

    Returns:
        The text of each paragraph in ``doc.paragraphs``, in order, each
        followed by a newline. A document without paragraphs yields ``""``.

    Note:
        ``paragraph.text`` only contains the text stored in the paragraph's
        runs. Automatic list numbers ("1.", "a)", ...) are rendered by Word
        from the numbering definitions and are not part of that text, so
        they do not appear in the returned string.
    """
    doc = Document(file_path)
    # Terminate every paragraph with a real newline: a bare "n" separator
    # cannot be told apart from the letter n when the text is split again.
    return "".join(paragraph.text + "\n" for paragraph in doc.paragraphs)
def copy_to_excel(ws, content, row):
    """Write newline-separated text into column 1, one line per row.

    Args:
        ws: Worksheet-like object exposing ``cell(row=, column=, value=)``.
        content: Text whose lines are separated by ``"\\n"``.
        row: 1-based index of the first row to write.

    Returns:
        The index of the first row after the last one written.
    """
    # Split on the newline character, not on the letter "n", so words that
    # contain an n stay in one cell. A trailing newline yields one final
    # empty cell, which leaves a blank row after the text.
    for paragraph in content.split("\n"):
        ws.cell(row=row, column=1, value=paragraph)
        row += 1
    return row
def create_excel_file(folder_path, excel_file_name):
    """Copy the text of every Word document in a folder into one workbook.

    Each ``.docx`` file found directly in ``folder_path`` is read with
    ``read_word_doc`` and appended to column 1 of the active sheet with
    ``copy_to_excel``.

    Args:
        folder_path: Directory that is scanned for ``.docx`` files.
        excel_file_name: File name of the workbook to write. It is joined
            onto ``folder_path``; an absolute path is used unchanged.
    """
    wb = openpyxl.Workbook()
    ws = wb.active
    row = 1
    # Scan the folder the caller asked for (not a hard-coded one); sorting
    # makes the row order reproducible because os.listdir order is arbitrary.
    for file_name in sorted(os.listdir(folder_path)):
        # Accept the extension in any letter case.
        if not file_name.lower().endswith(".docx"):
            continue
        # "~$name.docx" is the lock file Word keeps next to an open
        # document; it is not a readable document.
        if file_name.startswith("~$"):
            continue
        file_path = os.path.join(folder_path, file_name)
        content = read_word_doc(file_path)
        row = copy_to_excel(ws, content, row)
    # Save once, after all documents were copied, under the requested name.
    path = os.path.join(folder_path, excel_file_name)
    wb.save(path)
I tried using a library that interacts with Windows, but that was really buggy. I also tried pandas, but that was no help either.