# pdf_splitter/pdf_splitter.py

import os
import shutil
from PyPDF2 import PdfReader, PdfWriter
def split_pdf_pages(processed_folder):
    """Split every multi-page PDF in the current directory into single pages.

    Each file in the current working directory whose name ends with ``.pdf``
    is opened. If it has more than one page, every page is written to
    ``processed_folder`` as ``split_<page number>_<original name>``, with
    page numbers starting at 1. The original file is then moved into
    ``processed_folder`` whether or not it was split.

    Args:
        processed_folder: Directory that receives the single-page files and
            the original PDFs. It is created if it does not exist yet.
    """
    # exist_ok avoids the check-then-create race of exists() + makedirs().
    os.makedirs(processed_folder, exist_ok=True)

    for filename in os.listdir('.'):
        file_path = os.path.join('.', filename)
        # Skip other file types, and directories whose name merely ends in
        # ".pdf" (opening those would raise).
        if not filename.endswith('.pdf') or not os.path.isfile(file_path):
            continue

        with open(file_path, 'rb') as infile:
            reader = PdfReader(infile)
            # The reader was built on `infile`, so all page access stays
            # inside this `with` block.
            if len(reader.pages) > 1:
                for page_number, page in enumerate(reader.pages, start=1):
                    writer = PdfWriter()
                    writer.add_page(page)

                    split_filename = f"split_{page_number}_{filename}"
                    split_filepath = os.path.join(processed_folder, split_filename)

                    with open(split_filepath, 'wb') as outfile:
                        writer.write(outfile)

        # Move the original only after the `with` block has closed it.
        shutil.move(file_path, os.path.join(processed_folder, filename))
2024-02-10 20:49:26 +00:00
# Destination folder passed to split_pdf_pages when run as a script.
processed_folder = 'Processed'

# Run the splitter only when this file is executed directly, so that
# importing the module does not trigger the call as a side effect.
if __name__ == "__main__":
    split_pdf_pages(processed_folder)