-
Notifications
You must be signed in to change notification settings - Fork 1.9k
/
remove_pdf_metadata.py
33 lines (25 loc) · 1.07 KB
/
remove_pdf_metadata.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
import PyPDF2
def remove_metadata(pdf_file):
# Open the PDF file.
with open(pdf_file, 'rb') as file:
reader = PyPDF2.PdfReader(file)
# Check if metadata exists.
if reader.metadata is not None:
print("Metadata found in the PDF file.")
# Create a new PDF file without metadata.
writer = PyPDF2.PdfWriter()
# Copy pages from the original PDF to the new PDF.
for page_num in range(len(reader.pages)):
page = reader.pages[page_num]
writer.add_page(page)
# Open a new file to write the PDF without metadata.
new_pdf_file = f"{pdf_file.split('.')[0]}_no_metadata.pdf"
with open(new_pdf_file, 'wb') as output_file:
writer.write(output_file)
print(f"PDF file without metadata saved as '{new_pdf_file}'.")
else:
print("No metadata found in the PDF file.")
# Specify the path to your PDF file.
pdf_file_path = "EEE415PQ.pdf"
# Call the function to remove metadata.
remove_metadata(pdf_file_path)