用Python批量去除PDF文件的密码
注意:前提是你知道密码,本代码不是暴力跑字典
最近有个需求,下载了一堆PDF,但都有加密,密码还不一样,每次打开都要输密码很麻烦,所有有了此工具,批量去除所有密码。
import os
from pypdf import PdfReader, PdfWriter
def decrypt_pdfs(folder_path, passwords):
for filename in os.listdir(folder_path):
if filename.endswith('.pdf'):
file_path = os.path.join(folder_path, filename)
try:
with open(file_path, 'rb') as pdf_file:
pdf_reader = PdfReader(pdf_file)
if pdf_reader.is_encrypted:
success = False
for password in passwords:
try:
pdf_reader.decrypt(password)
if pdf_reader.pages:
pdf_writer = PdfWriter()
for page_num in range(len(pdf_reader.pages)):
page = pdf_reader.pages[page_num]
pdf_writer.add_page(page)
file_name_without_ext = os.path.splitext(filename)[0]
new_file_name = f"{file_name_without_ext}_decrypted.pdf"
new_file_path = os.path.join(folder_path, new_file_name)
with open(new_file_path, 'wb') as new_pdf_file:
pdf_writer.write(new_pdf_file)
print(f"已使用密码 {password} 成功解密并保存为: {new_file_path}")
success = True
break
except Exception:
continue
if not success:
print(f"!!!!无法使用提供的任何密码解密 {filename}")
else:
print(f"{filename} 无密码,无需处理。")
except Exception as e:
print(f"处理文件 {filename} 时出现错误: {e}")
# 你的PDF文件所在文件夹路径
folder_path = 'C:\\Users\\lianq\\Downloads'
# 实际可能的密码组
passwords = ['12345678', '123qwe', '123456']
decrypt_pdfs(folder_path, passwords)