用Python批量去除PDF文件的密码

发布于:2025-02-11 ⋅ 阅读:(14) ⋅ 点赞:(0)

注意:前提是你知道密码,本代码不是暴力跑字典

最近有个需求,下载了一堆PDF,但都有加密,密码还不一样,每次打开都要输密码很麻烦,所有有了此工具,批量去除所有密码。

import os
from pypdf import PdfReader, PdfWriter

def decrypt_pdfs(folder_path, passwords):
    for filename in os.listdir(folder_path):
        if filename.endswith('.pdf'):
            file_path = os.path.join(folder_path, filename)
            try:
                with open(file_path, 'rb') as pdf_file:
                    pdf_reader = PdfReader(pdf_file)
                    if pdf_reader.is_encrypted:
                        success = False
                        for password in passwords:
                            try:
                                pdf_reader.decrypt(password)
                                if pdf_reader.pages:
                                    pdf_writer = PdfWriter()
                                    for page_num in range(len(pdf_reader.pages)):
                                        page = pdf_reader.pages[page_num]
                                        pdf_writer.add_page(page)
                                    file_name_without_ext = os.path.splitext(filename)[0]
                                    new_file_name = f"{file_name_without_ext}_decrypted.pdf"
                                    new_file_path = os.path.join(folder_path, new_file_name)
                                    with open(new_file_path, 'wb') as new_pdf_file:
                                        pdf_writer.write(new_pdf_file)
                                    print(f"已使用密码 {password} 成功解密并保存为: {new_file_path}")
                                    success = True
                                    break
                            except Exception:
                                continue
                        if not success:
                            print(f"!!!!无法使用提供的任何密码解密 {filename}")
                    else:
                        print(f"{filename} 无密码,无需处理。")
            except Exception as e:
                print(f"处理文件 {filename} 时出现错误: {e}")


# 你的PDF文件所在文件夹路径
folder_path = 'C:\\Users\\lianq\\Downloads'
# 实际可能的密码组
passwords = ['12345678', '123qwe', '123456']
decrypt_pdfs(folder_path, passwords)