python入门学习小工具制作系列各种小工具整理

置顶 LinuxLOVERes

已于 2025-06-03 19:29:14 修改

阅读量3k

点赞数 11

CC 4.0 BY-SA版权

文章标签：学习 python 小程序 python小工具

于 2023-06-25 09:30:00 首次发布

本文链接：https://blog.youkuaiyun.com/LinuxLOVERes/article/details/131360737

一、制作基于windows系统批量重命名文件小工具

参考博客：

使用python做一个批量重命名文件的小工具_讷言丶的博客-优快云博客

效果展示：

临时01

代码实现：

import os
from tkinter import filedialog
import tkinter as tk
from tkinter import messagebox

root = tk.Tk()
root.geometry('400x200+550+200')
root.title('批量重命名文件小工具')
page = tk.Frame()
page.pack()
text = tk.StringVar()


def rename_file():
    filepath = filedialog.askdirectory()
    index = 0
    if len(os.listdir(filepath)) == 0:
        messagebox.showinfo(title="文件重命名", message="该目录下文件为空，请重新选择目录")
    else:
        for filename in os.listdir(filepath):
            index += 1
            file_path = os.path.join(filepath, filename)
            if os.path.isfile(file_path):
                name, ext = os.path.splitext(filename)
                new_name = text.get() + str(index) + ext
                # print(new_name)
                os.rename(file_path, os.path.join(filepath, new_name))
        messagebox.showinfo(title='文件重命名', message='文件重命名成功，请查看目录')


tk.Label(page).grid(row=0, column=1)
tk.Label(page, text='文件名称前缀:', font=('华文楷体', 15)).grid(row=2, column=1, pady=10)
tk.Entry(page, textvariable=text).grid(row=2, column=2)
tk.Button(page, text='选择目录并重命名文件', font=('华文楷体', 15), command=rename_file).grid(row=3, column=2)
root.mainloop()

二、制作时间戳转换器

效果展示：

临时03

代码实现：

import time
import tkinter as tk
from tkinter import messagebox

root = tk.Tk()
root.geometry('400x300+500+300')
root.title('时间戳转换工具')

usertime = tk.StringVar()
usertimestamp = tk.StringVar()

page = tk.Frame(root)
page.pack()

tk.Label(page).grid(row=0, column=1)

tk.Label(page, text='请输入时间【格式：Y-M-D h:m:s】:', font=('黑体', 10)).grid(row=1, column=1, pady=10)
tk.Entry(page, textvariable=usertime).grid(row=1, column=2)

tk.Label(page, text='请输入时间戳: ', font=('黑体', 10)).grid(row=3, column=1, pady=30)
tk.Entry(page, textvariable=usertimestamp).grid(row=3, column=2)


# 将时间转换为时间戳，秒级
def timestamp_s():
    time_value = usertime.get()
    timeArray = time.strptime(time_value, "%Y-%m-%d %H:%M:%S")
    timestamp = time.mktime(timeArray)
    times = int(timestamp)
    messagebox.showinfo(title='时间戳(s)', message=f'获取到的时间戳(s)为{times}')


# 将时间转换为时间戳，毫秒级
def timestamp_ms():
    time_value = usertime.get()
    timeArray = time.strptime(time_value, "%Y-%m-%d %H:%M:%S")
    timestamp = time.mktime(timeArray)
    times = int(round(timestamp * 1000))
    messagebox.showinfo(title='时间戳(s)', message=f'获取到的时间戳(s)为{times}')


# 秒级时间戳转换
def time_s():
    time_value = usertimestamp.get()
    if len(time_value) == 10:
        timeas = int(time_value)
        time_local = time.localtime(timeas)
        dt = time.strftime("%Y-%m-%d %H:%M:%S", time_local)
        messagebox.showinfo(title='时间', message=f'获取到的时间为{dt}')
    elif len(time_value) == 13:
        timeas = int(time_value)
        timestamps = int(round(timeas / 1000))
        time_local = time.localtime(timestamps)
        dt = time.strftime("%Y-%m-%d %H:%M:%S", time_local)
        messagebox.showinfo(title='时间', message=f'获取到的时间为{dt}')

tk.Button(page, text='转换为时间戳(s)', command=timestamp_s).grid(row=2, column=1)
tk.Button(page, text='转换为时间戳(ms)', command=timestamp_ms).grid(row=2, column=2)
tk.Button(page, text='转换为时间', command=time_s).grid(row=4, column=1)
root.mainloop()

三、制作图书管理小工具

效果展示：

临时02

代码实现：

import tkinter as tk
from tkinter import messagebox


# 定义Book类
class Book:
    def __init__(self, title, author, isbn):
        self.title = title
        self.author = author
        self.isbn = isbn


# 定义GUI窗口
class BookManagementSystem:
    def __init__(self, master):
        self.master = master
        self.master.title("图书管理系统")

        # 创建标题标签
        tk.Label(self.master, text="图书管理系统", font=("Arial", 20)).grid(column=0, row=0, columnspan=3, pady=10)

        # 创建书籍信息输入框
        tk.Label(self.master, text="书名").grid(column=0, row=1)
        self.title_entry = tk.Entry(self.master)
        self.title_entry.grid(column=1, row=1, padx=5, pady=5)
        tk.Label(self.master, text="作者").grid(column=0, row=2)
        self.author_entry = tk.Entry(self.master)
        self.author_entry.grid(column=1, row=2, padx=5, pady=5)
        tk.Label(self.master, text="ISBN号").grid(column=0, row=3)
        self.isbn_entry = tk.Entry(self.master)
        self.isbn_entry.grid(column=1, row=3, padx=5, pady=5)

        # 创建添加书籍按钮
        self.add_book_button = tk.Button(self.master, text="添加书籍", command=self.add_book)
        self.add_book_button.grid(column=0, row=4, pady=10)

        # 创建书籍列表框
        tk.Label(self.master, text="当前书籍列表").grid(column=2, row=1)
        self.book_listbox = tk.Listbox(self.master)
        self.book_listbox.grid(column=2, row=2, rowspan=3, padx=10, pady=5)
        self.update_book_list()

        # 创建删除书籍按钮
        self.delete_book_button = tk.Button(self.master, text="删除书籍", command=self.delete_book)
        self.delete_book_button.grid(column=2, row=4, pady=10)

    # 添加书籍方法
    def add_book(self):
        title = self.title_entry.get()
        author = self.author_entry.get()
        isbn = self.isbn_entry.get()
        book = Book(title, author, isbn)
        with open("books.txt", "a") as f:
            f.write(f"{book.title},{book.author},{book.isbn}\n")
        messagebox.showinfo("添加书籍", "添加书籍成功！")
        self.update_book_list()

    # 删除书籍方法
    def delete_book(self):
        selection = self.book_listbox.curselection()
        if len(selection) == 0:
            messagebox.showerror("删除书籍", "请选择要删除的书籍！")
            return
        index = selection[0]
        book = self.book_listbox.get(index)
        with open("books.txt", "r") as f:
            lines = f.readlines()
        with open("books.txt", "w") as f:
            for line in lines:
                if line.strip() != book:
                    f.write(line)
        messagebox.showinfo("删除书籍", "删除书籍成功！")
        self.update_book_list()

    # 更新书籍列表方法
    def update_book_list(self):
        self.book_listbox.delete(0, tk.END)
        with open("books.txt", "r") as f:
            for line in f.readlines():
                book = line.strip()
                self.book_listbox.insert(tk.END, book)


# 启动GUI窗口
if __name__ == '__main__':
    root = tk.Tk()
    app = BookManagementSystem(root)
    root.mainloop()

四、制作jpg、png图片转ico图标小工具

效果展示：

临时04

代码实现：

import tkinter as tk
from tkinter import filedialog
# PythonMargick包可以到Unofficial Windows Binaries for Python Extension Packages下载
import PythonMagick
 
root = tk.Tk()
root.withdraw()
 
Fpath = filedialog.askopenfilename()
 
img = PythonMagick.Image(Fpath)
# 这里要设置一下尺寸，不然会报ico尺寸异常错误
img.sample('256x256')
img.write('robin.ico')

五、制作图片和base64互转小工具

效果展示：

临时05

代码实现：

import base64
import tkinter as tk
from tkinter import filedialog

root = tk.Tk()
root.withdraw()

Fpath = filedialog.askopenfilename()
def file_to_base64():
    print(Fpath)
    f=open(Fpath,'rb') #二进制方式打开图文件
    ls_f=base64.b64encode(f.read()) #读取文件内容，转换为base64编码
    open('x.txt', 'wb').write(ls_f)

def base64_to_file():
    print(Fpath)
    decoded = base64.b64decode(open(Fpath, 'rb').read())
    open('1.jpg', 'wb').write(decoded)  # 保存


if __name__ == '__main__':
    if "jpg" in Fpath or 'png' in Fpath or 'jpeg' in Fpath:
        file_to_base64()
    elif 'txt' in Fpath:
        base64_to_file()

六、制作英文翻译器（小工具）

代码逻辑：

requests模块请求第三方翻译接口，拿到数据后通过tkinter展示出来

效果展示：

临时06

代码实现：

import requests
import tkinter as tk
from tkinter import messagebox

root = tk.Tk()
root.geometry('1000x500+350+100')
root.title('英文翻译器')
page = tk.Frame()
page.pack()

text = tk.StringVar()
tk.Label(page).grid(row=0, column=1)
tk.Label(page, text='翻译小程序', font=('黑体', 20)).grid(row=1, column=1, pady=20)


def sure():
    page.pack_forget()
    page2.pack()


def exit():
    page2.pack_forget()
    page.pack()


def dcfy():
    url = 'https://fanyi.xxx.com/trans'
    headers = {
        "user-agent": 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/111.0.0.0 Safari/537.36',
        "referer": 'https://fanyi.xxx.com/'
    }
    chinese = text.get()
    data = {
        'q': chinese,
        'from': 'Auto',
        'to': 'Auto'
    }

    resp = requests.post(url=url, headers=headers, data=data).json()
    chinatext = resp.get('web')[0]['key']
    Englishtext = resp.get('web')[0]['value'][0]
    messagebox.showinfo(title='单词翻译', message=Englishtext)


def para():
    page.pack_forget()
    page3.pack()


def exit2():
    page3.pack_forget()
    page.pack()


def dlfy():
    url = 'https://fanyi.xxx.com/trans'
    headers = {
        "user-agent": 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/111.0.0.0 Safari/537.36',
        "referer": 'https://fanyi.xxx.com/'
    }
    chinese = text.get()
    data = {
        'q': chinese,
        'from': 'Auto',
        'to': 'Auto'
    }

    resp = requests.post(url=url, headers=headers, data=data).json()
    Englishtext = resp['translation'][0]
    messagebox.showinfo(title='段落句子翻译', message=f'{Englishtext}')


tk.Button(page, text='单词翻译', font=('黑体', 15), command=sure).grid(row=2, column=1, pady=20)
tk.Button(page, text='句子翻译', font=('黑体', 15), command=para).grid(row=2, column=2, padx=10, pady=20)

page2 = tk.Frame()
tk.Entry(page2, textvariable=text, bd=5).grid(row=2, column=2, pady=20)
tk.Button(page2, text='翻译', font=('黑体', 15), command=dcfy).grid(row=3, column=1, padx=20)
tk.Button(page2, text='返回上一页', font=('黑体', 15), command=exit).grid(row=3, column=2, pady=20)

page3 = tk.Frame()
tk.Entry(page3, textvariable=text, bd=5).grid(row=2, column=2, pady=20)
tk.Button(page3, text='翻译', font=('黑体', 15), command=dlfy).grid(row=3, column=1, padx=20)
tk.Button(page3, text='返回上一页', font=('黑体', 15), command=exit2).grid(row=3, column=2, pady=20)

root.mainloop()

七、制作图片查看器（小工具）：

效果展示：

临时07

代码实现：

import tkinter as tk
import glob
from PIL import Image, ImageTk

root = tk.Tk()  # 创建窗口
root.geometry('650x700+300+50')  # 设置弹出窗口的大小和在屏幕中的位置
root.title('图片查看器')  # 设置弹出窗口的标题

imgs = glob.glob('img/*.jpeg')
imgs = [ImageTk.PhotoImage(Image.open(item)) for item in imgs]

current_photo_no = 0
img_label = tk.Label(root, image=imgs[current_photo_no], width=640, height=640)
img_label.pack()
number_var = tk.StringVar()
number_var.set('1 of 8')
tk.Label(root, textvariable=number_var, bd=1, relief=tk.SUNKEN, anchor=tk.CENTER).pack(fill=tk.X)

button_form = tk.Frame(root)
button_form.pack()
prev_img = tk.Button(button_form, text='上一页')
next_img = tk.Button(button_form, text='下一页')
prev_img.pack(side=tk.LEFT, anchor=tk.CENTER)
next_img.pack(side=tk.RIGHT, anchor=tk.CENTER)


def change_images(next_no):
    global current_photo_no
    current_photo_no += next_no
    if current_photo_no >= len(imgs):
        current_photo_no = 0
    if current_photo_no < 0:
        current_photo_no = len(imgs) - 1
    number_var.set(f'{current_photo_no + 1} of {len(imgs)}')
    img_label.configure(image=imgs[current_photo_no])


prev_img.config(command=lambda: change_images(-1))
next_img.config(command=lambda: change_images(1))
root.mainloop()

八、制作BMI身体指数计算器（小工具）：

效果展示：

临时08

代码实现：

import tkinter as tk
from tkinter import messagebox

root = tk.Tk()
root.geometry('350x230+500+230')  # 设置弹出框位置和大小
# root.iconbitmap('E:/pythonProject/3.ico')  # 设置弹出框图标

root.title('BMI身体指数计算器')

height = tk.DoubleVar()
weight = tk.DoubleVar()

page = tk.Frame(root)
page.pack()

tk.Label(page).grid(row=0, column=0)

tk.Label(page, text='身高(米): ').grid(row=2, column=1, pady=20)
tk.Entry(page, textvariable=height).grid(row=2, column=2)

tk.Label(page, text='体重(kg): ').grid(row=3, column=1, pady=20)
tk.Entry(page, textvariable=weight).grid(row=3, column=2)


def jisuan():
    shengao = height.get()
    tizhong = weight.get()
    # print(shengao,tizhong)
    if shengao > 0 and tizhong > 0:
        BMI = tizhong / shengao ** 2
        BMI_new = float(('%.2f' % BMI))
        messagebox.showinfo(title='BMI身体指数计算',
                            message=f'您的身高为{shengao}m,您的体重为{tizhong}kg,您的BMI身体指数为{BMI_new}')
        if BMI_new < 18.4:
            messagebox.showinfo(title='BMI身体指数计算', message='BMI指数较低，提示您的身体消瘦，要注意补充营养哦!')
        elif BMI_new > 18.5 and BMI_new < 24:
            messagebox.showinfo(title='BMI身体指数计算', message='BMI指数为正常值，继续加油！')
        elif BMI_new > 24 and BMI_new < 28:
            messagebox.showinfo(title='BMI身体指数计算',
                                message='BMI指数较高，属于是超重了，提示您需要合理饮食，加强锻炼哦！')
        elif BMI_new > 28:
            messagebox.showinfo(title='BMI身体指数计算',
                                message='BMI指数很高，属于肥胖了，提示您需要注意身体健康了，过胖会增加人体器官的负担哦！')


tk.Button(page, text='计算', command=jisuan).grid(row=4, column=2, pady=10)

root.mainloop()

九，制作json数据格式化小工具

小工具效果：对于json格式（混乱）的数据做规范修改，格式化输出json数据。

import json
import tkinter as tk
from tkinter import filedialog

root = tk.Tk()
root.withdraw()

json_data_path = filedialog.askopenfilename()

with open(json_data_path) as json_file:
    data = json.load(json_file)

formatted_data = json.dumps(data, indent=4, sort_keys=True)
with open(json_data_path, 'w') as fp:
    fp.write(formatted_data)

十，微信消息轰炸

代码逻辑：即通过python的pyautogui库定位到微信的像素位置，然后通过模拟鼠标键盘操作自动发送消息

实现步骤：

1）先通过pyautogui定位到微信的桌面位置。

import pyautogui
import time

def search_positon():
    time.sleep(1)
    x1,y1 = pyautogui.position()
    print('您当前的位置坐标为:','x:'+str(x1)+'','y:'+str(y1))

if __name__ == '__main__':
    while True:
        search_positon()
        pass

效果展示：【具体方位不是固定的，只要确认可以点击打开微信即可】

2）编写消息发送逻辑，通过pyautogui自动下发微信消息

import pyautogui
import time
import pyperclip

user = input('输入用户名称:')
userinput = input('输入要发送的消息:')
pyautogui.click(37, 428, button='left', clicks=2)
# 找到微信程序位置，打开微信程序
time.sleep(0.5)
# 睡眠0.5秒
pyautogui.click(368, 83, button='left', clicks=1)
# 点击微信搜索框，具体位置可以通过运行上面的代码定位
pyperclip.copy(user)
pyautogui.hotkey('Ctrl', 'v')
# 输入搜索内容
pyautogui.press('enter')
# 点击回车搜索
time.sleep(0.5)
pyautogui.press('enter')
while True:
    pyperclip.copy(userinput)
    pyautogui.hotkey('Ctrl', 'v')
    pyautogui.press('enter')
    time.sleep(0.5)
# 死循环执行消息发送，每隔0.5秒发送一次

效果展示：

十一，制作OCR图片识别小工具

参考博客：

【Python • 图片识别】pytesseract快速识别提取图片中的文字_python识别图片中的文字_广龙宇的博客-优快云博客利用python做图片识别，识别提取图片中的文字会有很多方法，但是想要简单一点怎么办，那就可以使用tesseract识别引擎来实现，一行代码就可以做到提取图片文本。_python识别图片中的文字https://blog.youkuaiyun.com/weixin_47754149/article/details/125651707

效果展示：

临时09

代码实现：

from PIL import Image
import pytesseract
import tkinter as tk
from tkinter import filedialog

root = tk.Tk()
root.withdraw()

Fpath = filedialog.askopenfilename()


def read_image(name):
    with open('视频文件.txt','w',encoding='utf-8') as fp:
        fp.write(pytesseract.image_to_string(Image.open(name), lang='chi_sim'))

def main():
    read_image(Fpath)

if __name__ == '__main__':
    reslet = main()

十二，python代码制作证件照

效果展示：

将1寸蓝底照片修改为2寸橘色背景照片

原图：

代码修改后的效果图：

代码实现：

from rembg import remove
from PIL import Image, ImageEnhance
import cv2
import numpy as np


def create_id_photo(input_path, output_path,
                    bg_color=(255, 255, 255),
                    target_size=(295, 413),
                    dpi=300,
                    enhance=True):
    """
    制作专业证件照
    参数：
    input_path: 输入图片路径
    output_path: 输出图片路径
    bg_color: 背景颜色 (RGB)
    target_size: 目标尺寸 (宽, 高)
    dpi: 输出分辨率
    enhance: 是否启用图像增强
    """
    # 1. 去除背景
    with open(input_path, 'rb') as f:
        input_image = Image.open(f).convert("RGB")
        output_image = remove(input_image)

    # 2. 替换背景
    background = Image.new('RGB', output_image.size, bg_color)
    background.paste(output_image, mask=output_image.split()[3])  # 使用alpha通道

    # 3. 转换为OpenCV格式进行美颜处理
    cv_image = cv2.cvtColor(np.array(background), cv2.COLOR_RGB2BGR)

    if enhance:
        # 4. 美颜处理
        cv_image = cv2.bilateralFilter(cv_image, 9, 75, 75)  # 双边滤波
        cv_image = cv2.detailEnhance(cv_image, sigma_s=10, sigma_r=0.15)  # 细节增强

    # 5. 转换回PIL格式
    result_img = Image.fromarray(cv2.cvtColor(cv_image, cv2.COLOR_BGR2RGB))

    # 6. 调整尺寸
    result_img = result_img.resize(target_size, Image.LANCZOS)

    # 7. 增强对比度和锐度
    enhancer = ImageEnhance.Contrast(result_img)
    result_img = enhancer.enhance(1.1)
    enhancer = ImageEnhance.Sharpness(result_img)
    result_img = enhancer.enhance(1.2)

    # 8. 保存结果
    result_img.save(output_path, dpi=(dpi, dpi), quality=100)
    print(f"证件照已保存至 {output_path}")


# 使用示例
if __name__ == "__main__":
    # 常用尺寸预设（宽×高，单位：像素）
    sizes = {
        "1寸": (295, 413),  # 2.5×3.5cm @ 300dpi
        "2寸": (413, 579),  # 3.5×4.9cm @ 300dpi
        "小2寸": (413, 531)  # 3.5×4.5cm @ 300dpi
    }

    create_id_photo(
        input_path="C:/Users/17496/Pictures/个人二寸照片.jpg",
        output_path="C:/Users/17496/Pictures/动漫一寸照片.jpg",
        bg_color=("#FF7F00"),  # 白色背景
        target_size=sizes["2寸"],
        dpi=300,
        enhance=True
    )

注意事项：

1.）此代码运行前需要先安装对应的python库。

pip install pillow
pip install opencv-python
pip install rembg

如代码运行报错提示还有其他库缺失，请自行对应安装python库。

2.）图片大变小效果会比较好（比如1寸照改2寸照），小变大效果会比较差（比如2寸照改1寸照）

十三，python代码将pdf文件转为word文件

pdf文件分类：

pdf文件分为文字版pdf文件和图片版pdf文件。区分pdf文件是图片还是文字可以在文件中双击，双击后如果出现图片即为图片版pdf文件，双击后可以编辑即为文字版pdf。

下图为图片版pdf文件和文字版pdf文件示意图。

代码逻辑：

1，）针对文字类型的pdf文件

使用python的pdf2docx、pymupdf、python-docx库操作转换，使用tkinter库选择文件。

具体代码如下：

# 安装依赖库（需提前执行）
# pip install pdf2docx
# pip install pymupdf
# pip install python-docx
# pip install tkinter

import os
from pdf2docx import Converter
import fitz  # PyMuPDF
from tkinter import Tk, filedialog

def select_file():
    """选择PDF文件"""
    root = Tk()
    root.withdraw()  # 隐藏Tk窗口
    file_path = filedialog.askopenfilename(
        title="选择PDF文件",
        filetypes=[("PDF Files", "*.pdf")]
    )
    return file_path

def pdf_to_word(pdf_path, docx_path=None):
    """将PDF转换为Word文档"""
    try:
        # 使用pdf2docx库转换（保留格式）
        cv = Converter(pdf_path)
        if not docx_path:
            docx_path = pdf_path.replace(".pdf", "_converted.docx")
        cv.convert(docx_path, start=0, end=None)  # 转换全部页面
        cv.close()
        print(f"转换成功！文件已保存至: {docx_path}")
        return True
    except Exception as e:
        print(f"转换失败: {str(e)}")
        return False

if __name__ == "__main__":
    pdf_path = select_file()
    if pdf_path:
        pdf_to_word(pdf_path)
    else:
        print("未选择文件！")

效果展示：

pdf文字版文件转word文件

2，）针对图片类型的pdf文件

代码逻辑：

使用PyMuPDF库扫描提取所有pdf的图片，将提取到的pdf图片暂存到当前目录下的临时目录中，然后调用base64库将提取暂存的图片转为base64格式，之后调用百度云的OCR接口获取识别后的文本。最后将获取到的所有文本整合到word文件中。

import os
import fitz  # PyMuPDF
import base64
import requests
from docx import Document
from tkinter import Tk, filedialog

# 百度OCR配置（替换成您的实际API信息）
API_KEY = "xxxxxxxxxxxxx"
SECRET_KEY = "xxxxxxxxxxxxxxxxxxxxxxxxxxx"

# 百度OCR接口参数
OCR_URL = "https://aip.baidubce.com/rest/2.0/ocr/v1/xxxxxx_basic"  
# 高精度版接口 具体可以登录百度云官网查看接口，
# 链接：https://console.bce.baidu.com/support/?timestamp=1742695013150#/api?product=AI&project=%E6%96%87%E5%AD%97%E8%AF%86%E5%88%AB&parent=%E9%80%9A%E7%94%A8%E5%9C%BA%E6%99%AFOCR&api=rest%2F2.0%2Focr%2Fv1%2Fgeneral_basic&method=post


class PDFToWordConverter:
    def __init__(self):
        self.access_token = self.get_access_token()
        self.doc = Document()
        self.temp_img_folder = "temp_pdf_images"

    def get_access_token(self):
        """获取百度OCR的Access Token"""
        url = "https://aip.baidubce.com/oauth/2.0/token"
        params = {
            "grant_type": "client_credentials",
            "client_id": API_KEY,
            "client_secret": SECRET_KEY
        }
        return requests.post(url, params=params).json().get("access_token")

    def extract_images_from_pdf(self, pdf_path):
        """从PDF提取所有图片到临时文件夹"""
        if not os.path.exists(self.temp_img_folder):
            os.makedirs(self.temp_img_folder)

        doc = fitz.open(pdf_path)
        image_paths = []

        for page_num in range(len(doc)):
            page = doc.load_page(page_num)
            image_list = page.get_images(full=True)

            for img_index, img in enumerate(image_list):
                xref = img[0]
                base_image = doc.extract_image(xref)
                image_bytes = base_image["image"]
                image_ext = base_image["ext"]
                image_filename = f"{self.temp_img_folder}/page{page_num}_img{img_index}.{image_ext}"

                with open(image_filename, "wb") as img_file:
                    img_file.write(image_bytes)
                image_paths.append(image_filename)

        doc.close()
        return image_paths

    def image_to_base64(self, image_path):
        """将图片转换为Base64编码"""
        with open(image_path, "rb") as f:
            return base64.b64encode(f.read()).decode("utf-8")

    def baidu_ocr(self, image_base64):
        """调用百度OCR接口识别图片文字"""
        headers = {'Content-Type': 'application/x-www-form-urlencoded'}
        payload = {
            "image": image_base64,
            "access_token": self.access_token,
            "language_type": "CHN_ENG"  # 中英文混合
        }
        response = requests.post(OCR_URL, headers=headers, data=payload)
        if response.status_code == 200:
            return response.json()
        return None

    def process_pdf(self, pdf_path):
        """处理PDF主流程"""
        # 1. 提取PDF中的图片
        image_paths = self.extract_images_from_pdf(pdf_path)
        if not image_paths:
            raise ValueError("未检测到PDF中的图片内容")

        # 2. 逐张识别并写入Word
        for img_path in image_paths:
            # 转换为Base64
            img_base64 = self.image_to_base64(img_path)

            # 调用OCR
            result = self.baidu_ocr(img_base64)

            # 解析结果
            if result and "words_result" in result:
                for item in result["words_result"]:
                    self.doc.add_paragraph(item["words"])
                self.doc.add_page_break()  # 保持分页

        # 3. 保存Word文件
        output_path = pdf_path.replace(".pdf", "_OCR.docx")
        self.doc.save(output_path)
        print(f"转换完成！文件已保存至：{output_path}")

        # 4. 清理临时文件（可选）
        # import shutil
        # shutil.rmtree(self.temp_img_folder)


def main():
    root = Tk()
    root.withdraw()
    pdf_path = filedialog.askopenfilename(
        title="选择PDF文件",
        filetypes=[("PDF Files", "*.pdf")]
    )

    if not pdf_path:
        print("未选择文件")
        return

    converter = PDFToWordConverter()
    converter.process_pdf(pdf_path)


if __name__ == "__main__":
    main()

效果展示：

pdf图片版文件转word文件

注意事项：

1，）上述代码需要对应安装各类python库。

2，）代码运行后会在当前目录下生成一个图片目录，用于存放提取的pdf图片，代码运行完后不需要可以自行删除。

3，）百度云的OCR有使用限制，个人用户使用标准文字识别接口有2000次免费，超过后需要付费使用。

百度云OCR相关链接：

1，OCR控制台界面：百度智能云控制台

2，OCR接口文档界面：服务与支持

十四，python 制作个税计算小工具

效果展示：

代码实现：

import tkinter as tk
from tkinter import ttk, messagebox
import matplotlib.pyplot as plt
from matplotlib.backends.backend_tkagg import FigureCanvasTkAgg

# 税率表（2023年最新）
TAX_RATES = [
    {"min": 0, "max": 36000, "rate": 0.03, "deduction": 0},
    {"min": 36000, "max": 144000, "rate": 0.1, "deduction": 2520},
    {"min": 144000, "max": 300000, "rate": 0.2, "deduction": 16920},
    {"min": 300000, "max": 420000, "rate": 0.25, "deduction": 31920},
    {"min": 420000, "max": 660000, "rate": 0.3, "deduction": 52920},
    {"min": 660000, "max": 960000, "rate": 0.35, "deduction": 85920},
    {"min": 960000, "max": float('inf'), "rate": 0.45, "deduction": 181920}
]

# 专项附加扣除标准
SPECIAL_DEDUCTIONS = {
    "子女教育": 1000,
    "继续教育": 400,
    "大病医疗": 0,  # 实际金额据实扣除
    "住房贷款利息": 1000,
    "住房租金": 800,
    "赡养老人": 1000
}

plt.rcParams['font.sans-serif'] = ['SimHei'] # 设置显示中文字体
plt.rcParams['axes.unicode_minus'] = False  # 设置正常显示符号

class TaxCalculator:
    def __init__(self, root):
        self.root = root
        self.root.title("个人所得税计算器")
        self.root.geometry("900x700+400+50")
        self.root.resizable(True, True)
        self.root.configure(bg="#f0f8ff")

        # 设置应用图标
        try:
            self.root.iconbitmap("tax_icon.ico")  # 如果有图标文件的话
        except:
            pass

        # 创建样式
        self.style = ttk.Style()
        self.style.configure("TFrame", background="#f0f8ff")
        self.style.configure("TLabel", background="#f0f8ff", font=("微软雅黑", 10))
        self.style.configure("TButton", font=("微软雅黑", 10))
        self.style.configure("Header.TLabel", font=("微软雅黑", 16, "bold"), foreground="#2c3e50")
        self.style.configure("Result.TLabel", font=("微软雅黑", 12, "bold"), foreground="#e74c3c")

        # 创建主框架
        self.main_frame = ttk.Frame(root)
        self.main_frame.pack(fill=tk.BOTH, expand=True, padx=20, pady=20)

        # 创建标题
        self.header = ttk.Label(self.main_frame, text="个人所得税计算器", style="Header.TLabel")
        self.header.pack(pady=20)

        # 创建输入框架
        self.input_frame = ttk.LabelFrame(self.main_frame, text="收入信息")
        self.input_frame.pack(fill=tk.X, padx=10, pady=10)

        # 创建输入字段
        ttk.Label(self.input_frame, text="月收入 (元):").grid(row=0, column=0, padx=10, pady=10, sticky=tk.W)
        self.monthly_income = tk.DoubleVar(value=10000)
        ttk.Entry(self.input_frame, textvariable=self.monthly_income, width=15).grid(row=0, column=1, padx=10, pady=10)

        ttk.Label(self.input_frame, text="社保公积金 (元):").grid(row=0, column=2, padx=10, pady=10, sticky=tk.W)
        self.social_security = tk.DoubleVar(value=1500)
        ttk.Entry(self.input_frame, textvariable=self.social_security, width=15).grid(row=0, column=3, padx=10, pady=10)

        ttk.Label(self.input_frame, text="专项附加扣除 (元):").grid(row=1, column=0, padx=10, pady=10, sticky=tk.W)
        self.special_deduction = tk.DoubleVar(value=0)
        ttk.Entry(self.input_frame, textvariable=self.special_deduction, width=15).grid(row=1, column=1, padx=10,
                                                                                        pady=10)

        ttk.Label(self.input_frame, text="其他扣除 (元):").grid(row=1, column=2, padx=10, pady=10, sticky=tk.W)
        self.other_deduction = tk.DoubleVar(value=0)
        ttk.Entry(self.input_frame, textvariable=self.other_deduction, width=15).grid(row=1, column=3, padx=10, pady=10)

        # 专项附加扣除选项
        self.deductions_frame = ttk.LabelFrame(self.main_frame, text="专项附加扣除选项")
        self.deductions_frame.pack(fill=tk.X, padx=10, pady=10)

        self.deduction_vars = {}
        row_idx = 0
        col_idx = 0
        for idx, (deduct_name, amount) in enumerate(SPECIAL_DEDUCTIONS.items()):
            var = tk.BooleanVar(value=False)
            self.deduction_vars[deduct_name] = var
            cb = ttk.Checkbutton(self.deductions_frame, text=f"{deduct_name} ({amount}元)",
                                 variable=var, command=self.update_special_deduction)
            cb.grid(row=row_idx, column=col_idx, padx=5, pady=5, sticky=tk.W)

            col_idx += 1
            if col_idx > 2:
                col_idx = 0
                row_idx += 1

        # 创建按钮
        self.button_frame = ttk.Frame(self.main_frame)
        self.button_frame.pack(pady=20)

        ttk.Button(self.button_frame, text="计算个税", command=self.calculate_tax, width=15).pack(side=tk.LEFT, padx=10)
        ttk.Button(self.button_frame, text="重置", command=self.reset_fields, width=15).pack(side=tk.LEFT, padx=10)
        ttk.Button(self.button_frame, text="退出", command=root.quit, width=15).pack(side=tk.LEFT, padx=10)

        # 创建结果显示区域
        self.result_frame = ttk.LabelFrame(self.main_frame, text="计算结果")
        self.result_frame.pack(fill=tk.BOTH, expand=True, padx=10, pady=10)

        # 创建结果标签
        ttk.Label(self.result_frame, text="应纳税所得额:").grid(row=0, column=0, padx=10, pady=5, sticky=tk.W)
        self.taxable_income_label = ttk.Label(self.result_frame, text="0.00 元", style="Result.TLabel")
        self.taxable_income_label.grid(row=0, column=1, padx=10, pady=5, sticky=tk.W)

        ttk.Label(self.result_frame, text="适用税率:").grid(row=1, column=0, padx=10, pady=5, sticky=tk.W)
        self.tax_rate_label = ttk.Label(self.result_frame, text="0%", style="Result.TLabel")
        self.tax_rate_label.grid(row=1, column=1, padx=10, pady=5, sticky=tk.W)

        ttk.Label(self.result_frame, text="速算扣除数:").grid(row=2, column=0, padx=10, pady=5, sticky=tk.W)
        self.quick_deduction_label = ttk.Label(self.result_frame, text="0.00 元", style="Result.TLabel")
        self.quick_deduction_label.grid(row=2, column=1, padx=10, pady=5, sticky=tk.W)

        ttk.Label(self.result_frame, text="应缴个人所得税:").grid(row=3, column=0, padx=10, pady=5, sticky=tk.W)
        self.tax_amount_label = ttk.Label(self.result_frame, text="0.00 元", style="Result.TLabel")
        self.tax_amount_label.grid(row=3, column=1, padx=10, pady=5, sticky=tk.W)

        ttk.Label(self.result_frame, text="税后收入:").grid(row=4, column=0, padx=10, pady=5, sticky=tk.W)
        self.net_income_label = ttk.Label(self.result_frame, text="0.00 元", style="Result.TLabel")
        self.net_income_label.grid(row=4, column=1, padx=10, pady=5, sticky=tk.W)

        # 创建图表区域
        self.chart_frame = ttk.Frame(self.result_frame)
        self.chart_frame.grid(row=0, column=2, rowspan=5, padx=20, pady=10, sticky=tk.NSEW)

        # 初始图表
        self.fig, self.ax = plt.subplots(figsize=(4, 3), dpi=80)
        self.canvas = FigureCanvasTkAgg(self.fig, master=self.chart_frame)
        self.canvas.get_tk_widget().pack(fill=tk.BOTH, expand=True)
        self.update_chart([100], ["收入分布"])

        # 添加状态栏
        self.status_bar = ttk.Label(root, text="就绪", relief=tk.SUNKEN, anchor=tk.W)
        self.status_bar.pack(side=tk.BOTTOM, fill=tk.X)

        # 绑定事件
        self.root.bind("<Return>", lambda event: self.calculate_tax())

    def update_special_deduction(self):
        """更新专项附加扣除总额"""
        total = 0
        for deduct_name, var in self.deduction_vars.items():
            if var.get():
                total += SPECIAL_DEDUCTIONS[deduct_name]
        self.special_deduction.set(total)

    def calculate_taxable_income(self):
        """计算应纳税所得额"""
        try:
            # 获取输入值
            monthly_income = self.monthly_income.get()
            social_security = self.social_security.get()
            special_deduction = self.special_deduction.get()
            other_deduction = self.other_deduction.get()

            # 计算年收入
            annual_income = monthly_income * 12

            # 计算应纳税所得额
            taxable_income = annual_income - 60000  # 基本减除费用（5000*12）
            taxable_income -= social_security * 12  # 社保公积金
            taxable_income -= special_deduction * 12  # 专项附加扣除
            taxable_income -= other_deduction * 12  # 其他扣除

            return max(0, taxable_income)
        except:
            messagebox.showerror("输入错误", "请输入有效的数值")
            return 0

    def find_tax_rate(self, taxable_income):
        """根据应纳税所得额查找适用税率"""
        for level in TAX_RATES:
            if taxable_income > level["min"] and taxable_income <= level["max"]:
                return level["rate"], level["deduction"]
        return 0.45, 181920  # 默认最高税率

    def calculate_tax(self):
        """计算个人所得税"""
        taxable_income = self.calculate_taxable_income()

        if taxable_income <= 0:
            tax_rate = 0
            quick_deduction = 0
            tax_amount = 0
        else:
            tax_rate, quick_deduction = self.find_tax_rate(taxable_income)
            tax_amount = taxable_income * tax_rate - quick_deduction
            tax_amount = max(0, tax_amount)  # 确保税额不为负

        # 更新结果标签
        self.taxable_income_label.config(text=f"{taxable_income:,.2f} 元")
        self.tax_rate_label.config(text=f"{tax_rate * 100:.1f}%")
        self.quick_deduction_label.config(text=f"{quick_deduction:,.2f} 元")
        self.tax_amount_label.config(text=f"{tax_amount:,.2f} 元")

        # 计算税后收入
        net_income = (self.monthly_income.get() - self.social_security.get()
                      - (tax_amount / 12) - self.other_deduction.get())
        self.net_income_label.config(text=f"{net_income:,.2f} 元")

        # 更新图表
        tax_per_month = tax_amount / 12
        labels = ['税前收入', '社保公积金', '个人所得税', '税后收入']
        sizes = [
            self.monthly_income.get(),
            self.social_security.get(),
            tax_per_month,
            net_income
        ]
        self.update_chart(sizes, labels)

        # 更新状态栏
        self.status_bar.config(
            text=f"计算完成: 月收入 {self.monthly_income.get():,.2f} 元, 个税 {tax_per_month:,.2f} 元")

    def update_chart(self, sizes, labels):
        """更新饼图"""
        self.ax.clear()

        # 过滤掉值为0的部分
        filtered_sizes = []
        filtered_labels = []
        for size, label in zip(sizes, labels):
            if size > 0:
                filtered_sizes.append(size)
                filtered_labels.append(label)

        if filtered_sizes:
            colors = ['#4CAF50', '#2196F3', '#F44336', '#FFC107']
            self.ax.pie(filtered_sizes, labels=filtered_labels, autopct='%1.1f%%',
                        colors=colors[:len(filtered_sizes)], startangle=90)
            self.ax.axis('equal')  # 保证饼图是圆形
            self.ax.set_title('收入分配比例')
        else:
            self.ax.text(0.5, 0.5, '无数据', ha='center', va='center', fontsize=12)

        self.canvas.draw()

    def reset_fields(self):
        """重置所有输入字段"""
        self.monthly_income.set(10000)
        self.social_security.set(1500)
        self.special_deduction.set(0)
        self.other_deduction.set(0)

        # 重置复选框
        for var in self.deduction_vars.values():
            var.set(False)

        # 重置结果
        self.taxable_income_label.config(text="0.00 元")
        self.tax_rate_label.config(text="0%")
        self.quick_deduction_label.config(text="0.00 元")
        self.tax_amount_label.config(text="0.00 元")
        self.net_income_label.config(text="0.00 元")

        # 重置图表
        self.update_chart([100], ["收入分布"])
        self.status_bar.config(text="已重置所有字段")


if __name__ == "__main__":
    root = tk.Tk()
    app = TaxCalculator(root)
    root.mainloop()