Python 标注工具。人工智能,标注工具,YOLOv8框架

管理员 2025-06-17 10:17

这是针对YOLOv8框架,训练数据的标注,人工智能,标注工具

import os
import re
import cv2
import glob
import numpy as np
from PIL import Image, ImageDraw, ImageFont


# 004这个代码 拉框有点卡，显示中文  能正常标注。
# 005 修改004的问题。  这个代码运行不显示图片。需要标注一下。才会显示。
# 006 显示图片了。  但是标注第2个图片，第1个图片的标注还存在。

class SmoothYOLOAnnotator:
    """Interactive OpenCV window for drawing YOLO-format bounding boxes.

    Images (``*.jpg`` and ``*.png``) are read from one folder and shown one at
    a time. Boxes are drawn by dragging with the left mouse button; after each
    drag a second window asks for the class, chosen with a digit key that is a
    key of ``self.classes``.

    Keys in the main window:
        n  save the current image's labels and go to the next image
        p  save the current image's labels and go to the previous image
        d  delete the most recently added box
        q  quit (the current image's unsaved boxes are not written)

    Labels are written next to each image as ``<image stem>.txt``, one line
    per box: ``class_index x_center y_center width height`` with the four
    geometry values divided by the image width/height.
    """

    def __init__(self, image_folder):
        """Collect the images in *image_folder* and set up the editor state.

        Args:
            image_folder: Directory searched (non-recursively) for ``*.jpg``
                and ``*.png`` files.
        """
        self.image_folder = image_folder

        # glob.glob expands the wildcard patterns into lists of paths and
        # sorted() returns a new list. Files are ordered by the first run of
        # digits in their name so that "10.jpg" follows "9.jpg".
        self.images = sorted(
            glob.glob(os.path.join(image_folder, "*.jpg"))
            + glob.glob(os.path.join(image_folder, "*.png")),
            key=self._sort_key,
        )
        print(self.images)

        # Index of the image to start with: 0 is the first image, 1 the second.
        self.current_index = 0
        # Image currently being annotated; None until one loads successfully.
        self.current_img = None
        # Boxes of the current image as (class_id, x1, y1, x2, y2) in pixels.
        self.annotations = []
        # [x_start, y_start, x_now, y_now] while a drag is in progress.
        self.temp_box = None
        # Class id (the digit key pressed) -> label drawn on the image.
        self.classes = {1: "小明", 2: "小红", 3: "小刚"}
        # current_img with every saved box and label already drawn on it.
        self.cache_img = None
        # True once the user deleted a box, so an emptied list is still saved.
        self._dirty = False
        # True while the class-selection window is waiting for a key.
        self._selecting = False
        self.font = self.load_font()
        self.window_name = "YOLO标注工具"
        self.crosshair_color = (0, 0, 255)  # red in OpenCV's BGR order
        self.crosshair_thickness = 1

    @staticmethod
    def _sort_key(path):
        """Return a sort key that orders files by the first number in their name.

        Names without any digit sort after all numbered names instead of
        raising, which is what the previous inline lambda did.
        """
        match = re.search(r'\d+', os.path.basename(path))
        if match is None:
            return (1, 0)
        return (0, int(match.group()))

    def _label_path(self):
        """Return the path of the label file that belongs to the current image."""
        return os.path.splitext(self.images[self.current_index])[0] + ".txt"

    def load_font(self):
        """Return the SimHei font at size 20, or Pillow's default font.

        The fallback is used when the font file cannot be opened or FreeType
        support is missing. NOTE(review): the default font may lack CJK
        glyphs, so class names can render garbled in that case.
        """
        try:
            return ImageFont.truetype("simhei.ttf", 20)
        except (OSError, ImportError):
            return ImageFont.load_default()

    def init_display(self):
        """Load the image at ``current_index`` and show it with its saved labels.

        All per-image state is reset first. If the index is out of range or
        the image cannot be decoded, ``current_img`` stays ``None`` so that no
        other method works on (or saves labels for) the previous image.
        """
        self.annotations = []
        self.temp_box = None
        self.cache_img = None
        self.current_img = None
        self._dirty = False

        if not 0 <= self.current_index < len(self.images):
            return

        path = self.images[self.current_index]
        img = cv2.imread(path)
        if img is None:
            print(f"无法加载图片: {path}")
            return
        self.current_img = img

        # Bring back boxes saved earlier; otherwise revisiting an image and
        # adding one box would overwrite its label file with that box only.
        self.annotations = self._load_annotations()

        self.update_cache()
        cv2.imshow(self.window_name, self.cache_img)
        cv2.waitKey(1)  # let the GUI process the redraw immediately

    def _load_annotations(self):
        """Read the current image's label file back into pixel-space boxes.

        Returns:
            A list of ``(class_id, x1, y1, x2, y2)`` tuples. Lines that do not
            have exactly five numeric fields are skipped; a missing or
            unreadable file yields an empty list.
        """
        txt_path = self._label_path()
        if not os.path.isfile(txt_path):
            return []

        height, width = self.current_img.shape[:2]
        boxes = []
        try:
            with open(txt_path, encoding="utf-8") as f:
                for line in f:
                    parts = line.split()
                    if len(parts) != 5:
                        continue
                    try:
                        class_index = int(parts[0])
                        xc, yc, bw, bh = (float(p) for p in parts[1:])
                        x1 = round((xc - bw / 2) * width)
                        y1 = round((yc - bh / 2) * height)
                        x2 = round((xc + bw / 2) * width)
                        y2 = round((yc + bh / 2) * height)
                    except (ValueError, OverflowError):
                        # Non-numeric, NaN or infinite field.
                        continue
                    box = self._normalize_box(x1, y1, x2, y2)
                    if box is not None:
                        # Files store class_id - 1 (see save_annotations).
                        boxes.append((class_index + 1, *box))
        except (OSError, UnicodeDecodeError):
            return []
        return boxes

    def _normalize_box(self, x1, y1, x2, y2):
        """Clamp a box to the current image and order its corners.

        Returns:
            ``(left, top, right, bottom)`` in pixels, or ``None`` when the
            clamped box has no width or no height (for example a click
            without a drag).
        """
        height, width = self.current_img.shape[:2]
        xs = sorted(min(max(v, 0), width - 1) for v in (x1, x2))
        ys = sorted(min(max(v, 0), height - 1) for v in (y1, y2))
        if xs[0] == xs[1] or ys[0] == ys[1]:
            return None
        return xs[0], ys[0], xs[1], ys[1]

    def update_cache(self):
        """Rebuild ``cache_img``: a copy of the image with all boxes and labels.

        The original image is never modified. Rectangles are drawn with
        OpenCV; labels are drawn with Pillow because the TrueType font is a
        Pillow font object. The BGR<->RGB conversion is done once per rebuild
        instead of once per box.
        """
        if self.current_img is None:
            self.cache_img = None
            return

        canvas = self.current_img.copy()
        if not self.annotations:
            self.cache_img = canvas
            return

        for (_, x1, y1, x2, y2) in self.annotations:
            cv2.rectangle(canvas, (x1, y1), (x2, y2), (0, 255, 0), 2)

        pil_img = Image.fromarray(cv2.cvtColor(canvas, cv2.COLOR_BGR2RGB))
        draw = ImageDraw.Draw(pil_img)
        for (class_id, x1, y1, _, _) in self.annotations:
            # Unknown ids (e.g. from an existing label file) show as a number.
            label = self.classes.get(class_id, str(class_id))
            # 25 px above the box, but never above the top edge of the image.
            draw.text((x1, max(0, y1 - 25)), label, font=self.font, fill=(0, 255, 0))
        self.cache_img = cv2.cvtColor(np.array(pil_img), cv2.COLOR_RGB2BGR)

    def mouse_callback(self, event, x, y, flags, param):
        """Handle mouse events: crosshair, rubber-band box, and box completion.

        The event is processed first and the frame is composed afterwards, so
        the displayed frame always reflects the state after the event.
        """
        # Ignore events while no image is loaded or while select_class is
        # waiting for a key (waitKey keeps dispatching mouse events).
        if self._selecting or self.current_img is None:
            return
        if self.cache_img is None:
            self.update_cache()

        if event == cv2.EVENT_LBUTTONDOWN:
            self.temp_box = [x, y, x, y]
        elif event == cv2.EVENT_MOUSEMOVE and self.temp_box:
            self.temp_box[2:] = [x, y]
        elif event == cv2.EVENT_LBUTTONUP and self.temp_box:
            start_x, start_y = self.temp_box[:2]
            self.temp_box = None
            box = self._normalize_box(start_x, start_y, x, y)
            if box is not None:
                self.select_class(*box)

        display_img = self.cache_img.copy()
        if self.temp_box:
            cv2.rectangle(display_img,
                          (self.temp_box[0], self.temp_box[1]),
                          (self.temp_box[2], self.temp_box[3]),
                          (255, 0, 0), 1)
        # Full-width / full-height crosshair through the cursor position.
        cv2.line(display_img, (0, y), (display_img.shape[1], y),
                 self.crosshair_color, self.crosshair_thickness)
        cv2.line(display_img, (x, 0), (x, display_img.shape[0]),
                 self.crosshair_color, self.crosshair_thickness)
        self.update_display(display_img)

    def update_display(self, img=None):
        """Show *img* in the main window, or the rebuilt cache when omitted."""
        if img is None:
            self.update_cache()
            img = self.cache_img
        if img is None:
            return
        cv2.imshow(self.window_name, img)

    def _class_from_key(self, key):
        """Map a key code to a class id, or ``None`` if it selects no class.

        Only the ASCII digits 0-9 are considered, and only when that digit is
        a key of ``self.classes``.
        """
        if not ord("0") <= key <= ord("9"):
            return None
        class_id = key - ord("0")
        return class_id if class_id in self.classes else None

    def select_class(self, x1, y1, x2, y2):
        """Ask for the class of a new box and store it if a valid key is pressed.

        A separate window lists ``self.classes``; the method blocks until a
        key is pressed. Any key that is not a listed class id discards the box.
        """
        if self.current_img is None:
            return

        self._selecting = True
        try:
            pil_img = Image.fromarray(cv2.cvtColor(self.current_img, cv2.COLOR_BGR2RGB))
            draw = ImageDraw.Draw(pil_img)
            # (0, 0, 255) is blue here because the Pillow image is RGB.
            draw.text((10, 20), "选择分类:", font=self.font, fill=(0, 0, 255))
            for i, (class_id, name) in enumerate(self.classes.items()):
                draw.text((10, 50 + i * 30), f"{class_id}. {name}", font=self.font, fill=(0, 0, 255))
            cv2.imshow("选择分类", cv2.cvtColor(np.array(pil_img), cv2.COLOR_RGB2BGR))

            key = cv2.waitKey(0) & 0xFF  # 0 = wait without timeout
            cv2.destroyWindow("选择分类")
        finally:
            self._selecting = False

        class_id = self._class_from_key(key)
        if class_id is not None:
            self.annotations.append((class_id, x1, y1, x2, y2))
            self._dirty = True
            self.update_cache()
            cv2.imshow(self.window_name, self.cache_img)

    def run(self):
        """Open the window and process keys until 'q' or the last image is passed."""
        if not self.images:
            # Nothing to annotate; avoid opening a window on an empty list.
            print(f"未找到图片: {self.image_folder}")
            return

        cv2.namedWindow(self.window_name)
        cv2.setMouseCallback(self.window_name, self.mouse_callback)
        self.init_display()

        while self.current_index < len(self.images):
            key = cv2.waitKey(10) & 0xFF  # poll the keyboard every 10 ms
            if key == ord("n"):
                self.save_annotations()
                self.current_index += 1
                if self.current_index < len(self.images):
                    self.init_display()
            elif key == ord("p"):
                self.save_annotations()
                self.current_index = max(0, self.current_index - 1)
                self.init_display()
            elif key == ord("d"):
                if self.annotations:
                    self.annotations.pop()
                    # Remember the deletion so an emptied list is written too.
                    self._dirty = True
                    self.update_cache()
                    cv2.imshow(self.window_name, self.cache_img)
            elif key == ord("q"):
                break
        cv2.destroyAllWindows()

    def save_annotations(self):
        """Write the current image's boxes to its label file.

        Nothing is written when no image is loaded, or when there are no boxes
        and the user has not deleted any (so images that were only browsed get
        no file). Class ids are stored zero-based (``class_id - 1``).
        """
        if self.current_img is None:
            return
        if not self.annotations and not self._dirty:
            return

        height, width = self.current_img.shape[:2]
        txt_path = self._label_path()

        with open(txt_path, "w", encoding="utf-8") as f:
            for (class_id, x1, y1, x2, y2) in self.annotations:
                x_center = ((x1 + x2) / 2) / width
                y_center = ((y1 + y2) / 2) / height
                box_width = abs(x2 - x1) / width
                box_height = abs(y2 - y1) / height
                f.write(f"{class_id - 1} {x_center:.6f} {y_center:.6f} {box_width:.6f} {box_height:.6f}\n")
        self._dirty = False


if __name__ == "__main__":
    import sys

    # Folder with the images to annotate. An optional first command-line
    # argument overrides the built-in default folder.
    image_folder = sys.argv[1] if len(sys.argv) > 1 else "E:/123"
    annotator = SmoothYOLOAnnotator(image_folder)
    annotator.run()

输入文件夹路径。下面的图片名称必须是 1 到 n 后缀名 jpg png 都可以。

        self.classes = {1: "小明", 2: "小红", 3: "小刚"}  这是分类。请自行修改。

        self.current_index = 0 #从第1个开始标注  0就是从1     1就是从第2个标注
        
        假如我们想从第5张图片标注 请输入4
        
        0 表示从第 1 张图片开始标注。

针对标注窗口显示分类名称乱码的问题，安装了下面的库。

pip install opencv-python pillow numpy
显示分类名称乱码的时候，安装了这个库。

联系站长

站长微信:xiaomao0055

站长QQ:14496453

按分类分组

java(172)

python(31)

MySQL(28)

layUI(10)

公众号相关(3)

MybatisPlush(6)

Cocos Creator音爆小游戏_01(2)

Cocos Creator零基础游戏开发视频教程_01(34)

Cocos Creator计算器(4)

CocosCreator 飞机大战(29)

CocosCreator 拼图游戏(16)

CocosCreator棋牌炸金花(22)

CocosCreator 3D出租车-官方(19)

Cocos 3D 懒猫跑酷(13)

MyBatis-Plus教程(1)

vue3UI-ElementPlush 使用文档(21)

CocosCreator3D基础(27)

SpringBoot资料(109)

Linux系统(10)

windows系统(2)

VUE(35)

eclipse-tomcat(15)

我是医生(12)

爬虫相关(2)

小程序(139)

小游戏(4)

小程序-商城-shop-01(6)

手机(1)

docker(3)

JS/CSS/HTML(169)

电脑知识(22)

typescript教程(4)

python-selenium(6)

python-BeautifulSoup(1)

java-selenium(4)

jsoup解析html(1)

IDEA(27)

物联网(8)

excel技巧(6)

抖音小程序(1)

微信小程序，基础教程(1)

excel(2)

视频制作(12)

古诗、古文(3)

电影(1)

秘术(1)

个人分类(93)

其它分类(7)

实验室软件(3)

基金证券(1)

歌曲(1)

按日期分组

2026年01月(16)

2025年12月(14)

2025年11月(11)

2025年10月(24)

2025年09月(10)

2025年08月(30)

2025年07月(19)

2025年06月(18)

2025年05月(19)

2025年04月(18)

2025年03月(7)

2025年02月(8)

2025年01月(11)

2024年12月(12)

2024年11月(12)

2024年10月(10)

2024年09月(2)

2024年08月(5)

2024年06月(1)

2024年05月(4)

2024年04月(8)

2024年03月(15)

2024年02月(11)

2024年01月(12)

2023年12月(18)

2023年11月(10)

2023年10月(8)

2023年09月(5)

2023年07月(12)

2023年05月(13)

2023年04月(24)

2023年03月(14)

2023年02月(5)

2023年01月(8)

2022年12月(11)

2022年11月(17)

2022年10月(39)

2022年09月(12)

2022年08月(6)

2022年07月(1)

2022年06月(5)

2022年05月(10)

2022年04月(10)

2022年03月(15)

2022年02月(8)

2022年01月(11)

2021年12月(9)

2021年11月(59)

2021年10月(46)

2021年09月(37)

2021年08月(68)

2021年07月(15)

2021年06月(5)

2021年05月(8)

2021年04月(10)

2021年03月(12)

2021年02月(20)

2021年01月(4)

2020年12月(8)

2020年11月(8)

2020年10月(16)

2020年09月(12)

2020年08月(11)

2020年07月(20)

2020年06月(23)

2020年05月(8)

2020年04月(14)

2020年03月(15)

2020年02月(18)

2020年01月(6)

2019年12月(12)

2019年11月(18)

2019年10月(18)

2019年09月(30)

2019年08月(19)

2019年07月(21)

2019年06月(20)