[目标检测]labelme标注数据转yoloV8需要的.txt格式

🕗 发布于 2024-07-07 14:34 目标检测 YOLO 人工智能

1、首先需要知道yoloV8目标检测的标签格式：

yolov8标签数据格式说明

After using a tool like Roboflow Annotate to label your images, export your labels to YOLO format, with one *.txt file per image (if no objects in image, no *.txt file is required). The *.txt file specifications are:

    One row per object
    Each row is class x_center y_center width height format.
    Box coordinates must be in normalized xywh format (from 0 - 1). If your boxes are in pixels, divide x_center and width by image width, and y_center and height by image height.
    Class numbers are zero-indexed (start from 0).

主要包括五个数字 id 、x 、y 、w,、h，分别代表标签类别、目标对象在图像中的中心位置（x,y）、目标对象的宽和高。

注意的是中心位置坐标、以及目标对象的宽和高都需要进行归一化到0-1之间。如下：

0 0.060000 0.460000 0.12 0.65
1 0.450000 0.480000 0.38 0.68
0 0.880000 0.470000 0.24 0.63

2、示例有两种标签类型，转化为.txt的代码如下：

import json
import os
import shutil
import random

# Convert label to idx
with open("labels.txt", "r") as f:
    classes = [c.strip() for c in f.readlines()]
    idx_dict = {c: str(i) for i, c in enumerate(classes)}

def convert_labelmes_to_yolo(labelme_folder, output_folder):
    label_folder = os.path.join(output_folder, "labels")         # label_folder = image_folder/labels
    os.makedirs(label_folder, exist_ok=True)
    image_folder = os.path.join(output_folder, "images")         # image_folder = image_folder/images
    os.makedirs(image_folder, exist_ok=True)

    for root, dirs, files in os.walk(labelme_folder):          # root-文件夹所在路径  dir-路经下的文件夹   file-里面的文件
        for file in files:
            file_path = os.path.join(root, file)
            if os.path.splitext(file)[-1] != ".json":      # 分割文件名和扩展名
                shutil.copy(file_path, image_folder)
                print(f"Copied {file_path} to {image_folder}")
            else:
                # 读取json文件
                with open(file_path, 'r') as f:
                    labelme_data = json.load(f)

                image_filename = labelme_data["imagePath"]
                image_width = labelme_data["imageWidth"]
                image_height = labelme_data["imageHeight"]

                txt_filename = os.path.splitext(image_filename)[0] + ".txt"
                txt_path = os.path.join(label_folder, txt_filename)

                with open(txt_path, 'w') as f:
                    for shape in labelme_data["shapes"]:
                        label = shape["label"]
                        points = shape["points"]
                        x_min, y_min = points[0]
                        x_max, y_max = points[1]

                        center_x = round(((x_min + x_max) / 2) / image_width , 2)
                        center_y = round(((y_min + y_max) / 2) / image_height ,2)
                        width = round(abs(x_min - x_max) / image_width, 2)
                        height = round(abs(y_min - y_max) / image_height, 2)

                        class_id = label_dict[label]
                        f.write(f"{class_id}  {center_x:.6f} {center_y:.6f} {width} {height}\n")

                print(f"Converted {file} to {txt_path}")

    print("转换成功")

def split_data(output_folder, dataset_folder):
    random.seed(0)
    split_rate = 0.2 #验证集占比
    origin_label_path = os.path.join(output_folder, "labels")
    origin_image_path = os.path.join(output_folder, "images")
    train_label_path = os.path.join(dataset_folder, "train", "labels")
    os.makedirs(train_label_path, exist_ok=True)
    train_image_path = os.path.join(dataset_folder, "train", "images")
    os.makedirs(train_image_path, exist_ok=True)
    val_label_path = os.path.join(dataset_folder, "val", "labels")
    os.makedirs(val_label_path, exist_ok=True)
    val_image_path = os.path.join(dataset_folder, "val", "images")
    os.makedirs(val_image_path, exist_ok=True)

    images = os.listdir(origin_image_path)
    num = len(images)
    eval_index = random.sample(images,k=int(num*split_rate))
    for single_image in images:
        origin_single_image_path = os.path.join(origin_image_path, single_image)
        single_txt = os.path.splitext(single_image)[0] + ".txt"
        origin_single_txt_path = os.path.join(origin_label_path, single_txt)
        if single_image in eval_index:
            #single_json_path = os.path.join(val_label_path,single_json)
            shutil.copy(origin_single_image_path, val_image_path)
            shutil.copy(origin_single_txt_path, val_label_path)
        else:
            #single_json_path = os.path.join(train_label_path,single_json)
            shutil.copy(origin_single_image_path, train_image_path)
            shutil.copy(origin_single_txt_path, train_label_path)

    print("数据集划分完成")

    with open(os.path.join(dataset_folder,"data.yaml"),"w") as f:
        f.write(f"train: {dataset_folder}\n")
        f.write(f"val: {val_image_path}\n")
        f.write(f"test: {val_image_path}\n\n")
        f.write(f"nc: {len(classes)}\n")
        f.write(f"names: {classes}\n")

if __name__ == '__main__':
    label_dict = {"incp_tank": 0, "cp_tank": 1}
    labelme_folder = "./labelme_folder" #labelme生成的标注文件所在的文件夹
    output_folder = "./test" #存储yolo标注文件的文件夹
    dataset_folder = "./mydata" #存储划分好的数据集的文件夹
    convert_labelmes_to_yolo(labelme_folder, output_folder)#将labelme标注文件转换为yolo格式
    split_data(output_folder, dataset_folder)#划分训练集和验证级

注意：你需要新建一个label.txt文件，把涉及到的标签名字输入进去，会自动得到.yaml文件。当然也可以把这一步省略，后面我们直接copy已有的.yaml把训练、验证的路径加进去即可。

原文地址：https://blog.csdn.net/m0_48919875/article/details/140232032

免责声明：本站文章内容转载自网络资源，如本站内容侵犯了原著者的合法权益，可联系本站删除。更多内容请关注自学内容网（zxcms.com）！

上一篇：Vue项目使用mockjs模拟后端接口
下一篇：improved-diffusion-main代码理解

CSS——唯美窗口
通过上述步骤，我们成功创建了一个唯美的弹窗窗口。这个弹窗不仅在视觉上给人以美的享受，而且在用户体验上也做到了简洁而高效。希望这个教程能帮助你在自己的项目中实现更加优雅和美观的弹窗设计。记住，好的设计不
阅读更多2024-11-06
前端入门一之CSS知识详解
CSS中的继承: 子标签会继承父标签的某些样式，如文本颜色和字号。恰当地使用继承可以简化代码，降低 CSS 样式的复杂性。相同选择器给设置相同的样式，此时一个样式就会覆盖（层叠）另一个冲突的样式。盒子
阅读更多2024-11-06
Midjourney国内直登
Midjourney确实是一个强大的AI绘画工具，能够根据用户输入的文本生成高质量的图像。然而，由于国内的网络限制，直接访问Midjourney可能会遇到障碍。目前，已经有一些国内代理或中转平台可以帮
阅读更多2024-11-06
Go 语言的错误处理
Go 语言允许你创建自定义错误类型，以便在错误发生时提供更多的信息。自定义错误类型通常是实现了Error()方法的结构体。= nil {在这个例子中，我们创建了一个FileError结构体来封装文件错
阅读更多2024-11-06
使用Spring Validation实现数据校验详解
在现代Web应用开发中，数据校验是不可忽视的重要环节。Spring提供了强大的数据校验框架——Spring Validation，可以有效提升数据输入的安全性与应用的稳定性。本文将介绍如何使用Spri
阅读更多2024-11-06
phpstudy 使用php8.2.9版本报错问题
在切换php版本到更高版本时在终端查看php版本时报如下界面错误。
阅读更多2024-11-06
微信小程序高校教材征订系统
系统分为三个角色，分别是教材科、系教学秘书、教研室主任。系统主要完成功能是教材科要发布教材征订信息，系部教学秘书根据教学计划通知各个教研室主任指定教材征订计划，系部教学秘书汇总教材征订计划表并上报教材
阅读更多2024-11-06
自制inscode项目推荐:色块小游戏
颜色匹配小游戏是一款基于HTML、CSS和JavaScript开发的简单而有趣的网页游戏。游戏的目标是通过点击颜色块，将整个游戏板上的所有方块变成同一种颜色。玩家需要在有限的步数内完成任务，否则游戏将
阅读更多2024-11-06
微服务day03
由于已有相关项目则要关闭DockerComponent中的已开启的项目创建网络用来连接项目容器创建并运行Mysql容器。
阅读更多2024-11-06
Linux中sysctl、systemctl、systemd、init的区别
用于管理系统和服务。两者在Linux系统中扮演着不同的角色，服务于不同的管理需求。是现代Linux系统中的主流系统和服务管理器，它提供了比传统的。的命令行工具，使得管理系统和服务变得更加方便和高效。更
阅读更多2024-11-06

[目标检测]labelme标注数据转yoloV8需要的.txt格式

相关文章