labelme的json标注文件转yolo的txt训练文件，及划分训练集代码（YOLOv8）

一、代码块目录详情

二、json2txt.py

 import json
import os
 
 
def convert_annotation(json_file, txt_file, label_to_id_mapping):
    """Convert one labelme JSON annotation file into a YOLO-format TXT file.

    Every shape becomes one line ``<class_id> <cx> <cy> <w> <h>``. The box is
    the axis-aligned extent of the shape's points, and all four values are
    divided by the image width/height stored in the JSON.

    Args:
        json_file: Path of the JSON file to read. The keys 'imageWidth',
            'imageHeight' and 'shapes' are used.
        txt_file: Path of the TXT file to write (overwritten if present).
        label_to_id_mapping: Dict mapping string labels to integer class IDs.

    Raises:
        ValueError: If the image dimensions are missing or zero, a shape has
            no points, or a string label is not in ``label_to_id_mapping``.
    """
    with open(json_file, 'r', encoding='utf-8') as f:
        data = json.load(f)

    image_width = data.get('imageWidth')
    image_height = data.get('imageHeight')

    # Zero is rejected together with None; it would otherwise surface later
    # as a ZeroDivisionError instead of a ValueError naming the file.
    if not image_width or not image_height:
        raise ValueError(f"Missing or zero image dimensions in {json_file}")

    # Build every line before touching the output file, so that a bad shape
    # cannot leave a half-written label file behind.
    lines = []
    for shape in data.get('shapes', []):
        points = shape.get('points', [])
        if not points:
            raise ValueError(f"Missing points in a shape in {json_file}")

        x_values = [point[0] for point in points]
        y_values = [point[1] for point in points]
        x_min, x_max = min(x_values), max(x_values)
        y_min, y_max = min(y_values), max(y_values)

        # Box center and size, as ratios of the image dimensions
        bbox_center_x_ratio = (x_min + x_max) / 2 / image_width
        bbox_center_y_ratio = (y_min + y_max) / 2 / image_height
        bbox_width_ratio = (x_max - x_min) / image_width
        bbox_height_ratio = (y_max - y_min) / image_height

        category_id = shape.get('label', "unknown")
        if isinstance(category_id, str):
            # An unmapped label used to be written as class -1, which is not
            # a valid class index; fail loudly instead.
            if category_id not in label_to_id_mapping:
                raise ValueError(f"Unknown label {category_id!r} in {json_file}")
            category_id = label_to_id_mapping[category_id]

        lines.append(
            f"{int(category_id)} {bbox_center_x_ratio} {bbox_center_y_ratio} {bbox_width_ratio} {bbox_height_ratio}\n")

    with open(txt_file, 'w', encoding='utf-8') as out_file:
        out_file.writelines(lines)
 
        # Input and output folder paths
 
 
# Input and output folder paths
input_folder = 'D:/sss/datasets/VOCdevkit/jsons'
output_folder = 'D:/sss/datasets/VOCdevkit/txt'
os.makedirs(output_folder, exist_ok=True)

# Class names of the annotated objects, mapped to their YOLO class IDs.
# NOTE(review): 'Red Light' is listed twice. A dict literal keeps only the
# last value for a repeated key, so 'Red Light' maps to 1 and no label maps
# to class 0. One of the two entries presumably should carry a different
# class name -- confirm against the labels used in the JSON files.
label_to_id_mapping = {
    'Red Light': 0,
    'Red Light': 1,
    'Yellow Light': 2
    # Add more mappings as needed
}

# Convert every JSON file in the input folder; a failure on one file is
# reported and does not stop the remaining files.
for filename in os.listdir(input_folder):
    if filename.endswith('.json'):
        json_file = os.path.join(input_folder, filename)
        # splitext swaps only the trailing extension; str.replace would also
        # rewrite a '.json' that occurs earlier in the file name.
        txt_file = os.path.join(output_folder, os.path.splitext(filename)[0] + '.txt')
        try:
            convert_annotation(json_file, txt_file, label_to_id_mapping)
            print(f'{txt_file},Conversion successful!')
        except Exception as e:
            print(f"An error occurred while processing {json_file}: {e}")

三、split_data.py

 import os, shutil
from sklearn.model_selection import train_test_split
 
# Split settings. val_size is applied to what remains after the test split,
# so with 0.1 / 0.1 the validation set is 0.1 * 0.9 = 9% of all label files.
val_size = 0.1
test_size = 0.1
postfix = 'jpg'
imgpath = 'VOCdevkit/images'
txtpath = 'VOCdevkit/txt'

# Create images/<split> and labels/<split> for every split
for split_name in ('train', 'val', 'test'):
    os.makedirs('images/{}'.format(split_name), exist_ok=True)
    os.makedirs('labels/{}'.format(split_name), exist_ok=True)

# Keep only real '.txt' label files: the i[:-4] slice below assumes that
# suffix, and a plain substring test would also accept names that merely
# contain 'txt'. os.listdir returns names in arbitrary order, so sort them to
# make the random_state=0 split reproducible.
listdir = sorted(i for i in os.listdir(txtpath) if i.endswith('.txt'))
train, test = train_test_split(listdir, test_size=test_size, shuffle=True, random_state=0)
train, val = train_test_split(train, test_size=val_size, shuffle=True, random_state=0)
print(f'train set size:{len(train)} val set size:{len(val)} test set size:{len(test)}')

# Copy each label file and the image with the same stem into its split folder
for split_name, split_files in (('train', train), ('val', val), ('test', test)):
    for i in split_files:
        shutil.copy('{}/{}.{}'.format(imgpath, i[:-4], postfix),
                    'images/{}/{}.{}'.format(split_name, i[:-4], postfix))
        shutil.copy('{}/{}'.format(txtpath, i), 'labels/{}/{}'.format(split_name, i))

四、data.yaml

 # Paths of the split dataset
train: D:\sss\datasets\images\train
val: D:\sss\datasets\images\val
test: D:\sss\datasets\images\test

# Number of annotated classes
nc: 3

# Class names
# NOTE(review): 'Red Light' is listed twice, so two class indices share one
# name -- confirm the intended name of the duplicated entry.
names: ['Red Light', 'Red Light', 'Yellow Light']

兄台，本章对你有用的话，记得一键三连哦！

更多资源，请移步至本人的github首页：lcx9451 (lcx9451) (github.com)

labelme的json标注文件转yolo的txt训练文件，及划分训练集代码（YOLOv8）

一、代码块目录详情

二、json2txt.py

三、split_data.py

四、data.yaml

Postman导出JSON文件轻松转换为HTML或Markdown

python requests编写 api接收json

前端-javaScript:jquery补充

java中Object和json相互转换的方式

Flutter Dart Macro 宏简化 JSON 序列化

中国地区 code.json文件

JSONObject 使用对比 hutool、alibaba

PG数据库的Jsonb全文检索查询

【开发工具】IntelliJ IDEA插件推荐：Json Helper——让JSON处理更高效

JSON 的常见格式总结

前端哥

运行npm error code ENOENTnpm error syscall opennpm error path C:\Users\ultra\Desktop\Vue-Project\pac

前端提高篇（102）：jQuery高级方法callbacks、deferred

解决npm install 报错 “npm err code 1“

【常见错误】npm ERR! code CERT_HAS_EXPIRED & errno CERT_HAS_EXPIRED

vue前端页面弹出红色报错遮罩层 Uncaught runtime errors:at handleError (webpack-internal:///./node_modules/webpack

npm ERR! code CERT_HAS_EXPIRED npm ERR! errno CERT_HAS_EXPIRED npm ERR! request to https://registry.

JQuery中的load()、$

《WEB前端框架开发技术》HTML5响应式旅游景区网站——榆林子州HTML CSS JavaScript (1)

基于Java SpringBoot Vue HTML5药店管理系统(源码 LW 调试文档讲解等)/药店管理软件/药店进销存系统/药店库存管理系统/药店销售系统/药品管理系统/药店收银系统

基于Java SpringBoot Vue HTML5宠物健康顾问系统(源码 LW 调试文档讲解等)/宠物健康/顾问系统/宠物护理/宠物医疗/宠物保健/宠物咨询/宠物医生/宠物健康管理/宠物健康服务

1
【Echarts系列】—— 实现电池图、3D立体圆形柱状图

2024-03-03 11:03:011001

2
CSS常用属性（文本属性）

2024-11-04 09:11:111000

3
TypeScript 中的 Number 类型，Number 类型的特性、常见操作和注意事项

2024-09-30 23:09:061000

4
CSS写代码使页面划分为左右两个区域

2024-09-09 00:09:071000

5
vue使用datav echarts

2024-09-06 00:09:381000

6
使用TweenMax.js和CSS3创建冰球运动员动画效果教程

2024-09-04 23:09:411000

7
使用CDN提高jQuery加载速度

2024-08-24 23:08:211000

8
小兔鲜儿网页首页制作黑马程序员前端基础项目自学笔记

2024-08-19 22:08:161000

9
《Vue》你的弹窗能拖动吗？Vue自定义指令实现可拖动弹窗

2024-08-19 22:08:121000

10
npm的使用

2024-08-18 00:08:131000

	import json
	import os


	def convert_annotation(json_file, txt_file, label_to_id_mapping):
	    """Convert one labelme JSON annotation file into a YOLO-format TXT file.

	    Every shape becomes one line ``<class_id> <cx> <cy> <w> <h>``. The box is
	    the axis-aligned extent of the shape's points, and all four values are
	    divided by the image width/height stored in the JSON.

	    Args:
	        json_file: Path of the JSON file to read. The keys 'imageWidth',
	            'imageHeight' and 'shapes' are used.
	        txt_file: Path of the TXT file to write (overwritten if present).
	        label_to_id_mapping: Dict mapping string labels to integer class IDs.

	    Raises:
	        ValueError: If the image dimensions are missing or zero, a shape has
	            no points, or a string label is not in ``label_to_id_mapping``.
	    """
	    with open(json_file, 'r', encoding='utf-8') as f:
	        data = json.load(f)

	    image_width = data.get('imageWidth')
	    image_height = data.get('imageHeight')

	    # Zero is rejected together with None; it would otherwise surface later
	    # as a ZeroDivisionError instead of a ValueError naming the file.
	    if not image_width or not image_height:
	        raise ValueError(f"Missing or zero image dimensions in {json_file}")

	    # Build every line before touching the output file, so that a bad shape
	    # cannot leave a half-written label file behind.
	    lines = []
	    for shape in data.get('shapes', []):
	        points = shape.get('points', [])
	        if not points:
	            raise ValueError(f"Missing points in a shape in {json_file}")

	        x_values = [point[0] for point in points]
	        y_values = [point[1] for point in points]
	        x_min, x_max = min(x_values), max(x_values)
	        y_min, y_max = min(y_values), max(y_values)

	        # Box center and size, as ratios of the image dimensions
	        bbox_center_x_ratio = (x_min + x_max) / 2 / image_width
	        bbox_center_y_ratio = (y_min + y_max) / 2 / image_height
	        bbox_width_ratio = (x_max - x_min) / image_width
	        bbox_height_ratio = (y_max - y_min) / image_height

	        category_id = shape.get('label', "unknown")
	        if isinstance(category_id, str):
	            # An unmapped label used to be written as class -1, which is not
	            # a valid class index; fail loudly instead.
	            if category_id not in label_to_id_mapping:
	                raise ValueError(f"Unknown label {category_id!r} in {json_file}")
	            category_id = label_to_id_mapping[category_id]

	        lines.append(
	            f"{int(category_id)} {bbox_center_x_ratio} {bbox_center_y_ratio} {bbox_width_ratio} {bbox_height_ratio}\n")

	    with open(txt_file, 'w', encoding='utf-8') as out_file:
	        out_file.writelines(lines)

	# Input and output folder paths


	# Input and output folder paths
	input_folder = 'D:/sss/datasets/VOCdevkit/jsons'
	output_folder = 'D:/sss/datasets/VOCdevkit/txt'
	os.makedirs(output_folder, exist_ok=True)

	# Class names of the annotated objects, mapped to their YOLO class IDs.
	# NOTE(review): 'Red Light' is listed twice. A dict literal keeps only the
	# last value for a repeated key, so 'Red Light' maps to 1 and no label maps
	# to class 0. One of the two entries presumably should carry a different
	# class name -- confirm against the labels used in the JSON files.
	label_to_id_mapping = {
	    'Red Light': 0,
	    'Red Light': 1,
	    'Yellow Light': 2
	    # Add more mappings as needed
	}

	# Convert every JSON file in the input folder; a failure on one file is
	# reported and does not stop the remaining files.
	for filename in os.listdir(input_folder):
	    if filename.endswith('.json'):
	        json_file = os.path.join(input_folder, filename)
	        # splitext swaps only the trailing extension; str.replace would also
	        # rewrite a '.json' that occurs earlier in the file name.
	        txt_file = os.path.join(output_folder, os.path.splitext(filename)[0] + '.txt')
	        try:
	            convert_annotation(json_file, txt_file, label_to_id_mapping)
	            print(f'{txt_file},Conversion successful!')
	        except Exception as e:
	            print(f"An error occurred while processing {json_file}: {e}")

	import os, shutil
	from sklearn.model_selection import train_test_split

	# Split settings. val_size is applied to what remains after the test split,
	# so with 0.1 / 0.1 the validation set is 0.1 * 0.9 = 9% of all label files.
	val_size = 0.1
	test_size = 0.1
	postfix = 'jpg'
	imgpath = 'VOCdevkit/images'
	txtpath = 'VOCdevkit/txt'

	# Create images/<split> and labels/<split> for every split
	for split_name in ('train', 'val', 'test'):
	    os.makedirs('images/{}'.format(split_name), exist_ok=True)
	    os.makedirs('labels/{}'.format(split_name), exist_ok=True)

	# Keep only real '.txt' label files: the i[:-4] slice below assumes that
	# suffix, and a plain substring test would also accept names that merely
	# contain 'txt'. os.listdir returns names in arbitrary order, so sort them to
	# make the random_state=0 split reproducible.
	listdir = sorted(i for i in os.listdir(txtpath) if i.endswith('.txt'))
	train, test = train_test_split(listdir, test_size=test_size, shuffle=True, random_state=0)
	train, val = train_test_split(train, test_size=val_size, shuffle=True, random_state=0)
	print(f'train set size:{len(train)} val set size:{len(val)} test set size:{len(test)}')

	# Copy each label file and the image with the same stem into its split folder
	for split_name, split_files in (('train', train), ('val', val), ('test', test)):
	    for i in split_files:
	        shutil.copy('{}/{}.{}'.format(imgpath, i[:-4], postfix),
	                    'images/{}/{}.{}'.format(split_name, i[:-4], postfix))
	        shutil.copy('{}/{}'.format(txtpath, i), 'labels/{}/{}'.format(split_name, i))

	# Paths of the split dataset
	train: D:\sss\datasets\images\train
	val: D:\sss\datasets\images\val
	test: D:\sss\datasets\images\test

	# Number of annotated classes
	nc: 3

	# Class names
	# NOTE(review): 'Red Light' is listed twice, so two class indices share one
	# name -- confirm the intended name of the duplicated entry.
	names: ['Red Light', 'Red Light', 'Yellow Light']

labelme的json标注文件转yolo的txt训练文件，及划分训练集代码（YOLOv8）

一、代码块目录详情

二、json2txt.py

三、split_data.py

四、data.yaml

微信扫一扫：分享