Recently, I used the labelme tool to label a batch of data sets in json format, but I want to use yolov5 to try the detection effect. Trouble is coming! I need to convert the data set into txt format. I want to find for nothing on the Internet for a long time, but I can't find what I want. In the end, I have to tailor it for myself!
1. My folder directory
image folder: store original pictures
json folder: store the corresponding json file
txt_label folder: store converted txt files
2. JSON format data set
The json format is as follows:
3. The converted txt format
txt format is as follows:
4. Convert code
import json
import os
import xml.etree.ElementTree as ET
import cv2
# 将x1, y1, x2, y2转换成yolov5所需要的x, y, w, h格式
def xyxy2xywh(size, box):
dw = 1. / size[0]
dh = 1. / size[1]
x = (box[0] + box[2]) / 2 * dw
y = (box[1] + box[3]) / 2 * dh
w = (box[2] - box[0]) * dw
h = (box[3] - box[1]) * dh
return (x, y, w, h) # 返回的都是标准化后的值
def voc2yolo(path):
# 可以打印看看该路径是否正确
print(len(os.listdir(path)))
pic_path = '' # 原始图片路径
txt_out_path = '' # 转换后txt保存路径
# 遍历每一个xml文件
for file in os.listdir(path):
print(file)
if "json" in str(file):
with open(os.path.join(path, file), 'r') as f:
data = json.load(f)
print(data)
points = data['shapes'][0]['points']
pic_name = os.path.join(pic_path, data['imagePath'])
txt_name = data['imagePath'].split(".")[0] + ".txt"
imread = cv2.imread(pic_name)
h = imread.shape[0]
w = imread.shape[1]
print(imread.shape)
xmin = points[0][0]
ymin = points[0][1]
xmax = points[2][0]
ymax = points[2][1]
box = [float(xmin), float(ymin), float(xmax),
float(ymax)]
print(box)
#
# # 将x1, y1, x2, y2转换成yolov5所需要的x, y, w, h格式
bbox = xyxy2xywh((w, h), box)
print(bbox)
# # 写入目标文件中,格式为 id x y w h
with open(os.path.join(txt_out_path, txt_name), 'w') as out_file:
out_file.write(str(0) + " " + " ".join(str(x) for x in bbox) + '\n')
out_file.close()
#exit()
if __name__ == '__main__':
# json格式数据路径
path = ''
voc2yolo(path)