-------Start

在开始以下操作之前，需要先安装Anaconda，并在Anaconda中配置好PyTorch深度学习环境。完成以上配置之后，再进行接下来的操作。

---------官方YOLOV5代码

---------地铁异物检测数据集

1. 下载代码，数据集，预训练权重

1.1 代码下载

在这里插入图片描述

文件解压

在这里插入图片描述

1.2 数据集下载

在这里插入图片描述

下载以下2个文件，并解压。

xml为数据的标签文件，共8929个文件，至于xml文件中的内容大家可以百度学习下，这里不做讲解。

在这里插入图片描述

jpg文件为检测的X光图像，共8929张图像，一张图像对应一个xml文件。

在这里插入图片描述

1.3 预训练权重下载

在这里插入图片描述

2. 数据集整理

2.1 首先新建SIXray文件夹，里面包含如下内容：Annotations文件夹里为所有的xml文件，images文件夹里为所有的jpg文件，ImageSets文件夹里再新建一个Main文件夹，labels为空文件夹。

在这里插入图片描述

2.2 先将以下代码的convert_annotation函数中in_file、out_file的文件路径修改为你自己数据集所对应的路径。

import xml.etree.ElementTree as ET
import os
from os import getcwd
# Names of the dataset splits; test2() reads ImageSets\Main\<name>.txt for
# each entry and writes a matching <name>.txt list of image paths.
sets = ['train', 'val', 'test']
# Object classes kept during conversion. The position of a name in this list
# is the numeric class id written to the label files (see classes.index in
# convert_annotation), so the order must not be changed once labels exist.
classes = ["Gun", "Knife","Wrench","Pliers", "Scissors"]
def convert(size, box):
    """Turn a pixel-space box into a normalized centre/size box.

    Args:
        size: Image dimensions as ``(width, height)``.
        box: Box edges ordered ``(xmin, xmax, ymin, ymax)`` in pixels.

    Returns:
        A tuple ``(x, y, w, h)``: box centre and box extent, each multiplied
        by the reciprocal of the corresponding image dimension.
    """
    # Reciprocals are computed once and multiplied in, rather than dividing
    # each value, so the floating-point results stay exactly as before.
    inv_width = 1. / (size[0])
    inv_height = 1. / (size[1])

    # The centre is shifted by one pixel before normalization.
    centre_x = (box[0] + box[1]) / 2.0 - 1
    centre_y = (box[2] + box[3]) / 2.0 - 1
    extent_x = box[1] - box[0]
    extent_y = box[3] - box[2]

    return (
        centre_x * inv_width,
        centre_y * inv_height,
        extent_x * inv_width,
        extent_y * inv_height,
    )

def convert_annotation(image_id):
    """Convert one VOC-style XML annotation into a YOLO-format label file.

    Reads ``Annotations/<image_id>.xml`` and, for every ``object`` element
    whose ``name`` appears in the module-level ``classes`` list, writes one
    line ``<class_id> <x> <y> <w> <h>`` to ``labels/<image_id>.txt``. The box
    values come from the module-level ``convert`` helper. Objects that have no
    ``name`` element or whose name is not in ``classes`` are skipped. The
    label file is written (possibly empty) once the XML has been parsed.

    Args:
        image_id: File-name stem shared by the XML file and the label file.

    Raises:
        OSError: If the XML file cannot be opened or the label file cannot be
            written.
        xml.etree.ElementTree.ParseError: If the XML is malformed.
    """
    # Edit the two paths below (in_file / out_file) to match your dataset.
    with open('E:/chongda/SIXray/Annotations/%s.xml' % (image_id), encoding='UTF-8') as in_file:
        root = ET.parse(in_file).getroot()

    size_node = root.find('size')
    w = int(size_node.find('width').text)
    h = int(size_node.find('height').text)

    label_lines = []
    for obj in root.iter('object'):
        name_node = obj.find('name')
        if name_node is None:
            # Object without a class name: nothing to label.
            continue
        cls = name_node.text
        # Plain membership test: names outside `classes` must be skipped,
        # otherwise classes.index() below raises ValueError.
        if cls not in classes:
            continue
        cls_id = classes.index(cls)

        xmlbox = obj.find('bndbox')
        xmin = float(xmlbox.find('xmin').text)
        xmax = float(xmlbox.find('xmax').text)
        ymin = float(xmlbox.find('ymin').text)
        ymax = float(xmlbox.find('ymax').text)
        # Clamp boxes that were annotated past the right/bottom image edge.
        if xmax > w:
            xmax = w
        if ymax > h:
            ymax = h

        bb = convert((w, h), (xmin, xmax, ymin, ymax))
        label_lines.append(str(cls_id) + " " + " ".join([str(a) for a in bb]) + '\n')

    # Context managers guarantee both files are closed (and the labels
    # flushed to disk) even if an error occurs part-way through.
    with open('E:/chongda/SIXray/labels/%s.txt' % (image_id), 'w') as out_file:
        out_file.writelines(label_lines)

#划分训练集，测试集，验证集
def test():
    """Split the dataset into trainval / train / val / test id lists.

    Lists the files in ``--xml_path``, strips their extensions to obtain
    sample ids, and writes ``trainval.txt``, ``train.txt``, ``val.txt`` and
    ``test.txt`` (one id per line) into ``--txt_path``. With the ratios below,
    about 81% of the samples go to train, 9% to val and 10% to test. The
    split is seeded, and the directory listing is sorted first so the same
    files always produce the same split.

    Command-line arguments are read from ``sys.argv`` via ``argparse``.
    """
    import os
    import random
    import argparse

    parser = argparse.ArgumentParser()
    # Directory whose file names supply the sample ids; only the names are
    # used, the contents are never read.
    # NOTE(review): the default points at the labels directory, not
    # Annotations, so it must already be populated when this runs — confirm
    # the intended call order.
    parser.add_argument('--xml_path', default=r'E:\chongda\SIXray\labels', type=str, help='input xml label path')
    # Output directory for the split lists (ImageSets/Main of your dataset).
    parser.add_argument('--txt_path', default=r'E:\chongda\SIXray\ImageSets\Main', type=str, help='output txt label path')
    opt = parser.parse_args()

    # Fraction of ALL samples that go to train+val (the rest is the test set).
    trainval_percent = 0.9
    # Fraction of the train+val samples that go to train (the rest is val).
    train_percent = 0.9

    xmlfilepath = opt.xml_path
    txtsavepath = opt.txt_path
    # os.listdir returns entries in arbitrary order; sorting makes the seeded
    # sampling below reproducible across machines and file systems.
    total_xml = sorted(os.listdir(xmlfilepath))
    os.makedirs(txtsavepath, exist_ok=True)

    random.seed(2022)
    num = len(total_xml)
    list_index = range(num)
    tv = int(num * trainval_percent)
    tr = int(tv * train_percent)
    trainval = random.sample(list_index, tv)
    train = random.sample(trainval, tr)
    # Sets give O(1) membership tests in the loop below.
    trainval_ids = set(trainval)
    train_ids = set(train)

    with open(os.path.join(txtsavepath, 'trainval.txt'), 'w') as file_trainval, \
            open(os.path.join(txtsavepath, 'test.txt'), 'w') as file_test, \
            open(os.path.join(txtsavepath, 'train.txt'), 'w') as file_train, \
            open(os.path.join(txtsavepath, 'val.txt'), 'w') as file_val:
        for i in list_index:
            # splitext removes the extension whatever its length.
            name = os.path.splitext(total_xml[i])[0] + '\n'
            if i in trainval_ids:
                file_trainval.write(name)
                if i in train_ids:
                    file_train.write(name)
                else:
                    file_val.write(name)
            else:
                file_test.write(name)
#根据划分的数据集生成对应的文件路径
def test2():
    """Write one image-path list file per dataset split.

    For each split name in the module-level ``sets``, reads the ids from
    ``ImageSets\\Main\\<split>.txt`` and writes ``<split>.txt`` in the dataset
    root, containing one ``images\\<id>.jpg`` path per line.

    Raises:
        OSError: If a split file cannot be read or a list file cannot be
            written.
    """
    for image_set in sets:
        with open(r'E:\chongda\SIXray\ImageSets\Main\%s.txt' % (image_set)) as id_file:
            image_ids = id_file.read().strip().split()

        with open(r'E:\chongda\SIXray\%s.txt' % (image_set), 'w') as list_file:
            # Raw string for the Windows path: backslashes such as "\c" or
            # "\S" are invalid escape sequences in a normal literal. The
            # newline is appended separately so it is still a real newline.
            list_file.writelines(
                r'E:\chongda\SIXray\images\%s.jpg' % (image_id) + '\n'
                for image_id in image_ids
            )
#将原数据标签转化成我们需要的标签
def test3():
    """Convert every XML annotation in the Annotations directory.

    Calls ``convert_annotation`` once per ``.xml`` file, passing the file name
    without its extension. Entries with any other extension (or none) are
    skipped, so stray files in the directory do not abort the run.
    """
    path = r'E:\chongda\SIXray\Annotations'
    for file_name in os.listdir(path):
        image_id, extension = os.path.splitext(file_name)
        if extension.lower() != '.xml':
            continue
        convert_annotation(image_id)