EADST

YOLOv5: Data Preparation for Training

YOLOv5: Data Preparation for Training, from VOC Format to YOLO Format

First, split the annotated data into training and validation sets, and write the file names of each set to a txt file.

import os
import random

# Randomly split the VOC annotation files into a training list and a
# validation list, written as one base name (no extension) per line.
train_percent = 0.95  # fraction of the samples assigned to the training set
xmlfilepath = 'bucket_v1/Annotations'
txtsavepath = 'bucket_v1/ImageSets'
# Keep only annotation files so stray directory entries never end up in the
# lists (the conversion step expects "<name>.xml" to exist for every name).
total_xml = [f for f in os.listdir(xmlfilepath) if f.endswith('.xml')]

num = len(total_xml)
trainval = range(num)
tr = int(num * train_percent)
train = random.sample(trainval, tr)
# Set copy of the sampled indices: O(1) membership test inside the loop.
train_indices = set(train)

# The context manager guarantees both list files are flushed and closed.
with open('bucket_v1/ImageSets/Main/train.txt', 'w') as ftrain, \
        open('bucket_v1/ImageSets/Main/val.txt', 'w') as fval:
    for i in trainval:
        # Strip the ".xml" extension; the remaining stem identifies the sample.
        name = os.path.splitext(total_xml[i])[0] + '\n'
        if i in train_indices:
            ftrain.write(name)
        else:
            fval.write(name)

Second, convert VOC format data (xml) to YOLO format data (txt)

import os
from tqdm import tqdm
from lxml import etree
import json
import shutil

# Root directory of the VOC-style dataset and its version name.
voc_root = "/dfs/data/others/byolov5/dataset/bucket_v1"
voc_version = "bucket_v1"

# Names of the split list files and the root directory for the YOLO output.
train_txt = "train.txt"
val_txt = "val.txt"
save_file_root = "/dfs/data/others/byolov5/dataset/yolo_data"

# Paths derived from voc_root: images, xml annotations and the two split lists.
voc_images_path = os.path.join(voc_root, "JPEGImages")
voc_xml_path = os.path.join(voc_root, "Annotations")
train_txt_path = os.path.join(voc_root, "ImageSets", "Main", train_txt)
val_txt_path = os.path.join(voc_root, "ImageSets", "Main", val_txt)

def parse_xml_to_dict(xml):
    """Recursively convert an XML element into nested dictionaries.

    Args:
        xml: An element that supports ``len()``, iteration over its children
            and the ``tag`` / ``text`` attributes.

    Returns:
        ``{tag: text}`` for an element without children; otherwise
        ``{tag: {...}}`` mapping each child tag to its converted content.
        Children tagged ``object`` are collected into a list because an
        annotation may contain several of them; for any other tag a later
        sibling with the same tag overwrites the earlier one.
    """
    if len(xml) == 0:
        # Leaf element: nothing to recurse into, keep its text.
        return {xml.tag: xml.text}

    result = {}
    for child in xml:
        child_result = parse_xml_to_dict(child)
        if child.tag != 'object':
            result[child.tag] = child_result[child.tag]
        else:
            # Several objects can appear in one annotation; accumulate them.
            if child.tag not in result:
                result[child.tag] = []
            result[child.tag].append(child_result[child.tag])
    return {xml.tag: result}

def translate_info(file_names: list, save_root: str, class_dict: dict, train_val='train'):
    """Convert VOC xml annotations to YOLO txt labels and copy the images.

    For every name in ``file_names`` the image ``<name>.jpg`` is looked up in
    the module-level ``voc_images_path`` and the annotation ``<name>.xml`` in
    ``voc_xml_path``. One label file is written to
    ``<save_root>/<train_val>/labels`` and the image is copied to
    ``<save_root>/<train_val>/images`` unless it already exists there.

    Each label line is ``class_index xcenter ycenter w h``, with the box
    values divided by the image width/height read from the xml and rounded to
    six decimals. ``class_index`` is ``class_dict[name] - 1``.

    Args:
        file_names: Sample names without extension.
        save_root: Root directory of the converted dataset.
        class_dict: Maps class name to a 1-based class id.
        train_val: Sub-directory name of the split being converted.

    Raises:
        AssertionError: If an image or annotation file is missing.
        KeyError: If an object's class name is not in ``class_dict``.
    """
    save_txt_path = os.path.join(save_root, train_val, "labels")
    os.makedirs(save_txt_path, exist_ok=True)
    save_images_path = os.path.join(save_root, train_val, "images")
    os.makedirs(save_images_path, exist_ok=True)

    for file in tqdm(file_names, desc="translate {} file...".format(train_val)):
        img_path = os.path.join(voc_images_path, file + ".jpg")
        assert os.path.exists(img_path), "file:{} not exist...".format(img_path)

        xml_path = os.path.join(voc_xml_path, file + ".xml")
        assert os.path.exists(xml_path), "file:{} not exist...".format(xml_path)

        # Read the xml as bytes: lxml rejects already-decoded strings that
        # carry an encoding declaration, while bytes work in both cases.
        with open(xml_path, "rb") as fid:
            xml_bytes = fid.read()
        xml = etree.fromstring(xml_bytes)
        data = parse_xml_to_dict(xml)["annotation"]
        img_height = int(data["size"]["height"])
        img_width = int(data["size"]["width"])

        # Samples without any object get neither a label file nor an image copy.
        if "object" not in data:
            print("Warning: in '{}' xml, there are no objects.".format(xml_path))
            continue

        label_lines = []
        for obj in data["object"]:
            xmin = float(obj["bndbox"]["xmin"])
            xmax = float(obj["bndbox"]["xmax"])
            ymin = float(obj["bndbox"]["ymin"])
            ymax = float(obj["bndbox"]["ymax"])
            class_name = obj["name"]
            # class_dict ids start at 1; the label files use 0-based indices.
            class_index = class_dict[class_name] - 1

            # Skip degenerate boxes instead of writing zero/negative sizes.
            if xmax <= xmin or ymax <= ymin:
                print("Warning: in '{}' xml, there are some bbox w/h <=0".format(xml_path))
                continue

            # Corner coordinates -> centre point plus width/height.
            xcenter = xmin + (xmax - xmin) / 2
            ycenter = ymin + (ymax - ymin) / 2
            w = xmax - xmin
            h = ymax - ymin

            # Normalise by the image size taken from the annotation.
            xcenter = round(xcenter / img_width, 6)
            ycenter = round(ycenter / img_height, 6)
            w = round(w / img_width, 6)
            h = round(h / img_height, 6)

            label_lines.append(
                " ".join(str(i) for i in [class_index, xcenter, ycenter, w, h])
            )

        # Joining the kept lines avoids a leading blank line when the first
        # object of an annotation was skipped as degenerate.
        with open(os.path.join(save_txt_path, file + ".txt"), "w") as f:
            f.write("\n".join(label_lines))

        # Copy the image next to its labels unless it is already there.
        path_copy_to = os.path.join(save_images_path, os.path.basename(img_path))
        if not os.path.exists(path_copy_to):
            shutil.copyfile(img_path, path_copy_to)

def main():
    """Convert the train and val splits from VOC format to YOLO format.

    Reads the sample names listed in ``train_txt_path`` and ``val_txt_path``
    (blank lines are ignored) and passes each list to ``translate_info``
    together with ``save_file_root`` and the class-name-to-id mapping.
    """
    # Class ids are 1-based here; translate_info subtracts 1 when writing.
    class_dict = {"b": 1, "t": 2}

    # Train is processed first, then val, each read right before conversion.
    for split_name, txt_path in (("train", train_txt_path), ("val", val_txt_path)):
        with open(txt_path, "r") as r:
            file_names = [i for i in r.read().splitlines() if len(i.strip()) > 0]
        translate_info(file_names, save_file_root, class_dict, split_name)

# Run the conversion only when this file is executed as a script.
if __name__ == "__main__":
    main()

Reference:

Train Custom Data

相关标签
About Me
XD
Goals determine what you are going to be.
Category
标签云
Distillation CV CUDA TensorRT Proxy v2ray Shortcut ResNet-50 MD5 Miniforge 版权 云服务器 Website LoRA Attention transformers JSON Logo Pandas Bin git CAM Excel Hungarian 关于博主 Nginx Input LaTeX SQL SAM ModelScope Qwen2.5 多进程 uwsgi logger Ptyhon Hilton Disk SQLite OpenAI Sklearn Permission Llama Magnet DeepSeek Heatmap Freesound 报税 diffusers Vmess OpenCV Crawler scipy GoogLeNet ChatGPT 多线程 Template Firewall CSV llama.cpp GIT BTC Markdown 域名 NLTK 签证 UI SPIE Django YOLO Data Git COCO Tracking Conda Interview Pillow 强化学习 UNIX 顶会 uWSGI Bipartite Baidu 财报 Base64 tqdm Review Domain ONNX Tiktoken Image2Text BeautifulSoup AI Anaconda VPN Datetime 公式 图形思考法 PDF LLAMA GGML 第一性原理 FP32 递归学习法 CC Zip hf QWEN 音频 飞书 Ubuntu Google VSCode Tensor SVR Breakpoint TensorFlow git-lfs C++ mmap CLAP Password 继承 RAR FP8 XGBoost Land TSV Plate Algorithm Translation RGB Streamlit News LLM Pytorch tar Docker Diagram Web Card 阿里云 Augmentation Jetson NLP Color Quantization torchinfo printf Paper 算法题 FP64 FP16 Vim Qwen2 Pickle Bitcoin Use Statistics Animate FastAPI InvalidArgumentError Qwen Dataset BF16 PIP Linux VGG-16 WebCrawler EXCEL CEIR Knowledge XML GPT4 Math Video Mixtral Hotel Agent Paddle Numpy FlashAttention LeetCode Search WAN Quantize Github 证件照 Claude NameSilo 搞笑 CTC Random Safetensors Food HaggingFace 腾讯云 Plotly TTS Michelin GPTQ HuggingFace Transformers PyCharm Jupyter Bert v0.dev Gemma PyTorch Clash DeepStream OCR Cloudreve Windows PDB Python 净利润 API IndexTTS2
站点统计

本站现有博文321篇,共被浏览773615

本站已经建立2463天!

热门文章
文章归档
回到顶部