python将json格式标签转换为txt格式标签(yolo格式)

大模型研究僧

已于 2023-03-13 15:23:50 修改

阅读量2.7k

点赞数 3

分类专栏：机器学习　文章标签：python json YOLO

于 2023-03-10 11:10:14 首次发布

本文链接：https://blog.youkuaiyun.com/weixin_44006686/article/details/129438580

版权

机器学习专栏收录该内容

6 篇文章

订阅专栏

该代码实现了一个Python脚本，主要功能是从指定的JSON文件中读取数据，将数据转换成多个TXT文件，并执行XYXY到XYWH的坐标转换。它首先读取JSON文件，然后遍历内容，根据图片路径创建对应的TXT文件，写入转换后的坐标信息。此外，还包含了一个方法用于在TXT文件中添加序号。

摘要生成于 C知道，由 DeepSeek-R1 满血版支持，前往体验 >

话不多说直接附代码
这段代码的主要用途是解析一个 JSON 文件，并将其转换成多个 TXT 标签文件。
同时会进行 xyxy → xywh 的坐标转换；如果不需要该转换，就不要调用 xyxyToXywh 方法。
使用时基本上只需要修改以下几处：
1. json_dir 和 out_dir 两个路径；
2. write_txt 方法内写死的输出地址；
3. get_json 方法中读取的 JSON 字段名称。

import os
import json
import jsonpath
import numpy as np

json_dir = r'D:\desktop\data_set\StanfordExtra\stanfordextra_v12\StanfordExtra_v12.json'  # path of the input JSON annotation file
out_dir = r'D:\desktop\data_set\StanfordExtra\labels'  # directory that receives the generated txt label files


def get_json():
    """Convert the JSON annotation file at ``json_dir`` into per-image txt files.

    The JSON document is iterated as a sequence of entries. From each entry
    the keys ``img_path``, ``img_width``, ``img_height`` and ``img_bbox`` are
    read. The box is converted with ``xyxyToXywh`` and written as a single
    ``x y w h`` line (space separated) to
    ``<out_dir>/<first path component>/<image name without extension>.txt``.

    ``img_path`` is split on ``/``; the first component is used as the
    sub-folder name and the second as the image file name.

    Raises:
        OSError: if the JSON file cannot be read or a label file cannot be
            written.
        KeyError: if an entry lacks one of the keys listed above.
    """
    # Use a context manager so the JSON file handle is always closed.
    with open(json_dir, 'r', encoding='utf-8') as json_file:
        entries = json.load(json_file)

    for entry in entries:
        img_path = entry["img_path"]
        x, y, w, h = xyxyToXywh(entry['img_bbox'], entry['img_width'], entry['img_height'])
        label_line = ' '.join(str(value) for value in (x, y, w, h))
        print('strtxt -----', label_line)
        print(img_path)

        path_parts = img_path.split('/')
        label_dir = os.path.join(out_dir, path_parts[0])
        # makedirs also creates out_dir itself when it is missing and does not
        # fail when the folder already exists.
        os.makedirs(label_dir, exist_ok=True)

        # splitext strips only the final extension, so image names that
        # contain additional dots are not truncated.
        stem = os.path.splitext(path_parts[1])[0]
        with open(os.path.join(label_dir, stem + '.txt'), "w", encoding="utf-8") as txt:
            txt.write(label_line)


def xyxyToXywh(imgPathList, imgWidth, imgHeight):
    """Return the normalised centre/size form ``(x, y, w, h)`` of a box.

    Despite the function name, the arithmetic treats ``imgPathList`` as
    ``[left, top, width, height]``: elements 2 and 3 are used directly as the
    box width and height.

    Args:
        imgPathList: indexable box; elements 0-3 are read.
        imgWidth: image width used to normalise ``x`` and ``w``.
        imgHeight: image height used to normalise ``y`` and ``h``.

    Returns:
        Tuple ``(x, y, w, h)``, each rounded to 6 decimals with ``np.round``:
        the box centre and the box size, divided by the image dimensions.
    """
    left, top = imgPathList[0], imgPathList[1]
    box_w, box_h = imgPathList[2], imgPathList[3]

    x = np.round(abs(left + box_w / 2) / imgWidth, 6)
    y = np.round(abs(top + box_h / 2) / imgHeight, 6)
    w = np.round(float(box_w) / imgWidth, 6)
    # Height must be normalised by the image height; it was previously
    # divided by the image width.
    h = np.round(float(box_h) / imgHeight, 6)
    print(x, y, w, h)
    return x, y, w, h

# Prefix the label lines of every file with an index derived from its folder
def add_kind(dir):
    """Prepend a per-folder index to each label line below ``dir``.

    The tree is walked top-down with ``os.walk``. The root folder itself gets
    index ``-1``; every folder visited afterwards gets the next integer
    (``0``, ``1``, ...). Sub-folders are visited in sorted name order so the
    numbering is the same on every run and platform.

    Every non-blank line of every file is rewritten as ``"<index> <line>"``.
    Files without any non-blank line are left empty.

    Args:
        dir: root directory of the label files.
    """
    for class_index, (root, dirs, files) in enumerate(os.walk(dir), start=-1):
        # Sorting in place steers the order in which os.walk descends, which
        # is otherwise whatever order the file system happens to report.
        dirs.sort()
        for file in sorted(files):
            label_path = os.path.join(root, file)
            with open(label_path, 'r', encoding='utf-8') as f:
                lines = f.readlines()
            # Tag every line (not only the first) so files holding several
            # boxes keep all of them; line endings are preserved as read.
            labelled = ''.join(
                str(class_index) + ' ' + line for line in lines if line.strip()
            )
            with open(label_path, 'w', encoding='utf-8') as f:
                f.write(labelled)

# Write the index -> folder-name lookup files for a label directory tree
def write_txt(dir, class_dir=r'D:\desktop\data_set\StanfordExtra\class'):
    """Write ``classify.txt`` and ``classify.json`` listing the folders in ``dir``.

    All directory names found by ``os.walk(dir)`` are collected (sorted by
    name within each level) and numbered from 0.

    * ``classify.txt`` gets one ``"<index> <name>"`` line per directory.
    * ``classify.json`` gets the names as a JSON array of strings.

    Args:
        dir: root folder whose sub-directories are listed.
        class_dir: folder that receives the two output files; it is created
            when missing. Defaults to the location that was previously
            hard-coded.
    """
    class_names = []
    for _root, dirs, _files in os.walk(dir):
        # Sort in place so the numbering does not depend on file-system order.
        dirs.sort()
        class_names.extend(dirs)

    os.makedirs(class_dir, exist_ok=True)

    with open(os.path.join(class_dir, 'classify.txt'), 'w', encoding='utf-8') as f:
        f.writelines(
            str(index) + ' ' + name + '\n' for index, name in enumerate(class_names)
        )

    # json.dump emits valid JSON; the previous hand-built text used single
    # quotes and a trailing comma, which JSON parsers reject.
    with open(os.path.join(class_dir, 'classify.json'), 'w', encoding='utf-8') as f:
        json.dump(class_names, f, ensure_ascii=False)

def main():
    """Run the conversion: call ``get_json`` and then ``add_kind(out_dir)``."""
    get_json()      # parse the JSON file and write the txt files
    add_kind(out_dir)
    # write_txt(out_dir)   # disabled: would generate the class lookup txt file
    print('结束')

if __name__ == '__main__':
    main()