【json批量转为语义分割数据集的label和img】

本文链接：https://blog.youkuaiyun.com/qq_42598221/article/details/136386529

文章讲述了如何使用Python脚本将Labelme生成的带有注释的JSON文件转换为包含原始图像和标签的语义分割数据集，适合计算机视觉项目需求。

摘要生成于 C知道，由 DeepSeek-R1 满血版支持，前往体验 >

功能

利用Labelme标注之后生成的json文件，生成语义分割数据集的label和原图

代码

import base64
import json
import os
import os.path as osp

import imgviz
import PIL.Image

from labelme.logger import logger
from labelme import utils
from tqdm import tqdm


def main():
    logger.warning(
        "This script is aimed to demonstrate how to convert the "
        "JSON file to a single image dataset."
    )
    logger.warning(
        "It won't handle multiple JSON files to generate a "
        "real-use dataset."
    )

    # json_file是标注完之后生成的json文件的目录。out_jpgs_path是输出的原始图像目录，out_mask_path是输出的label目录
    json_file = r"**/json"

    out_jpgs_path = "**/JPEGImages"
    out_mask_path = "**/Annotations"

    # 如果输出的路径不存在，则自动创建这个路径
    if not osp.exists(out_jpgs_path):
        os.mkdir(out_jpgs_path)

    if not osp.exists(out_mask_path):
        os.mkdir(out_mask_path)
    num = 0
    for file_name in tqdm(os.listdir(json_file)):
        # 遍历json_file里面所有的文件，并判断这个文件是不是以.json结尾
        if file_name.endswith(".json"):
            path = os.path.join(json_file, file_name)
            if os.path.isfile(path):
                data = json.load(open(path))

                # 获取json里面的图片数据，也就是二进制数据
                imageData = data.get("imageData")
                # 如果通过data.get获取到的数据为空，就重新读取图片数据
                if not imageData:
                    imagePath = os.path.join(json_file, data["imagePath"])
                    with open(imagePath, "rb") as f:
                        imageData = f.read()
                        imageData = base64.b64encode(imageData).decode("utf-8")
                #  将二进制数据转变成numpy格式的数据
                img = utils.img_b64_to_arr(imageData)

                # 将类别名称转换成数值，以便于计算
                label_name_to_value = {"_background_": 0}
                for shape in sorted(data["shapes"], key=lambda x: x["label"]):
                    label_name = shape["label"]
                    if label_name in label_name_to_value:
                        label_value = label_name_to_value[label_name]
                    else:
                        label_value = len(label_name_to_value)
                        label_name_to_value[label_name] = label_value
                lbl, _ = utils.shapes_to_label(img.shape, data["shapes"], label_name_to_value)

                label_names = [None] * (max(label_name_to_value.values()) + 1)
                for name, value in label_name_to_value.items():
                    label_names[value] = name

                lbl_viz = imgviz.label2rgb(
                    label=lbl, image=imgviz.asgray(img), label_names=label_names, loc="rb"
                )

                # 将输出结果保存，
                PIL.Image.fromarray(img).save(osp.join(out_jpgs_path, str(num) + '.png'))
                utils.lblsave(osp.join(out_mask_path, "%s.png" % str(num)), lbl)
                num += 1

    print("Done")


if __name__ == "__main__":
    main()