功能
利用Labelme标注之后生成的json文件,生成语义分割数据集的label和原图
代码
import base64
import json
import os
import os.path as osp
import imgviz
import PIL.Image
from labelme.logger import logger
from labelme import utils
from tqdm import tqdm
def main():
logger.warning(
"This script is aimed to demonstrate how to convert the "
"JSON file to a single image dataset."
)
logger.warning(
"It won't handle multiple JSON files to generate a "
"real-use dataset."
)
# json_file是标注完之后生成的json文件的目录。out_jpgs_path是输出的原始图像目录,out_mask_path是输出的label目录
json_file = r"**/json"
out_jpgs_path = "**/JPEGImages"
out_mask_path = "**/Annotations"
# 如果输出的路径不存在,则自动创建这个路径
if not osp.exists(out_jpgs_path):
os.mkdir(out_jpgs_path)
if not osp.exists(out_mask_path):
os.mkdir(out_mask_path)
num = 0
for file_name in tqdm(os.listdir(json_file)):
# 遍历json_file里面所有的文件,并判断这个文件是不是以.json结尾
if file_name.endswith(".json"):
path = os.path.join(json_file, file_name)
if os.path.isfile(path):
data = json.load(open(path))
# 获取json里面的图片数据,也就是二进制数据
imageData = data.get("imageData")
# 如果通过data.get获取到的数据为空,就重新读取图片数据
if not imageData:
imagePath = os.path.join(json_file, data["imagePath"])
with open(imagePath, "rb") as f:
imageData = f.read()
imageData = base64.b64encode(imageData).decode("utf-8")
# 将二进制数据转变成numpy格式的数据
img = utils.img_b64_to_arr(imageData)
# 将类别名称转换成数值,以便于计算
label_name_to_value = {"_background_": 0}
for shape in sorted(data["shapes"], key=lambda x: x["label"]):
label_name = shape["label"]
if label_name in label_name_to_value:
label_value = label_name_to_value[label_name]
else:
label_value = len(label_name_to_value)
label_name_to_value[label_name] = label_value
lbl, _ = utils.shapes_to_label(img.shape, data["shapes"], label_name_to_value)
label_names = [None] * (max(label_name_to_value.values()) + 1)
for name, value in label_name_to_value.items():
label_names[value] = name
lbl_viz = imgviz.label2rgb(
label=lbl, image=imgviz.asgray(img), label_names=label_names, loc="rb"
)
# 将输出结果保存,
PIL.Image.fromarray(img).save(osp.join(out_jpgs_path, str(num) + '.png'))
utils.lblsave(osp.join(out_mask_path, "%s.png" % str(num)), lbl)
num += 1
print("Done")
if __name__ == "__main__":
main()