yolo 检查数据

原创于 2025-11-07 15:31:24 发布 · 222 阅读

0 ·

CC 4.0 BY-SA版权

文章标签：

#YOLO #python #开发语言

yolo 专栏收录该内容

88 篇文章

订阅专栏

yolo 检查数据

import os

import yaml
def _as_path_list(value):
    """Normalise one YAML entry to a list of paths; ``None`` means no paths."""
    if value is None:
        return []
    if isinstance(value, list):
        # Drop null items so callers never receive None in place of a path.
        return [item for item in value if item is not None]
    return [value]


def load_dataset_paths(yaml_path):
    """Read the ``train``, ``val`` and ``test`` entries of a dataset YAML file.

    Each entry may be a single value or a list; every entry is returned as a
    list. A key that is missing, or present without a value (which YAML loads
    as ``None``), yields an empty list instead of ``[None]``.

    Args:
        yaml_path: Path of the YAML file; it is opened as UTF-8 text.

    Returns:
        A tuple ``(train_paths, val_paths, test_paths)`` of three lists.

    Raises:
        OSError: If the file cannot be opened.
        yaml.YAMLError: If the file is not valid YAML.
    """
    with open(yaml_path, 'r', encoding='utf-8') as f:
        # safe_load returns None for an empty document; fall back to an empty
        # mapping so the lookups below do not fail with AttributeError.
        data = yaml.safe_load(f) or {}

    train_paths = _as_path_list(data.get("train"))
    val_paths = _as_path_list(data.get("val"))
    test_paths = _as_path_list(data.get("test"))

    return train_paths, val_paths, test_paths

# File-name suffixes that the script deletes from every dataset directory.
# NOTE(review): 'jpeg' also matches '*.jpeg' image files, and 'xpng' looks like
# a deliberately disabled 'png' entry -- confirm this tuple is intended before
# running the script on data that cannot be regenerated.
REMOVABLE_SUFFIXES = ('.cache', 'xpng', 'jpeg')


def remove_files_with_suffixes(root_dir, suffixes=REMOVABLE_SUFFIXES):
    """Delete every file under ``root_dir`` whose name ends with a suffix.

    The directory tree is walked recursively with ``os.walk``. A directory
    that does not exist produces no matches, because ``os.walk`` ignores
    listing errors by default.

    Args:
        root_dir: Directory to scan. ``None`` or an empty string is skipped,
            since ``os.walk`` cannot accept ``None``.
        suffixes: Iterable of file-name endings to match.

    Returns:
        List of the paths that were removed, in walk order.

    Raises:
        OSError: If a matched file cannot be removed.
    """
    if not root_dir:
        return []

    endings = tuple(suffixes)  # str.endswith needs a tuple, not a list
    # Collect all matches first, then delete, so the walk sees a stable tree.
    targets = [
        os.path.join(current_dir, file_name)
        for current_dir, _subdirs, file_names in os.walk(root_dir)
        for file_name in file_names
        if file_name.endswith(endings)
    ]
    for target in targets:
        os.remove(target)
    return targets


if __name__ == '__main__':
    # Example dataset config
    yaml_file = r"data_jiezhi_jita.yaml"
    # The loader also returns the test paths, but this script only cleans the
    # train and val directories.
    train_paths, val_paths, _test_paths = load_dataset_paths(yaml_file)

    for heading, split_paths in (("Train paths:", train_paths),
                                 ("\nVal paths:", val_paths)):
        print(heading)
        for dir_a in split_paths:
            remove_files_with_suffixes(dir_a)
            print("  ", dir_a)