下面注释掉的这部分就是多线程访问读取,会报错。还是with h5py 打开hdf5文件后再用多线程执行文件比较靠谱
# def read_dataset(h5_filename, dataset_name):
# “”"
# 读取 HDF5 文件中的指定数据集。
# “”"
# # with h5py.File(h5_filename, ‘r’) as h5f:
# # data = h5f[dataset_name] # 读取数据集
# # return data,dataset_name
#
# try:
# with h5py.File(h5_filename, ‘r’) as h5f:
# data = h5f[dataset_name] # 读取数据集
# # print(dataset_name)
# # print(data.keys())
# return data, dataset_name
# except Exception as e:
# raise RuntimeError(f’Error processing {dataset_name}: {e}')
# # raise print(f"Error reading dataset ‘{name}’: {e}“)
# # return None, name
#
# def read_hdf5_parallel(h5_filename, n_workers=4):
# “””
# 并行读取 HDF5 文件中的所有数据集。
# “”"
# # 先获取所有数据集的名称
# with h5py.File(h5_filename, ‘r’) as h5f:
# dataset_names = list(h5f.keys())
#
# # 使用 ThreadPoolExecutor 并行读取
# results=[]
# with concurrent.futures.ThreadPoolExecutor(max_workers=n_workers) as e
07-22
1240
1240

最低0.47元/天 解锁文章

被折叠的 条评论
为什么被折叠?



