多个coco数据标注文件合并

一、coco数据集是什么？

COCO（Common Objects in Context）是一个用于目标检测和图像分割任务的标注格式。如果你有多个COCO格式的JSON文件，你可能需要将它们合并成一个文件，以便更方便地处理和管理数据。在这篇博客中，我们将介绍一个用Python编写的脚本，可以实现这一合并操作。

二、完整代码

import json
import osdef merge_coco_files(folder_path):merged_data = {"info": {"year": 2023,"version": "1","date_created": "no need record"},"images": [],"annotations": [],"licenses": [{"id": 1,"name": "Unknown","url": ""}],"categories": [{"id": 1,"name": "hd","supercategory": ""}]}image_id_counter = 1annotation_id_counter = 1for root, dirs, files in os.walk(folder_path):for file in files:if file.endswith(".json"):file_path = os.path.join(root, file)with open(file_path, 'r') as f:data = json.load(f)# Update image IDs and filenamesfor image in data["images"]:image["id"] = image_id_counterimage_id_counter += 1# Use the original file name from the COCO fileimage["file_name"] = image["file_name"]# Append the updated image to the merged_data only if it's not already presentif image not in merged_data["images"]:merged_data["images"].append(image)# Update annotation IDs and image IDsfor annotation in data["annotations"]:annotation["id"] = annotation_id_counterannotation_id_counter += 1annotation["image_id"] = image_id_counter - 1  # Use the last assigned image ID# Append the updated annotation to the merged_datamerged_data["annotations"].append(annotation)# Save the merged data to a new JSON fileoutput_path = os.path.join(folder_path, "merged_coco.json")with open(output_path, 'w') as output_file:json.dump(merged_data, output_file, indent=4)print(f'Merged data saved to: {output_path}')# Provide the path to the folder containing the COCO JSON files
folder_path = r''
merge_coco_files(folder_path)