init

2024-11-27 23:22:08 +08:00
commit 28c518b355
108 changed files with 30312 additions and 0 deletions
@@ -0,0 +1,117 @@
+#-------------------------------------------------------#
+#   用于处理COCO数据集，根据json文件生成txt文件用于训练
+#-------------------------------------------------------#
+import json
+import os
+from collections import defaultdict
+
+#-------------------------------------------------------#
+#   Directories holding the COCO training and validation images
+#-------------------------------------------------------#
+train_datasets_path = "coco_dataset/train2017"
+val_datasets_path = "coco_dataset/val2017"
+
+#-------------------------------------------------------#
+#   Annotation (label) json files of the COCO training and validation sets
+#-------------------------------------------------------#
+train_annotation_path = "coco_dataset/annotations/instances_train2017.json"
+val_annotation_path = "coco_dataset/annotations/instances_val2017.json"
+
+#-------------------------------------------------------#
+#   Paths of the txt files generated by this script
+#-------------------------------------------------------#
+train_output_path = "coco_train.txt"
+val_output_path = "coco_val.txt"
+
+#-------------------------------------------------------#
+#   (first id, last id, shift) ranges used to close the gaps
+#   in the annotation category ids: an id inside a range is
+#   lowered by that range's shift, giving indices 0..79.
+#-------------------------------------------------------#
+_CATEGORY_SHIFTS = (
+    (1, 11, 1),
+    (13, 25, 2),
+    (27, 28, 3),
+    (31, 44, 5),
+    (46, 65, 6),
+    (67, 67, 7),
+    (70, 70, 9),
+    (72, 82, 10),
+    (84, 90, 11),
+)
+
+
+def _remap_category(cat):
+    """Return the class index written to the txt file for annotation id ``cat``.
+
+    An id that falls inside one of the ``_CATEGORY_SHIFTS`` ranges is lowered
+    by that range's shift; an id outside every range is returned unchanged.
+    """
+    for first, last, shift in _CATEGORY_SHIFTS:
+        if first <= cat <= last:
+            return cat - shift
+    return cat
+
+
+def _write_annotation_txt(annotation_path, datasets_path, output_path):
+    """Convert one annotation json file into a txt file with one image per line.
+
+    Every output line is the image path followed by one
+    `` x_min,y_min,x_max,y_max,class`` entry per annotation of that image.
+    Images without any annotation in the json file produce no line.
+
+    annotation_path: json file whose ``annotations`` list is read.
+    datasets_path:   directory joined in front of the ``%012d.jpg`` file name.
+    output_path:     txt file to (over)write.
+    """
+    # Context managers guarantee that both files are closed, even on error.
+    with open(annotation_path, encoding='utf-8') as f:
+        data = json.load(f)
+
+    # Group the boxes by image path, keeping the order of first appearance.
+    name_box_id = defaultdict(list)
+    for ant in data['annotations']:
+        name = os.path.join(datasets_path, '%012d.jpg' % ant['image_id'])
+        name_box_id[name].append([ant['bbox'], _remap_category(ant['category_id'])])
+
+    with open(output_path, 'w') as f:
+        for name, box_infos in name_box_id.items():
+            f.write(name)
+            for bbox, cat in box_infos:
+                # bbox is read as [x, y, width, height]; each value is
+                # truncated to int before the far corner is computed.
+                x_min = int(bbox[0])
+                y_min = int(bbox[1])
+                x_max = x_min + int(bbox[2])
+                y_max = y_min + int(bbox[3])
+
+                f.write(" %d,%d,%d,%d,%d" % (
+                    x_min, y_min, x_max, y_max, int(cat)))
+            f.write('\n')
+
+
+if __name__ == "__main__":
+    # The training and validation sets go through exactly the same conversion.
+    _write_annotation_txt(train_annotation_path, train_datasets_path, train_output_path)
+    _write_annotation_txt(val_annotation_path, val_datasets_path, val_output_path)
@@ -0,0 +1,113 @@
+import json
+import os
+
+import numpy as np
+import torch
+from PIL import Image
+from pycocotools.coco import COCO
+from pycocotools.cocoeval import COCOeval
+from tqdm import tqdm
+from utils.utils import cvtColor, get_classes, preprocess_input, resize_image
+from utils.utils_bbox import decode_outputs, non_max_suppression
+from yolo import YOLO
+
+#---------------------------------------------------------------------------#
+#   map_mode selects what this file computes when it is run
+#   map_mode = 0: the whole mAP pipeline, i.e. get the predictions and compute the mAP.
+#   map_mode = 1: only get the predictions.
+#   map_mode = 2: only compute the mAP.
+#---------------------------------------------------------------------------#
+map_mode = 0
+#-------------------------------------------------------#
+#   Validation-set annotation file and image directory
+#-------------------------------------------------------#
+cocoGt_path = 'coco_dataset/annotations/instances_val2017.json'
+dataset_img_path = 'coco_dataset/val2017'
+#-------------------------------------------------------#
+#   Folder the results are written to
+#-------------------------------------------------------#
+temp_save_path = 'map_out/coco_eval'
+
+class mAP_YOLO(YOLO):
+    """YOLO subclass whose ``detect_image`` collects detections as result dicts."""
+    #---------------------------------------------------#
+    #   Detect the objects of one image
+    #---------------------------------------------------#
+    def detect_image(self, image_id, image, results):
+        """Run the network on ``image`` and append one dict per kept box to ``results``.
+
+        Every dict holds ``image_id``, ``category_id``, ``bbox`` as
+        ``[left, top, width, height]`` and ``score``. ``category_id`` is looked
+        up in the module-level ``clsid2catid``, which has to exist before this
+        method is called. ``results`` is extended in place and also returned;
+        it is returned untouched when no box survives the suppression step.
+        """
+        #---------------------------------------------------#
+        #   Height and width of the input image
+        #---------------------------------------------------#
+        image_shape = np.array(np.shape(image)[0:2])
+        #---------------------------------------------------------#
+        #   Convert the image to RGB so that grayscale images do not
+        #   fail during prediction. Only RGB prediction is supported,
+        #   every other image type is converted to RGB.
+        #---------------------------------------------------------#
+        image = cvtColor(image)
+        #---------------------------------------------------------#
+        #   Resize to the network input size. Depending on
+        #   self.letterbox_image this pads with gray bars for an
+        #   undistorted resize, or resizes directly.
+        #---------------------------------------------------------#
+        target_size = (self.input_shape[1], self.input_shape[0])
+        resized = resize_image(image, target_size, self.letterbox_image)
+        #---------------------------------------------------------#
+        #   Preprocess, reorder the axes with (2, 0, 1) and add the
+        #   batch_size dimension in front
+        #---------------------------------------------------------#
+        pixels = preprocess_input(np.array(resized, dtype='float32'))
+        image_data = np.expand_dims(np.transpose(pixels, (2, 0, 1)), 0)
+
+        with torch.no_grad():
+            images = torch.from_numpy(image_data)
+            if self.cuda:
+                images = images.cuda()
+            #---------------------------------------------------------#
+            #   Feed the image through the network
+            #---------------------------------------------------------#
+            outputs = self.net(images)
+            outputs = decode_outputs(outputs, self.input_shape)
+            #---------------------------------------------------------#
+            #   Stack the predicted boxes and apply non-maximum suppression
+            #---------------------------------------------------------#
+            outputs = non_max_suppression(outputs, self.num_classes, self.input_shape,
+                        image_shape, self.letterbox_image, conf_thres = self.confidence, nms_thres = self.nms_iou)
+
+            detections = outputs[0]
+            if detections is None:
+                return results
+
+            # Column 6 is used as the class index, columns 4 and 5 are
+            # multiplied into the score, columns 0-3 are the box.
+            top_label = np.array(detections[:, 6], dtype = 'int32')
+            top_conf = detections[:, 4] * detections[:, 5]
+            top_boxes = detections[:, :4]
+
+        for label, score, box in zip(top_label, top_conf, top_boxes):
+            top, left, bottom, right = box
+            results.append({
+                "image_id": int(image_id),
+                "category_id": clsid2catid[label],
+                "bbox": [float(left), float(top), float(right - left), float(bottom - top)],
+                "score": float(score),
+            })
+        return results
+
+if __name__ == "__main__":
+    # exist_ok replaces the separate existence check before creating the folder.
+    os.makedirs(temp_save_path, exist_ok=True)
+    results_path = os.path.join(temp_save_path, 'eval_results.json')
+
+    cocoGt      = COCO(cocoGt_path)
+    # Only image ids that have at least one entry in imgToAnns are evaluated.
+    ids         = list(cocoGt.imgToAnns.keys())
+    # Read as a module global by mAP_YOLO.detect_image to turn a class index
+    # into a category id.
+    clsid2catid = cocoGt.getCatIds()
+
+    if map_mode == 0 or map_mode == 1:
+        yolo = mAP_YOLO(confidence = 0.001, nms_iou = 0.65)
+
+        results = []
+        for image_id in tqdm(ids):
+            image_path = os.path.join(dataset_img_path, cocoGt.loadImgs(image_id)[0]['file_name'])
+            # The context manager closes the image file once it has been processed.
+            with Image.open(image_path) as image:
+                results = yolo.detect_image(image_id, image, results)
+
+        # Written only after every prediction exists, so a failure during
+        # inference does not truncate a results file from an earlier run.
+        with open(results_path, "w") as f:
+            json.dump(results, f)
+
+    if map_mode == 0 or map_mode == 2:
+        cocoDt      = cocoGt.loadRes(results_path)
+        cocoEval    = COCOeval(cocoGt, cocoDt, 'bbox')
+        cocoEval.evaluate()
+        cocoEval.accumulate()
+        cocoEval.summarize()
+        print("Get map done.")