Add evaluation code

ChunML · ChunML · commit 0654107cb2f5 · 2019-12-17T14:33:03.000+09:00
diff --git a/test.py b/test.py
@@ -8,7 +8,7 @@
 
 from anchor import generate_default_boxes
 from box_utils import decode, compute_nms
-from data import create_batch_generator
+from voc_data import create_batch_generator
 from image_utils import ImageVisualizer
 from losses import create_losses
 from network import create_ssd
@@ -118,13 +118,12 @@ def predict(imgs, default_boxes):
         visualizer.save_image(
             original_image, boxes, classes, '{}.jpg'.format(filename))
 
-        log_file = os.path.join('outputs/detects', '{}.txt'.format(filename))
+        log_file = os.path.join('outputs/detects', '{}.txt')
 
-        with open(log_file, 'w') as f:
-            log = []
-            for cls, box, score in zip(classes, boxes, scores):
-                cls_name = info['idx_to_name'][cls - 1]
-                log.append(
-                    ','.join([cls_name, *[str(c) for c in box], str(score)]))
-            log = '\n'.join(log)
-            f.write(log)
+        for cls, box, score in zip(classes, boxes, scores):
+            cls_name = info['idx_to_name'][cls - 1]
+            with open(log_file.format(cls_name), 'a') as f:
+                f.write('{} {} {} {} {} {}\n'.format(
+                    filename,
+                    score,
+                    *[coord for coord in box]))
diff --git a/train.py b/train.py
@@ -6,7 +6,7 @@
 import yaml
 
 from tensorflow.keras.optimizers.schedules import PiecewiseConstantDecay
-from data import create_batch_generator
+from voc_data import create_batch_generator
 from anchor import generate_default_boxes
 from network import create_ssd
 from losses import create_losses
@@ -110,7 +110,7 @@ def train_step(imgs, gt_confs, gt_locs, ssd, criterion, optimizer):
             avg_loss = (avg_loss * i + loss.numpy()) / (i + 1)
             avg_conf_loss = (avg_conf_loss * i + conf_loss.numpy()) / (i + 1)
             avg_loc_loss = (avg_loc_loss * i + loc_loss.numpy()) / (i + 1)
-            if (i + 1) % 2 == 0:
+            if (i + 1) % 50 == 0:
                 print('Epoch: {} Batch {} Time: {:.2}s | Loss: {:.4f} Conf: {:.4f} Loc: {:.4f}'.format(
                     epoch + 1, i + 1, time.time() - start, avg_loss, avg_conf_loss, avg_loc_loss))
 
diff --git a/voc_data.py b/voc_data.py
diff --git a/voc_eval.py b/voc_eval.py
@@ -0,0 +1,173 @@
+import os
+import numpy as np
+import xml.etree.ElementTree as ET
+import argparse
+
+
+# Spellings that switch a boolean option off (compared case-insensitively).
+_FALSE_STRINGS = ('', '0', 'false', 'f', 'no', 'n', 'off')
+
+
+def _str2bool(value):
+    """Turn a command-line string into a bool.
+
+    ``type=bool`` would call ``bool()`` on the raw text, which is True for
+    every non-empty string -- including "False" and "0". Anything not
+    listed in ``_FALSE_STRINGS`` still counts as True, so values that used
+    to enable the flag keep enabling it.
+    """
+    return value.strip().lower() not in _FALSE_STRINGS
+
+
+# Options are parsed at import time; ``args`` is read by the __main__ block.
+parser = argparse.ArgumentParser()
+parser.add_argument('--data-dir', default='../dataset',
+                    help='directory that contains the VOC<year> folder')
+parser.add_argument('--data-year', default='2007',
+                    help='dataset year used to build the VOC<year> folder name')
+parser.add_argument('--detect-dir', default='./outputs/detects',
+                    help='directory holding one <class>.txt detection file '
+                         'per class')
+parser.add_argument('--use-07-metric', type=_str2bool, default=False,
+                    help='true/false: use the 11-point AP metric')
+args = parser.parse_args()
+
+
+def get_annotation(anno_file):
+    """Read every ``<object>`` entry of a VOC-style XML annotation.
+
+    Args:
+        anno_file: annotation source, handed unchanged to ``ET.parse``.
+
+    Returns:
+        A list with one dict per ``<object>`` element, holding the text of
+        its ``name`` and ``pose`` children, ``truncated`` and ``difficult``
+        converted to int, and ``bbox`` as ``[xmin, ymin, xmax, ymax]`` ints
+        taken from the ``bndbox`` child.
+    """
+    def text_of(node, tag):
+        # Text content of the first child element called ``tag``.
+        return node.find(tag).text
+
+    parsed = []
+    for node in ET.parse(anno_file).findall('object'):
+        corners = node.find('bndbox')
+        parsed.append({
+            'name': text_of(node, 'name'),
+            'pose': text_of(node, 'pose'),
+            'truncated': int(text_of(node, 'truncated')),
+            'difficult': int(text_of(node, 'difficult')),
+            'bbox': [int(text_of(corners, side))
+                     for side in ('xmin', 'ymin', 'xmax', 'ymax')],
+        })
+
+    return parsed
+
+
+def compute_ap(rec, prec, ap=0.0, use_07_metric=False):
+    """Compute average precision from a recall/precision curve.
+
+    Args:
+        rec: recall values, one per ranked detection (array-like).
+        prec: precision values aligned with ``rec`` (array-like).
+        ap: ignored. The result is always computed from scratch; the
+            parameter is retained, now with a default, only so existing
+            positional calls keep working.
+        use_07_metric: if true, average the best precision reachable at
+            the 11 recall thresholds 0.0, 0.1, ..., 1.0. Otherwise sum the
+            area under the precision envelope over the recall steps.
+
+    Returns:
+        The average precision as a float.
+    """
+    rec = np.asarray(rec, dtype=float)
+    prec = np.asarray(prec, dtype=float)
+
+    if use_07_metric:
+        ap = 0.0
+        for t in np.arange(0.0, 1.1, 0.1):
+            reached = rec >= t
+            # Best precision at any recall >= t; 0 if t is never reached.
+            p = np.max(prec[reached]) if reached.any() else 0.0
+            ap = ap + p / 11.0
+        return ap
+
+    # Sentinels pin the curve to recall 0 and 1 with zero precision.
+    mrec = np.concatenate(([0.0], rec, [1.0]))
+    mprec = np.concatenate(([0.0], prec, [0.0]))
+
+    # Precision envelope: running maximum taken from right to left, so
+    # precision never increases as recall grows.
+    mprec = np.maximum.accumulate(mprec[::-1])[::-1]
+
+    # Only positions where recall changes contribute area.
+    steps = np.where(mrec[1:] != mrec[:-1])[0]
+
+    return np.sum((mrec[steps + 1] - mrec[steps]) * mprec[steps + 1])
+
+
+def voc_eval(det_path, anno_path, cls_name, iou_thresh=0.5, use_07_metric=False):
+    """Score one class's detections against VOC-style annotations.
+
+    Args:
+        det_path: format string; ``det_path.format(cls_name)`` names the
+            detection file. Each non-blank line reads
+            ``image_id score xmin ymin xmax ymax`` (whitespace separated).
+        anno_path: format string; ``anno_path.format(image_id)`` names the
+            XML annotation of an image.
+        cls_name: class whose detections and ground truth are compared.
+        iou_thresh: a detection can match a ground-truth box only when
+            their IoU is strictly greater than this value.
+        use_07_metric: forwarded to ``compute_ap``.
+
+    Returns:
+        ``(recall, precision, ap)``. ``recall`` and ``precision`` are
+        cumulative arrays with one entry per detection, ordered by
+        descending score; ``ap`` is the value from ``compute_ap``.
+
+    Note:
+        Ground truth is read only for images listed in the detection
+        file, so objects in images without any detection of this class do
+        not count towards the number of positives.
+    """
+    with open(det_path.format(cls_name), 'r') as f:
+        rows = [line.split() for line in f if line.strip()]
+
+    image_ids = [row[0] for row in rows]
+    confs = np.array([float(row[1]) for row in rows])
+    # reshape keeps a 2-D (0, 4) array when the file holds no detections.
+    boxes = np.array(
+        [[float(v) for v in row[2:6]] for row in rows]).reshape(-1, 4)
+
+    cls_gts = {}
+    npos = 0
+    # Visit every image once: the detection file repeats an image id for
+    # each of its boxes, and recounting would inflate npos.
+    for image_id in dict.fromkeys(image_ids):
+        objs = [obj for obj in get_annotation(anno_path.format(image_id))
+                if obj['name'] == cls_name]
+        difficult = np.array([obj['difficult'] for obj in objs], dtype=bool)
+        # Objects flagged difficult are not counted as positives.
+        npos += int(np.sum(~difficult))
+        cls_gts[image_id] = {
+            'gt_boxes': np.array([obj['bbox'] for obj in objs], dtype=float),
+            'difficult': difficult,
+            'det': [False] * len(objs),
+        }
+
+    # Rank detections from most to least confident.
+    order = np.argsort(-confs)
+    boxes = boxes[order, :]
+    image_ids = [image_ids[i] for i in order]
+
+    nd = len(image_ids)
+    tp = np.zeros(nd)
+    fp = np.zeros(nd)
+    for d in range(nd):
+        gt = cls_gts[image_ids[d]]
+        box = boxes[d, :]
+        gt_box = gt['gt_boxes']
+        iou_max = -np.inf
+
+        if gt_box.size > 0:
+            # Intersection rectangle: the larger of the two minima and the
+            # smaller of the two maxima on each axis.
+            ixmin = np.maximum(gt_box[:, 0], box[0])
+            iymin = np.maximum(gt_box[:, 1], box[1])
+            ixmax = np.minimum(gt_box[:, 2], box[2])
+            iymax = np.minimum(gt_box[:, 3], box[3])
+            # The +1.0 treats coordinates as inclusive pixel indices.
+            iw = np.maximum(ixmax - ixmin + 1.0, 0.0)
+            ih = np.maximum(iymax - iymin + 1.0, 0.0)
+            inters = iw * ih
+
+            uni = ((box[2] - box[0] + 1.0) * (box[3] - box[1] + 1.0) +
+                   (gt_box[:, 2] - gt_box[:, 0] + 1.0) *
+                   (gt_box[:, 3] - gt_box[:, 1] + 1.0) - inters)
+
+            ious = inters / uni
+            jmax = int(np.argmax(ious))
+            iou_max = ious[jmax]
+
+        if iou_max > iou_thresh:
+            # A match with a difficult object is neither a TP nor an FP.
+            if not gt['difficult'][jmax]:
+                if not gt['det'][jmax]:
+                    tp[d] = 1.0
+                    gt['det'][jmax] = True
+                else:
+                    # This ground-truth box was already claimed by a
+                    # higher-scoring detection.
+                    fp[d] = 1.0
+        else:
+            fp[d] = 1.0
+
+    fp = np.cumsum(fp)
+    tp = np.cumsum(tp)
+    # Without any positive there is nothing to recall; report zeros rather
+    # than dividing by zero.
+    recall = tp / float(npos) if npos > 0 else np.zeros(nd)
+    precision = tp / np.maximum(tp + fp, np.finfo(np.float64).eps)
+
+    # compute_ap's third positional slot is its unused ``ap`` argument, so
+    # the metric switch has to be passed by keyword.
+    ap = compute_ap(recall, precision, 0.0, use_07_metric=use_07_metric)
+
+    return recall, precision, ap
+
+
+if __name__ == '__main__':
+    # The 20 PASCAL VOC object classes, in the order they are reported.
+    class_names = [
+        'aeroplane', 'bicycle', 'bird', 'boat', 'bottle',
+        'bus', 'car', 'cat', 'chair', 'cow',
+        'diningtable', 'dog', 'horse', 'motorbike', 'person',
+        'pottedplant', 'sheep', 'sofa', 'train', 'tvmonitor',
+    ]
+
+    # The path templates do not depend on the class, so build them once.
+    det_path = os.path.join(args.detect_dir, '{}.txt')
+    anno_path = os.path.join(
+        args.data_dir, 'VOC{}'.format(args.data_year), 'Annotations', '{}.xml')
+
+    # A class without a detection file keeps an AP of 0.0 in the report
+    # but is left out of the mean.
+    aps = {cls_name: 0.0 for cls_name in class_names}
+    evaluated = []
+    for cls_name in class_names:
+        if not os.path.exists(det_path.format(cls_name)):
+            continue
+        recall, precision, ap = voc_eval(
+            det_path,
+            anno_path,
+            cls_name,
+            use_07_metric=args.use_07_metric)
+        aps[cls_name] = ap
+        evaluated.append(ap)
+
+    # np.mean([]) emits a RuntimeWarning and yields nan; report nan
+    # directly when no class could be evaluated.
+    aps['mAP'] = np.mean(evaluated) if evaluated else float('nan')
+    for key, value in aps.items():
+        print('{}: {}'.format(key, value))