# Copyright 2017 The TensorFlow Authors. All Rights Reserved.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
# ==============================================================================
|
|
"""Tests for tensorflow_model.object_detection.metrics.coco_tools."""
|
|
import json
|
|
import os
|
|
import re
|
|
import numpy as np
|
|
|
|
from pycocotools import mask
|
|
|
|
import tensorflow as tf
|
|
|
|
from object_detection.metrics import coco_tools
|
|
|
|
|
|
class CocoToolsTest(tf.test.TestCase):
|
|
|
|
def setUp(self):
|
|
groundtruth_annotations_list = [
|
|
{
|
|
'id': 1,
|
|
'image_id': 'first',
|
|
'category_id': 1,
|
|
'bbox': [100., 100., 100., 100.],
|
|
'area': 100.**2,
|
|
'iscrowd': 0
|
|
},
|
|
{
|
|
'id': 2,
|
|
'image_id': 'second',
|
|
'category_id': 1,
|
|
'bbox': [50., 50., 50., 50.],
|
|
'area': 50.**2,
|
|
'iscrowd': 0
|
|
},
|
|
]
|
|
image_list = [{'id': 'first'}, {'id': 'second'}]
|
|
category_list = [{'id': 0, 'name': 'person'},
|
|
{'id': 1, 'name': 'cat'},
|
|
{'id': 2, 'name': 'dog'}]
|
|
self._groundtruth_dict = {
|
|
'annotations': groundtruth_annotations_list,
|
|
'images': image_list,
|
|
'categories': category_list
|
|
}
|
|
|
|
self._detections_list = [
|
|
{
|
|
'image_id': 'first',
|
|
'category_id': 1,
|
|
'bbox': [100., 100., 100., 100.],
|
|
'score': .8
|
|
},
|
|
{
|
|
'image_id': 'second',
|
|
'category_id': 1,
|
|
'bbox': [50., 50., 50., 50.],
|
|
'score': .7
|
|
},
|
|
]
|
|
|
|
def testCocoWrappers(self):
|
|
groundtruth = coco_tools.COCOWrapper(self._groundtruth_dict)
|
|
detections = groundtruth.LoadAnnotations(self._detections_list)
|
|
evaluator = coco_tools.COCOEvalWrapper(groundtruth, detections)
|
|
summary_metrics, _ = evaluator.ComputeMetrics()
|
|
self.assertAlmostEqual(1.0, summary_metrics['Precision/mAP'])
|
|
|
|
def testExportGroundtruthToCOCO(self):
|
|
image_ids = ['first', 'second']
|
|
groundtruth_boxes = [np.array([[100, 100, 200, 200]], np.float),
|
|
np.array([[50, 50, 100, 100]], np.float)]
|
|
groundtruth_classes = [np.array([1], np.int32), np.array([1], np.int32)]
|
|
categories = [{'id': 0, 'name': 'person'},
|
|
{'id': 1, 'name': 'cat'},
|
|
{'id': 2, 'name': 'dog'}]
|
|
output_path = os.path.join(tf.test.get_temp_dir(), 'groundtruth.json')
|
|
result = coco_tools.ExportGroundtruthToCOCO(
|
|
image_ids,
|
|
groundtruth_boxes,
|
|
groundtruth_classes,
|
|
categories,
|
|
output_path=output_path)
|
|
self.assertDictEqual(result, self._groundtruth_dict)
|
|
with tf.gfile.GFile(output_path, 'r') as f:
|
|
written_result = f.read()
|
|
# The json output should have floats written to 4 digits of precision.
|
|
matcher = re.compile(r'"bbox":\s+\[\n\s+\d+.\d\d\d\d,', re.MULTILINE)
|
|
self.assertTrue(matcher.findall(written_result))
|
|
written_result = json.loads(written_result)
|
|
self.assertAlmostEqual(result, written_result)
|
|
|
|
def testExportDetectionsToCOCO(self):
|
|
image_ids = ['first', 'second']
|
|
detections_boxes = [np.array([[100, 100, 200, 200]], np.float),
|
|
np.array([[50, 50, 100, 100]], np.float)]
|
|
detections_scores = [np.array([.8], np.float), np.array([.7], np.float)]
|
|
detections_classes = [np.array([1], np.int32), np.array([1], np.int32)]
|
|
categories = [{'id': 0, 'name': 'person'},
|
|
{'id': 1, 'name': 'cat'},
|
|
{'id': 2, 'name': 'dog'}]
|
|
output_path = os.path.join(tf.test.get_temp_dir(), 'detections.json')
|
|
result = coco_tools.ExportDetectionsToCOCO(
|
|
image_ids,
|
|
detections_boxes,
|
|
detections_scores,
|
|
detections_classes,
|
|
categories,
|
|
output_path=output_path)
|
|
self.assertListEqual(result, self._detections_list)
|
|
with tf.gfile.GFile(output_path, 'r') as f:
|
|
written_result = f.read()
|
|
# The json output should have floats written to 4 digits of precision.
|
|
matcher = re.compile(r'"bbox":\s+\[\n\s+\d+.\d\d\d\d,', re.MULTILINE)
|
|
self.assertTrue(matcher.findall(written_result))
|
|
written_result = json.loads(written_result)
|
|
self.assertAlmostEqual(result, written_result)
|
|
|
|
def testExportSegmentsToCOCO(self):
|
|
image_ids = ['first', 'second']
|
|
detection_masks = [np.array(
|
|
[[[0, 1, 0, 1], [0, 1, 1, 0], [0, 0, 0, 1], [0, 1, 0, 1]]],
|
|
dtype=np.uint8), np.array(
|
|
[[[0, 1, 0, 1], [0, 1, 1, 0], [0, 0, 0, 1], [0, 1, 0, 1]]],
|
|
dtype=np.uint8)]
|
|
|
|
for i, detection_mask in enumerate(detection_masks):
|
|
detection_masks[i] = detection_mask[:, :, :, None]
|
|
|
|
detection_scores = [np.array([.8], np.float), np.array([.7], np.float)]
|
|
detection_classes = [np.array([1], np.int32), np.array([1], np.int32)]
|
|
|
|
categories = [{'id': 0, 'name': 'person'},
|
|
{'id': 1, 'name': 'cat'},
|
|
{'id': 2, 'name': 'dog'}]
|
|
output_path = os.path.join(tf.test.get_temp_dir(), 'segments.json')
|
|
result = coco_tools.ExportSegmentsToCOCO(
|
|
image_ids,
|
|
detection_masks,
|
|
detection_scores,
|
|
detection_classes,
|
|
categories,
|
|
output_path=output_path)
|
|
with tf.gfile.GFile(output_path, 'r') as f:
|
|
written_result = f.read()
|
|
written_result = json.loads(written_result)
|
|
mask_load = mask.decode([written_result[0]['segmentation']])
|
|
self.assertTrue(np.allclose(mask_load, detection_masks[0]))
|
|
self.assertAlmostEqual(result, written_result)
|
|
|
|
def testExportKeypointsToCOCO(self):
|
|
image_ids = ['first', 'second']
|
|
detection_keypoints = [
|
|
np.array(
|
|
[[[100, 200], [300, 400], [500, 600]],
|
|
[[50, 150], [250, 350], [450, 550]]], dtype=np.int32),
|
|
np.array(
|
|
[[[110, 210], [310, 410], [510, 610]],
|
|
[[60, 160], [260, 360], [460, 560]]], dtype=np.int32)]
|
|
|
|
detection_scores = [np.array([.8, 0.2], np.float),
|
|
np.array([.7, 0.3], np.float)]
|
|
detection_classes = [np.array([1, 1], np.int32), np.array([1, 1], np.int32)]
|
|
|
|
categories = [{'id': 1, 'name': 'person', 'num_keypoints': 3},
|
|
{'id': 2, 'name': 'cat'},
|
|
{'id': 3, 'name': 'dog'}]
|
|
|
|
output_path = os.path.join(tf.test.get_temp_dir(), 'keypoints.json')
|
|
result = coco_tools.ExportKeypointsToCOCO(
|
|
image_ids,
|
|
detection_keypoints,
|
|
detection_scores,
|
|
detection_classes,
|
|
categories,
|
|
output_path=output_path)
|
|
|
|
with tf.gfile.GFile(output_path, 'r') as f:
|
|
written_result = f.read()
|
|
written_result = json.loads(written_result)
|
|
self.assertAlmostEqual(result, written_result)
|
|
|
|
def testSingleImageDetectionBoxesExport(self):
|
|
boxes = np.array([[0, 0, 1, 1],
|
|
[0, 0, .5, .5],
|
|
[.5, .5, 1, 1]], dtype=np.float32)
|
|
classes = np.array([1, 2, 3], dtype=np.int32)
|
|
scores = np.array([0.8, 0.2, 0.7], dtype=np.float32)
|
|
coco_boxes = np.array([[0, 0, 1, 1],
|
|
[0, 0, .5, .5],
|
|
[.5, .5, .5, .5]], dtype=np.float32)
|
|
coco_annotations = coco_tools.ExportSingleImageDetectionBoxesToCoco(
|
|
image_id='first_image',
|
|
category_id_set=set([1, 2, 3]),
|
|
detection_boxes=boxes,
|
|
detection_classes=classes,
|
|
detection_scores=scores)
|
|
for i, annotation in enumerate(coco_annotations):
|
|
self.assertEqual(annotation['image_id'], 'first_image')
|
|
self.assertEqual(annotation['category_id'], classes[i])
|
|
self.assertAlmostEqual(annotation['score'], scores[i])
|
|
self.assertTrue(np.all(np.isclose(annotation['bbox'], coco_boxes[i])))
|
|
|
|
def testSingleImageDetectionMaskExport(self):
|
|
masks = np.array(
|
|
[[[1, 1,], [1, 1]],
|
|
[[0, 0], [0, 1]],
|
|
[[0, 0], [0, 0]]], dtype=np.uint8)
|
|
classes = np.array([1, 2, 3], dtype=np.int32)
|
|
scores = np.array([0.8, 0.2, 0.7], dtype=np.float32)
|
|
coco_annotations = coco_tools.ExportSingleImageDetectionMasksToCoco(
|
|
image_id='first_image',
|
|
category_id_set=set([1, 2, 3]),
|
|
detection_classes=classes,
|
|
detection_scores=scores,
|
|
detection_masks=masks)
|
|
expected_counts = ['04', '31', '4']
|
|
for i, mask_annotation in enumerate(coco_annotations):
|
|
self.assertEqual(mask_annotation['segmentation']['counts'],
|
|
expected_counts[i])
|
|
self.assertTrue(np.all(np.equal(mask.decode(
|
|
mask_annotation['segmentation']), masks[i])))
|
|
self.assertEqual(mask_annotation['image_id'], 'first_image')
|
|
self.assertEqual(mask_annotation['category_id'], classes[i])
|
|
self.assertAlmostEqual(mask_annotation['score'], scores[i])
|
|
|
|
def testSingleImageGroundtruthExport(self):
|
|
masks = np.array(
|
|
[[[1, 1,], [1, 1]],
|
|
[[0, 0], [0, 1]],
|
|
[[0, 0], [0, 0]]], dtype=np.uint8)
|
|
boxes = np.array([[0, 0, 1, 1],
|
|
[0, 0, .5, .5],
|
|
[.5, .5, 1, 1]], dtype=np.float32)
|
|
coco_boxes = np.array([[0, 0, 1, 1],
|
|
[0, 0, .5, .5],
|
|
[.5, .5, .5, .5]], dtype=np.float32)
|
|
classes = np.array([1, 2, 3], dtype=np.int32)
|
|
is_crowd = np.array([0, 1, 0], dtype=np.int32)
|
|
next_annotation_id = 1
|
|
expected_counts = ['04', '31', '4']
|
|
|
|
# Tests exporting without passing in is_crowd (for backward compatibility).
|
|
coco_annotations = coco_tools.ExportSingleImageGroundtruthToCoco(
|
|
image_id='first_image',
|
|
category_id_set=set([1, 2, 3]),
|
|
next_annotation_id=next_annotation_id,
|
|
groundtruth_boxes=boxes,
|
|
groundtruth_classes=classes,
|
|
groundtruth_masks=masks)
|
|
for i, annotation in enumerate(coco_annotations):
|
|
self.assertEqual(annotation['segmentation']['counts'],
|
|
expected_counts[i])
|
|
self.assertTrue(np.all(np.equal(mask.decode(
|
|
annotation['segmentation']), masks[i])))
|
|
self.assertTrue(np.all(np.isclose(annotation['bbox'], coco_boxes[i])))
|
|
self.assertEqual(annotation['image_id'], 'first_image')
|
|
self.assertEqual(annotation['category_id'], classes[i])
|
|
self.assertEqual(annotation['id'], i + next_annotation_id)
|
|
|
|
# Tests exporting with is_crowd.
|
|
coco_annotations = coco_tools.ExportSingleImageGroundtruthToCoco(
|
|
image_id='first_image',
|
|
category_id_set=set([1, 2, 3]),
|
|
next_annotation_id=next_annotation_id,
|
|
groundtruth_boxes=boxes,
|
|
groundtruth_classes=classes,
|
|
groundtruth_masks=masks,
|
|
groundtruth_is_crowd=is_crowd)
|
|
for i, annotation in enumerate(coco_annotations):
|
|
self.assertEqual(annotation['segmentation']['counts'],
|
|
expected_counts[i])
|
|
self.assertTrue(np.all(np.equal(mask.decode(
|
|
annotation['segmentation']), masks[i])))
|
|
self.assertTrue(np.all(np.isclose(annotation['bbox'], coco_boxes[i])))
|
|
self.assertEqual(annotation['image_id'], 'first_image')
|
|
self.assertEqual(annotation['category_id'], classes[i])
|
|
self.assertEqual(annotation['iscrowd'], is_crowd[i])
|
|
self.assertEqual(annotation['id'], i + next_annotation_id)
|
|
|
|
|
|
if __name__ == '__main__':
|
|
tf.test.main()
|