yigitcolakoglu
/
MyCity

# Copyright 2017 The TensorFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Model input function for tf-learn object detection model."""
from __future__ import absolute_importfrom __future__ import divisionfrom __future__ import print_function
import functools
import tensorflow as tffrom object_detection.builders import dataset_builderfrom object_detection.builders import image_resizer_builderfrom object_detection.builders import model_builderfrom object_detection.builders import preprocessor_builderfrom object_detection.core import preprocessorfrom object_detection.core import standard_fields as fieldsfrom object_detection.data_decoders import tf_example_decoderfrom object_detection.protos import eval_pb2from object_detection.protos import input_reader_pb2from object_detection.protos import model_pb2from object_detection.protos import train_pb2from object_detection.utils import config_utilfrom object_detection.utils import ops as util_opsfrom object_detection.utils import shape_utils
# Key under which the int32 hash of an example's source id is stored in the
# features dictionary.
HASH_KEY = 'hash'
# Number of buckets used when hashing source ids.
HASH_BINS = 2 ** 31
# Key of the receiver tensor that carries the serialized example at serving
# time.
SERVING_FED_EXAMPLE_KEY = 'serialized_example'
# Name -> builder callable lookup used when assembling the input pipeline.
# The functions in this module fetch the dataset and model builders through
# this table rather than calling them directly.
INPUT_BUILDER_UTIL_MAP = dict(
    dataset_build=dataset_builder.build,
    model_build=model_builder.build,
)

def transform_input_data(tensor_dict,
                         model_preprocess_fn,
                         image_resizer_fn,
                         num_classes,
                         data_augmentation_fn=None,
                         merge_multiple_boxes=False,
                         retain_original_image=False,
                         use_multiclass_scores=False,
                         use_bfloat16=False):
  """A single function that is responsible for all input data transformations.

  The dictionary passed in by the caller is not modified: every insertion,
  replacement and removal below is done on a shallow copy, and that copy (or
  a dictionary derived from it) is what is returned.

  Data transformation functions are applied in the following order.
  1. If fields.InputDataFields.multiclass_scores is present, it is reshaped to
     [num_boxes, num_classes].
  2. If fields.InputDataFields.groundtruth_boxes is present, groundtruth with
     NaN box coordinates and unrecognized classes is filtered out.
  3. retain_original_image (optional): a resized uint8 copy of the image is
     stored under fields.InputDataFields.original_image. This happens before
     any additional channels are merged into the image.
  4. If key fields.InputDataFields.image_additional_channels is present in
     tensor_dict, the additional channels will be merged into
     fields.InputDataFields.image.
  5. data_augmentation_fn (optional): applied on tensor_dict.
  6. model_preprocess_fn: applied only on image tensor in tensor_dict.
  7. image_resizer_fn: applied on the (un-preprocessed) image and instance
     mask tensor in tensor_dict.
  8. one_hot_encoding: applied to classes tensor in tensor_dict.
  9. merge_multiple_boxes (optional): when groundtruth boxes are exactly the
     same they can be merged into a single box with an associated k-hot class
     label.

  Args:
    tensor_dict: dictionary containing input tensors keyed by
      fields.InputDataFields. Must contain fields.InputDataFields.image and
      fields.InputDataFields.groundtruth_classes.
    model_preprocess_fn: model's preprocess function to apply on image tensor.
      This function must take in a 4-D float tensor and return a 4-D preprocess
      float tensor and a tensor containing the true image shape.
    image_resizer_fn: image resizer function to apply on groundtruth instance
      masks. This function must take a 3-D float tensor of an image and a 3-D
      tensor of instance masks and return a resized version of these along with
      the true shapes.
    num_classes: number of max classes to one-hot (or k-hot) encode the class
      labels.
    data_augmentation_fn: (optional) data augmentation function to apply on
      input `tensor_dict`.
    merge_multiple_boxes: (optional) whether to merge multiple groundtruth boxes
      and classes for a given image if the boxes are exactly the same.
    retain_original_image: (optional) whether to retain original image in the
      output dictionary.
    use_multiclass_scores: whether to use multiclass scores as
      class targets instead of one-hot encoding of `groundtruth_classes`.
      When True, fields.InputDataFields.multiclass_scores must be present.
    use_bfloat16: (optional) a bool, whether to use bfloat16 in training.

  Returns:
    A dictionary keyed by fields.InputDataFields containing the tensors obtained
    after applying all the transformations.
  """
  input_fields = fields.InputDataFields

  # Shallow copy: the tensors themselves are shared, but the key insertions,
  # replacements and the `pop` below no longer leak into the caller's dict.
  tensor_dict = dict(tensor_dict)

  # Reshape flattened multiclass scores tensor into a 2D tensor of shape
  # [num_boxes, num_classes].
  if input_fields.multiclass_scores in tensor_dict:
    tensor_dict[input_fields.multiclass_scores] = tf.reshape(
        tensor_dict[input_fields.multiclass_scores], [
            tf.shape(tensor_dict[input_fields.groundtruth_boxes])[0],
            num_classes
        ])
  if input_fields.groundtruth_boxes in tensor_dict:
    tensor_dict = util_ops.filter_groundtruth_with_nan_box_coordinates(
        tensor_dict)
    tensor_dict = util_ops.filter_unrecognized_classes(tensor_dict)

  # The retained original image is taken before additional channels are
  # concatenated and before any augmentation.
  if retain_original_image:
    tensor_dict[input_fields.original_image] = tf.cast(
        image_resizer_fn(tensor_dict[input_fields.image], None)[0],
        tf.uint8)

  if input_fields.image_additional_channels in tensor_dict:
    channels = tensor_dict[input_fields.image_additional_channels]
    tensor_dict[input_fields.image] = tf.concat(
        [tensor_dict[input_fields.image], channels], axis=2)

  # Apply data augmentation ops.
  if data_augmentation_fn is not None:
    tensor_dict = data_augmentation_fn(tensor_dict)

  # Apply model preprocessing ops and resize instance masks. The preprocess
  # function is fed a batch of one image; the batch axis is squeezed away
  # again afterwards.
  image = tensor_dict[input_fields.image]
  preprocessed_resized_image, true_image_shape = model_preprocess_fn(
      tf.expand_dims(tf.cast(image, dtype=tf.float32), axis=0))
  if use_bfloat16:
    preprocessed_resized_image = tf.cast(
        preprocessed_resized_image, tf.bfloat16)
  tensor_dict[input_fields.image] = tf.squeeze(
      preprocessed_resized_image, axis=0)
  tensor_dict[input_fields.true_image_shape] = tf.squeeze(
      true_image_shape, axis=0)
  if input_fields.groundtruth_instance_masks in tensor_dict:
    masks = tensor_dict[input_fields.groundtruth_instance_masks]
    # Only the resized masks are kept; the resized image and the shape
    # returned alongside them are discarded.
    _, resized_masks, _ = image_resizer_fn(image, masks)
    if use_bfloat16:
      resized_masks = tf.cast(resized_masks, tf.bfloat16)
    tensor_dict[input_fields.groundtruth_instance_masks] = resized_masks

  # Transform groundtruth classes to one hot encodings. Incoming class ids are
  # shifted down by `label_offset` before encoding.
  label_offset = 1
  zero_indexed_groundtruth_classes = (
      tensor_dict[input_fields.groundtruth_classes] - label_offset)
  tensor_dict[input_fields.groundtruth_classes] = tf.one_hot(
      zero_indexed_groundtruth_classes, num_classes)

  if use_multiclass_scores:
    tensor_dict[input_fields.groundtruth_classes] = tensor_dict[
        input_fields.multiclass_scores]
  # The scores are never part of the output, whether or not they were used.
  tensor_dict.pop(input_fields.multiclass_scores, None)

  if input_fields.groundtruth_confidences in tensor_dict:
    groundtruth_confidences = tensor_dict[
        input_fields.groundtruth_confidences]
    # Map the confidences to the one-hot encoding of classes
    tensor_dict[input_fields.groundtruth_confidences] = (
        tf.reshape(groundtruth_confidences, [-1, 1]) *
        tensor_dict[input_fields.groundtruth_classes])
  else:
    # No confidences supplied: use a confidence of one per box (needed by the
    # merge step below) and reuse the class encoding as the confidence tensor.
    groundtruth_confidences = tf.ones_like(
        zero_indexed_groundtruth_classes, dtype=tf.float32)
    tensor_dict[input_fields.groundtruth_confidences] = (
        tensor_dict[input_fields.groundtruth_classes])

  if merge_multiple_boxes:
    merged_boxes, merged_classes, merged_confidences, _ = (
        util_ops.merge_boxes_with_multiple_labels(
            tensor_dict[input_fields.groundtruth_boxes],
            zero_indexed_groundtruth_classes,
            groundtruth_confidences,
            num_classes))
    merged_classes = tf.cast(merged_classes, tf.float32)
    tensor_dict[input_fields.groundtruth_boxes] = merged_boxes
    tensor_dict[input_fields.groundtruth_classes] = merged_classes
    tensor_dict[input_fields.groundtruth_confidences] = merged_confidences
  if input_fields.groundtruth_boxes in tensor_dict:
    # Recorded after merging so the count matches the boxes that are returned.
    tensor_dict[input_fields.num_groundtruth_boxes] = tf.shape(
        tensor_dict[input_fields.groundtruth_boxes])[0]

  return tensor_dict

def pad_input_data_to_static_shapes(tensor_dict, max_num_boxes, num_classes,
                                    spatial_image_shape=None):
  """Pads (or clips) input tensors to static shapes.

  In case num_additional_channels > 0, we assume that the additional channels
  have already been concatenated to the base image.

  Args:
    tensor_dict: Tensor dictionary of input data
    max_num_boxes: Max number of groundtruth boxes needed to compute shapes for
      padding.
    num_classes: Number of classes in the dataset needed to compute shapes for
      padding.
    spatial_image_shape: A list or tuple of two integers of the form
      [height, width] containing expected spatial shape of the image. If it is
      empty, None, or equal to [-1, -1], the spatial dimensions are passed to
      the padding routine as None.

  Returns:
    A new dictionary with the same keys as `tensor_dict`, in which every tensor
    has been passed through `shape_utils.pad_or_clip_nd` with its target shape,
    and in which `num_groundtruth_boxes` (if present) is capped at
    `max_num_boxes`.

  Raises:
    ValueError: If we detect that additional channels have not been
      concatenated to the image yet.
    KeyError: If `tensor_dict` contains a key for which no padding shape is
      defined here.
  """
  input_fields = fields.InputDataFields

  # Compare as a list so that a tuple (-1, -1) is recognised as the
  # "unspecified" sentinel too, instead of being taken as a size of -1.
  if not spatial_image_shape or list(spatial_image_shape) == [-1, -1]:
    height, width = None, None
  else:
    height, width = spatial_image_shape  # pylint: disable=unpacking-non-sequence

  num_additional_channels = 0
  if input_fields.image_additional_channels in tensor_dict:
    num_additional_channels = shape_utils.get_dim_as_int(
        tensor_dict[input_fields.image_additional_channels].shape[2])

  # We assume that if num_additional_channels > 0, then it has already been
  # concatenated to the base image (but not the ground truth).
  num_channels = 3
  if input_fields.image in tensor_dict:
    num_channels = shape_utils.get_dim_as_int(
        tensor_dict[input_fields.image].shape[2])

  if num_additional_channels:
    # A concatenated image must have strictly more channels than the
    # additional channels alone.
    if num_additional_channels >= num_channels:
      raise ValueError(
          'Image must be already concatenated with additional channels.')

    if (input_fields.original_image in tensor_dict and
        shape_utils.get_dim_as_int(
            tensor_dict[input_fields.original_image].shape[2]) ==
        num_channels):
      raise ValueError(
          'Image must be already concatenated with additional channels.')

  padding_shapes = {
      input_fields.image: [height, width, num_channels],
      input_fields.original_image_spatial_shape: [2],
      input_fields.image_additional_channels: [
          height, width, num_additional_channels
      ],
      input_fields.source_id: [],
      input_fields.filename: [],
      input_fields.key: [],
      input_fields.groundtruth_difficult: [max_num_boxes],
      input_fields.groundtruth_boxes: [max_num_boxes, 4],
      input_fields.groundtruth_classes: [max_num_boxes, num_classes],
      input_fields.groundtruth_instance_masks: [
          max_num_boxes, height, width
      ],
      input_fields.groundtruth_is_crowd: [max_num_boxes],
      input_fields.groundtruth_group_of: [max_num_boxes],
      input_fields.groundtruth_area: [max_num_boxes],
      input_fields.groundtruth_weights: [max_num_boxes],
      input_fields.groundtruth_confidences: [max_num_boxes, num_classes],
      input_fields.num_groundtruth_boxes: [],
      input_fields.groundtruth_label_types: [max_num_boxes],
      input_fields.groundtruth_label_weights: [max_num_boxes],
      input_fields.true_image_shape: [3],
      input_fields.groundtruth_image_classes: [num_classes],
      input_fields.groundtruth_image_confidences: [num_classes],
  }

  # The remaining shapes depend on dimensions of the tensors themselves, so
  # they are only added when the corresponding tensor is present.
  if input_fields.original_image in tensor_dict:
    padding_shapes[input_fields.original_image] = [
        height, width,
        shape_utils.get_dim_as_int(
            tensor_dict[input_fields.original_image].shape[2])
    ]
  if input_fields.groundtruth_keypoints in tensor_dict:
    tensor_shape = tensor_dict[input_fields.groundtruth_keypoints].shape
    padding_shapes[input_fields.groundtruth_keypoints] = [
        max_num_boxes,
        shape_utils.get_dim_as_int(tensor_shape[1]),
        shape_utils.get_dim_as_int(tensor_shape[2])
    ]
  if input_fields.groundtruth_keypoint_visibilities in tensor_dict:
    tensor_shape = (
        tensor_dict[input_fields.groundtruth_keypoint_visibilities].shape)
    padding_shapes[input_fields.groundtruth_keypoint_visibilities] = [
        max_num_boxes, shape_utils.get_dim_as_int(tensor_shape[1])
    ]

  padded_tensor_dict = {
      tensor_name: shape_utils.pad_or_clip_nd(
          tensor, padding_shapes[tensor_name])
      for tensor_name, tensor in tensor_dict.items()
  }

  # Make sure that the number of groundtruth boxes now reflects the
  # padded/clipped tensors.
  if input_fields.num_groundtruth_boxes in padded_tensor_dict:
    padded_tensor_dict[input_fields.num_groundtruth_boxes] = tf.minimum(
        padded_tensor_dict[input_fields.num_groundtruth_boxes],
        max_num_boxes)
  return padded_tensor_dict

def augment_input_data(tensor_dict, data_augmentation_options):
  """Runs the configured augmentation ops over a dictionary of input tensors.

  The image entry of `tensor_dict` is replaced in place by a float32 version
  with a leading axis of size one before the ops run; that axis is squeezed
  away again on the result.

  Args:
    tensor_dict: A dictionary of input tensors keyed by fields.InputDataFields.
      Must contain fields.InputDataFields.image.
    data_augmentation_options: A list of tuples, where each tuple contains a
      function and a dictionary that contains arguments and their values.
      Usually, this is the output of core/preprocessor.build.

  Returns:
    A dictionary of tensors obtained by applying data augmentation ops to the
    input tensor dictionary.
  """
  input_fields = fields.InputDataFields
  image_key = input_fields.image

  float_image = tf.cast(tensor_dict[image_key], dtype=tf.float32)
  tensor_dict[image_key] = tf.expand_dims(float_image, 0)

  # Optional groundtruth is only routed through the augmentation ops when the
  # corresponding key is actually present.
  func_arg_map = preprocessor.get_default_func_arg_map(
      include_label_weights=input_fields.groundtruth_weights in tensor_dict,
      include_label_confidences=(
          input_fields.groundtruth_confidences in tensor_dict),
      include_multiclass_scores=(
          input_fields.multiclass_scores in tensor_dict),
      include_instance_masks=(
          input_fields.groundtruth_instance_masks in tensor_dict),
      include_keypoints=input_fields.groundtruth_keypoints in tensor_dict)

  augmented = preprocessor.preprocess(
      tensor_dict, data_augmentation_options, func_arg_map=func_arg_map)
  augmented[image_key] = tf.squeeze(augmented[image_key], axis=0)
  return augmented

def _get_labels_dict(input_dict):
  """Builds the labels dictionary out of the groundtruth entries of an input.

  Args:
    input_dict: A dictionary keyed by fields.InputDataFields. The box count,
      boxes, classes and weights entries are mandatory (a missing one raises
      KeyError); the other groundtruth entries are copied only if present.

  Returns:
    A new dictionary holding the selected groundtruth tensors, with
    `groundtruth_difficult` (when present) cast to int32.
  """
  input_fields = fields.InputDataFields
  mandatory_keys = (
      input_fields.num_groundtruth_boxes,
      input_fields.groundtruth_boxes,
      input_fields.groundtruth_classes,
      input_fields.groundtruth_weights,
  )
  optional_keys = (
      input_fields.groundtruth_confidences,
      input_fields.groundtruth_keypoints,
      input_fields.groundtruth_instance_masks,
      input_fields.groundtruth_area,
      input_fields.groundtruth_is_crowd,
      input_fields.groundtruth_difficult,
  )

  labels = {key: input_dict[key] for key in mandatory_keys}
  labels.update(
      (key, input_dict[key]) for key in optional_keys if key in input_dict)

  difficult_key = input_fields.groundtruth_difficult
  if difficult_key in labels:
    labels[difficult_key] = tf.cast(labels[difficult_key], tf.int32)
  return labels

def _replace_empty_string_with_random_number(string_tensor):
  """Substitutes a random numeric string for an empty string tensor.

  The replacement is the string form of an int64 drawn with
  `tf.random_uniform(maxval=2**63 - 1)`.

  Args:
    string_tensor: A tf.tensor of dtype string. It is used as the operand of a
      `tf.cond` predicate, so it is presumably a scalar.

  Returns:
    A tf.tensor of dtype string: the random integer rendered as a string when
    `string_tensor` equals the empty string, `string_tensor` itself otherwise.
  """
  blank = tf.constant('', dtype=tf.string, name='EmptyString')
  random_int = tf.random_uniform(shape=[], maxval=2**63 - 1, dtype=tf.int64)
  random_string = tf.as_string(random_int)
  is_blank = tf.equal(string_tensor, blank)
  return tf.cond(
      is_blank,
      true_fn=lambda: random_string,
      false_fn=lambda: string_tensor)

def _get_features_dict(input_dict):
  """Builds the features dictionary out of the image entries of an input.

  Args:
    input_dict: A dictionary keyed by fields.InputDataFields. Must contain the
      source id, image, true image shape and original image spatial shape;
      the original image is optional.

  Returns:
    A new dictionary with the image, the true image shape, the original image
    spatial shape, an int32 hash of the source id under HASH_KEY and, when
    available, the original image.
  """
  input_fields = fields.InputDataFields

  # An empty source id is replaced by a random string before hashing.
  source_id = _replace_empty_string_with_random_number(
      input_dict[input_fields.source_id])
  hashed_source_id = tf.string_to_hash_bucket_fast(source_id, HASH_BINS)

  features = {}
  features[input_fields.image] = input_dict[input_fields.image]
  features[HASH_KEY] = tf.cast(hashed_source_id, tf.int32)
  for key in (input_fields.true_image_shape,
              input_fields.original_image_spatial_shape):
    features[key] = input_dict[key]

  if input_fields.original_image in input_dict:
    features[input_fields.original_image] = (
        input_dict[input_fields.original_image])
  return features

def create_train_input_fn(train_config, train_input_config,
                          model_config):
  """Builds the training `input_fn` handed to an `Estimator`.

  Args:
    train_config: A train_pb2.TrainConfig.
    train_input_config: An input_reader_pb2.InputReader.
    model_config: A model_pb2.DetectionModel.

  Returns:
    A callable taking an optional `params` dictionary that forwards the three
    configs, together with `params`, to `train_input` and returns its result.
  """

  def _train_input_fn(params=None):
    return train_input(
        train_config=train_config,
        train_input_config=train_input_config,
        model_config=model_config,
        params=params)

  return _train_input_fn

def train_input(train_config, train_input_config,
                model_config, model=None, params=None):
  """Builds the training dataset of (features, labels) dictionaries.

  Args:
    train_config: A train_pb2.TrainConfig.
    train_input_config: An input_reader_pb2.InputReader.
    model_config: A model_pb2.DetectionModel.
    model: A pre-constructed Detection Model whose `preprocess` method is
      used. If None, a model is built from `model_config` with
      `is_training=True`.
    params: Parameter dictionary passed from the estimator. When non-empty,
      its 'batch_size' entry overrides `train_config.batch_size`.

  Returns:
    A tf.data.Dataset that holds (features, labels) tuple.

    features: Dictionary of feature tensors.
      features[fields.InputDataFields.image] is a [batch_size, H, W, C]
        float32 tensor with preprocessed images.
      features[HASH_KEY] is a [batch_size] int32 tensor representing unique
        identifiers for the images.
      features[fields.InputDataFields.true_image_shape] is a [batch_size, 3]
        int32 tensor representing the true image shapes, as preprocessed
        images could be padded.
      features[fields.InputDataFields.original_image] (optional) is a
        [batch_size, H, W, C] float32 tensor with original images.
    labels: Dictionary of groundtruth tensors.
      labels[fields.InputDataFields.num_groundtruth_boxes] is a [batch_size]
        int32 tensor indicating the number of groundtruth boxes.
      labels[fields.InputDataFields.groundtruth_boxes] is a
        [batch_size, num_boxes, 4] float32 tensor containing the corners of
        the groundtruth boxes.
      labels[fields.InputDataFields.groundtruth_classes] is a
        [batch_size, num_boxes, num_classes] float32 one-hot tensor of
        classes.
      labels[fields.InputDataFields.groundtruth_weights] is a
        [batch_size, num_boxes] float32 tensor containing groundtruth weights
        for the boxes.
      -- Optional --
      labels[fields.InputDataFields.groundtruth_instance_masks] is a
        [batch_size, num_boxes, H, W] float32 tensor containing only binary
        values, which represent instance masks for objects.
      labels[fields.InputDataFields.groundtruth_keypoints] is a
        [batch_size, num_boxes, num_keypoints, 2] float32 tensor containing
        keypoints for each box.

  Raises:
    TypeError: if the `train_config`, `train_input_config` or `model_config`
      are not of the correct type.
  """
  # Each config is checked against its proto type, in argument order.
  type_checks = (
      (train_config, train_pb2.TrainConfig,
       'For training mode, the `train_config` must be a '
       'train_pb2.TrainConfig.'),
      (train_input_config, input_reader_pb2.InputReader,
       'The `train_input_config` must be a '
       'input_reader_pb2.InputReader.'),
      (model_config, model_pb2.DetectionModel,
       'The `model_config` must be a '
       'model_pb2.DetectionModel.'),
  )
  for config, proto_type, message in type_checks:
    if not isinstance(config, proto_type):
      raise TypeError(message)

  if model is not None:
    model_preprocess_fn = model.preprocess
  else:
    model_preprocess_fn = INPUT_BUILDER_UTIL_MAP['model_build'](
        model_config, is_training=True).preprocess

  def transform_and_pad_input_data_fn(tensor_dict):
    """Transforms one example, pads it, and splits it into features/labels."""
    augmentation_steps = [
        preprocessor_builder.build(step)
        for step in train_config.data_augmentation_options
    ]
    augmentation_fn = functools.partial(
        augment_input_data,
        data_augmentation_options=augmentation_steps)

    resizer_config = config_util.get_image_resizer_config(model_config)
    resizer_fn = image_resizer_builder.build(resizer_config)

    transformed = transform_input_data(
        tensor_dict,
        model_preprocess_fn=model_preprocess_fn,
        image_resizer_fn=resizer_fn,
        num_classes=config_util.get_number_of_classes(model_config),
        data_augmentation_fn=augmentation_fn,
        merge_multiple_boxes=train_config.merge_multiple_label_boxes,
        retain_original_image=train_config.retain_original_images,
        use_multiclass_scores=train_config.use_multiclass_scores,
        use_bfloat16=train_config.use_bfloat16)

    padded = pad_input_data_to_static_shapes(
        tensor_dict=transformed,
        max_num_boxes=train_input_config.max_number_of_boxes,
        num_classes=config_util.get_number_of_classes(model_config),
        spatial_image_shape=config_util.get_spatial_image_size(
            resizer_config))
    return (_get_features_dict(padded), _get_labels_dict(padded))

  # A non-empty `params` takes precedence over the config for the batch size.
  if params:
    batch_size = params['batch_size']
  else:
    batch_size = train_config.batch_size

  return INPUT_BUILDER_UTIL_MAP['dataset_build'](
      train_input_config,
      transform_input_data_fn=transform_and_pad_input_data_fn,
      batch_size=batch_size)

def create_eval_input_fn(eval_config, eval_input_config, model_config):
  """Builds the evaluation `input_fn` handed to an `Estimator`.

  Args:
    eval_config: An eval_pb2.EvalConfig.
    eval_input_config: An input_reader_pb2.InputReader.
    model_config: A model_pb2.DetectionModel.

  Returns:
    A callable taking an optional `params` dictionary that forwards the three
    configs, together with `params`, to `eval_input` and returns its result.
  """

  def _eval_input_fn(params=None):
    return eval_input(
        eval_config=eval_config,
        eval_input_config=eval_input_config,
        model_config=model_config,
        params=params)

  return _eval_input_fn

def eval_input(eval_config, eval_input_config, model_config,
               model=None, params=None):
  """Returns `features` and `labels` tensor dictionaries for evaluation.

  No data augmentation is applied in this mode.

  Args:
    eval_config: An eval_pb2.EvalConfig.
    eval_input_config: An input_reader_pb2.InputReader.
    model_config: A model_pb2.DetectionModel.
    model: A pre-constructed Detection Model whose `preprocess` method is
      used. If None, one will be created from the config with
      `is_training=False`.
    params: Parameter dictionary passed from the estimator. When non-empty,
      its 'batch_size' entry overrides `eval_config.batch_size`.

  Returns:
    A tf.data.Dataset that holds (features, labels) tuple.

    features: Dictionary of feature tensors.
      features[fields.InputDataFields.image] is a [1, H, W, C] float32 tensor
        with preprocessed images.
      features[HASH_KEY] is a [1] int32 tensor representing unique
        identifiers for the images.
      features[fields.InputDataFields.true_image_shape] is a [1, 3]
        int32 tensor representing the true image shapes, as preprocessed
        images could be padded.
      features[fields.InputDataFields.original_image] is a [1, H', W', C]
        float32 tensor with the original image.
    labels: Dictionary of groundtruth tensors.
      labels[fields.InputDataFields.groundtruth_boxes] is a [1, num_boxes, 4]
        float32 tensor containing the corners of the groundtruth boxes.
      labels[fields.InputDataFields.groundtruth_classes] is a
        [1, num_boxes, num_classes] float32 one-hot tensor of classes.
      labels[fields.InputDataFields.groundtruth_area] is a [1, num_boxes]
        float32 tensor containing object areas.
      labels[fields.InputDataFields.groundtruth_is_crowd] is a [1, num_boxes]
        bool tensor indicating if the boxes enclose a crowd.
      labels[fields.InputDataFields.groundtruth_difficult] is a [1, num_boxes]
        int32 tensor indicating if the boxes represent difficult instances.
      -- Optional --
      labels[fields.InputDataFields.groundtruth_instance_masks] is a
        [1, num_boxes, H, W] float32 tensor containing only binary values,
        which represent instance masks for objects.

  Raises:
    TypeError: if the `eval_config`, `eval_input_config` or `model_config`
      are not of the correct type.
  """
  params = params or {}
  if not isinstance(eval_config, eval_pb2.EvalConfig):
    # The message names the module the check is actually made against.
    raise TypeError('For eval mode, the `eval_config` must be a '
                    'eval_pb2.EvalConfig.')
  if not isinstance(eval_input_config, input_reader_pb2.InputReader):
    raise TypeError('The `eval_input_config` must be a '
                    'input_reader_pb2.InputReader.')
  if not isinstance(model_config, model_pb2.DetectionModel):
    raise TypeError('The `model_config` must be a '
                    'model_pb2.DetectionModel.')

  if model is None:
    model_preprocess_fn = INPUT_BUILDER_UTIL_MAP['model_build'](
        model_config, is_training=False).preprocess
  else:
    model_preprocess_fn = model.preprocess

  def transform_and_pad_input_data_fn(tensor_dict):
    """Combines transform and pad operation."""
    num_classes = config_util.get_number_of_classes(model_config)

    image_resizer_config = config_util.get_image_resizer_config(model_config)
    image_resizer_fn = image_resizer_builder.build(image_resizer_config)

    transform_data_fn = functools.partial(
        transform_input_data, model_preprocess_fn=model_preprocess_fn,
        image_resizer_fn=image_resizer_fn,
        num_classes=num_classes,
        data_augmentation_fn=None,
        retain_original_image=eval_config.retain_original_images)
    tensor_dict = pad_input_data_to_static_shapes(
        tensor_dict=transform_data_fn(tensor_dict),
        max_num_boxes=eval_input_config.max_number_of_boxes,
        num_classes=num_classes,
        spatial_image_shape=config_util.get_spatial_image_size(
            image_resizer_config))
    return (_get_features_dict(tensor_dict), _get_labels_dict(tensor_dict))

  # `params` was normalised to a dict above; a non-empty one takes precedence
  # over the config for the batch size.
  dataset = INPUT_BUILDER_UTIL_MAP['dataset_build'](
      eval_input_config,
      batch_size=params['batch_size'] if params else eval_config.batch_size,
      transform_input_data_fn=transform_and_pad_input_data_fn)
  return dataset

def create_predict_input_fn(model_config, predict_input_config):
  """Builds the prediction `input_fn` handed to an `Estimator`.

  Args:
    model_config: A model_pb2.DetectionModel.
    predict_input_config: An input_reader_pb2.InputReader.

  Returns:
    `input_fn` for `Estimator` in PREDICT mode.
  """

  def _predict_input_fn(params=None):
    """Turns a fed serialized tf.Example into a `ServingInputReceiver`.

    Args:
      params: Parameter dictionary passed from the estimator. Unused.

    Returns:
      A `ServingInputReceiver` whose features are the preprocessed image and
      its true shape, each with a leading axis of size one, and whose only
      receiver tensor is the scalar string placeholder for the example.
    """
    del params
    serialized_example = tf.placeholder(
        dtype=tf.string, shape=[], name='tf_example')

    num_classes = config_util.get_number_of_classes(model_config)
    detection_model = INPUT_BUILDER_UTIL_MAP['model_build'](
        model_config, is_training=False)
    model_preprocess_fn = detection_model.preprocess

    resizer_config = config_util.get_image_resizer_config(model_config)
    resizer_fn = image_resizer_builder.build(resizer_config)

    decoder = tf_example_decoder.TfExampleDecoder(
        load_instance_masks=False,
        num_additional_channels=predict_input_config.num_additional_channels)
    decoded = decoder.decode(serialized_example)

    # Same transformation as for training/eval inputs, without augmentation.
    transformed = transform_input_data(
        decoded,
        model_preprocess_fn=model_preprocess_fn,
        image_resizer_fn=resizer_fn,
        num_classes=num_classes,
        data_augmentation_fn=None)

    input_fields = fields.InputDataFields
    batched_image = tf.expand_dims(
        tf.cast(transformed[input_fields.image], dtype=tf.float32), axis=0)
    batched_true_shape = tf.expand_dims(
        transformed[input_fields.true_image_shape], axis=0)

    features = {
        input_fields.image: batched_image,
        input_fields.true_image_shape: batched_true_shape,
    }
    return tf.estimator.export.ServingInputReceiver(
        features=features,
        receiver_tensors={SERVING_FED_EXAMPLE_KEY: serialized_example})

  return _predict_input_fn