tensorflow
diff --git a/‎tensorflow_examples/lite/model_maker/core/data_util/object_detector_dataloader.py
Lines changed: 283 additions & 0 deletions b/‎tensorflow_examples/lite/model_maker/core/data_util/object_detector_dataloader.py
Lines changed: 283 additions & 0 deletions
diff --git a/‎tensorflow_examples/lite/model_maker/core/data_util/object_detector_dataloader_test.py
Lines changed: 100 additions & 0 deletions b/‎tensorflow_examples/lite/model_maker/core/data_util/object_detector_dataloader_test.py
Lines changed: 100 additions & 0 deletions
@@ -0,0 +1,283 @@
+# Copyright 2020 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""Dataloader for object detection."""
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import glob
+import hashlib
+import json
+import os
+import tempfile
+
+from lxml import etree
+import tensorflow as tf
+from tensorflow_examples.lite.model_maker.core.data_util import dataloader
+import yaml
+
+HAS_OBJECT_DETECTION = True
+try:
+  # pylint: disable=g-import-not-at-top
+  from efficientdet import dataloader as det_dataloader
+  from efficientdet.dataset import create_pascal_tfrecord
+  from efficientdet.dataset import tfrecord_util
+  from efficientdet.keras import label_util
+  # pylint: enable=g-import-not-at-top
+except ImportError:
+  HAS_OBJECT_DETECTION = False
+
+
+def _get_cache_prefix(image_dir, annotations_dir, annotations_list):
+  """Builds the MD5 hex digest used as the filename prefix of cached files.
+
+  The digest is fed, in this order, with the last path component of the
+  absolute `image_dir`, the last path component of the absolute
+  `annotations_dir` and, when `annotations_list` is non-empty, its entries
+  sorted and joined by a single space.
+
+  Args:
+    image_dir: Path to the directory holding the images.
+    annotations_dir: Path to the directory holding the annotations.
+    annotations_list: Optional list of annotation names (strings); a falsy
+      value contributes nothing to the digest.
+
+  Returns:
+    The hexadecimal MD5 digest as a string.
+  """
+  digest = hashlib.md5()
+  for directory in (image_dir, annotations_dir):
+    leaf_name = os.path.basename(os.path.abspath(directory))
+    digest.update(leaf_name.encode('utf-8'))
+  if annotations_list:
+    joined_names = ' '.join(sorted(annotations_list))
+    digest.update(joined_names.encode('utf-8'))
+  return digest.hexdigest()
+
+
+def _get_object_detector_cache_filenames(cache_dir, image_dir, annotations_dir,
+                                         annotations_list, num_shards):
+  """Gets cache filenames for object detector.
+
+  Args:
+    cache_dir: Directory that holds the cached files. When None, a new
+      temporary directory is created with `tempfile.mkdtemp()` and its path is
+      printed.
+    image_dir: Path to the image directory; only used to derive the prefix.
+    annotations_dir: Path to the annotations directory; only used to derive the
+      prefix.
+    annotations_list: Optional list of annotation names; only used to derive
+      the prefix.
+    num_shards: Number of TFRecord shard filenames to generate.
+
+  Returns:
+    A tuple `(is_cached, cache_prefix, tfrecord_files, annotations_json_file,
+    meta_data_file)`. `is_cached` is True only when every TFRecord shard, the
+    annotations JSON file and the meta data YAML file already exist.
+  """
+  if cache_dir is None:
+    cache_dir = tempfile.mkdtemp()
+    # Interpolate the path into the message. Passing it as a second argument
+    # to print() would emit the literal '%s' placeholder instead.
+    print('Create the cache directory: %s.' % cache_dir)
+  cache_prefix = _get_cache_prefix(image_dir, annotations_dir, annotations_list)
+  cache_prefix = os.path.join(cache_dir, cache_prefix)
+
+  tfrecord_files = [
+      cache_prefix + '-%05d-of-%05d.tfrecord' % (i, num_shards)
+      for i in range(num_shards)
+  ]
+  annotations_json_file = cache_prefix + '_annotations.json'
+  meta_data_file = cache_prefix + '_meta_data.yaml'
+
+  # The shard count is part of each shard filename, so a different
+  # `num_shards` never matches a previously written cache.
+  all_cached_files = tfrecord_files + [annotations_json_file, meta_data_file]
+  is_cached = all(os.path.exists(path) for path in all_cached_files)
+  return is_cached, cache_prefix, tfrecord_files, annotations_json_file, meta_data_file
+
+
+def _get_label_map(label_map):
+  """Gets the label map dict.
+
+  Args:
+    label_map: Either a list of label names (numbered from 1 in list order) or
+      any value accepted by `label_util.get_label_map`.
+
+  Returns:
+    A new dict mapping integer label ids to string label names, with the
+    background entry (key 0) removed.
+
+  Raises:
+    ValueError: If key 0 is present but not named 'background', if a key is
+      not an int, if a value is not a str, or if a label name is duplicated.
+  """
+  if isinstance(label_map, list):
+    # 0 is reserved for background, so list entries are numbered from 1.
+    label_map = {i + 1: label for i, label in enumerate(label_map)}
+  # Work on a copy: the object returned by `label_util.get_label_map` may be
+  # the caller's own dict or a mapping shared elsewhere (not visible here), and
+  # the background entry is removed in place below.
+  label_map = dict(label_util.get_label_map(label_map))
+
+  if 0 in label_map and label_map[0] != 'background':
+    raise ValueError('0 must be resevered for background.')
+  label_map.pop(0, None)
+  name_set = set()
+  for idx, name in label_map.items():
+    if not isinstance(idx, int):
+      raise ValueError('The key (label id) in label_map must be integer.')
+    if not isinstance(name, str):
+      raise ValueError('The value (label name) in label_map must be string.')
+    if name in name_set:
+      raise ValueError('The value: %s (label name) can\'t be duplicated.' %
+                       name)
+    name_set.add(name)
+  return label_map
+
+
+class DataLoader(dataloader.DataLoader):
+  """DataLoader for object detector."""
+
+  def __init__(self,
+               tfrecord_file_patten,
+               size,
+               label_map,
+               annotations_json_file=None):
+    """Initialize DataLoader for object detector.
+
+    Args:
+      tfrecord_file_patten: Glob for tfrecord files. e.g. "/tmp/coco*.tfrecord".
+      size: The size of the dataset.
+      label_map: Variable shows mapping label integers ids to string label
+        names. 0 is the reserved key for `background` and doesn't need to be
+        included in label_map. Label names can't be duplicated. Supported
+        formats are:
+        1. Dict, map label integers ids to string label names, such as
+           {1: 'person', 2: 'notperson'}.
+        2. List, a list of label names such as ['person', 'notperson'] which is
+           the same as setting label_map={1: 'person', 2: 'notperson'}.
+        3. String, name for certain dataset. Accepted values are: 'coco', 'voc'
+           and 'waymo'.
+        4. String, yaml filename that stores label_map.
+      annotations_json_file: JSON with COCO data format containing golden
+        bounding boxes. Used for validation. If None, use the ground truth from
+        the dataloader. Refer to
+        https://towardsdatascience.com/coco-data-format-for-object-detection-a4c5eaf518c5
+        for the description of COCO data format.
+
+    Raises:
+      NotImplementedError: If the optional object detection dependencies could
+        not be imported.
+    """
+    if not HAS_OBJECT_DETECTION:
+      raise NotImplementedError("Haven't support object detection yet.")
+    # The dataset itself is built lazily in `gen_dataset`.
+    super(DataLoader, self).__init__(dataset=None, size=size)
+    self.tfrecord_file_patten = tfrecord_file_patten
+    self.label_map = _get_label_map(label_map)
+    self.annotations_json_file = annotations_json_file
+
+  @classmethod
+  def from_pascal_voc(cls,
+                      images_dir,
+                      annotations_dir,
+                      label_map,
+                      annotations_list=None,
+                      ignore_difficult_instances=False,
+                      num_shards=100,
+                      max_num_images=None,
+                      cache_dir=None):
+    """Loads from dataset with PASCAL VOC format.
+
+    Refer to
+    https://towardsdatascience.com/coco-data-format-for-object-detection-a4c5eaf518c5#:~:text=Pascal%20VOC%20is%20an%20XML,for%20training%2C%20testing%20and%20validation
+    for the description of PASCAL VOC data format.
+
+    LabelImg Tool (https://github.com/tzutalin/labelImg) can annotate the image
+    and save annotations as XML files in PASCAL VOC data format.
+
+    Annotations are in the folder: ${annotations_dir}.
+    Raw images are in the folder: ${images_dir}.
+
+    Args:
+      images_dir: Path to directory that store raw images.
+      annotations_dir: Path to the annotations directory.
+      label_map: Variable shows mapping label integers ids to string label
+        names. 0 is the reserved key for `background`. Label names can't be
+        duplicated. Supported formats are:
+        1. Dict, map label integers ids to string label names, e.g.
+           {1: 'person', 2: 'notperson'}.
+        2. List, a list of label names. e.g. ['person', 'notperson'] which is
+           the same as setting label_map={1: 'person', 2: 'notperson'}.
+        3. String, name for certain dataset. Accepted values are: 'coco', 'voc'
+           and 'waymo'.
+        4. String, yaml filename that stores label_map.
+      annotations_list: list of annotation filenames (strings) to be loaded. For
+        instance, if there're 3 annotation files [0.xml, 1.xml, 2.xml] in
+        `annotations_dir`, setting annotations_list=['0', '1'] makes this method
+        only load [0.xml, 1.xml].
+      ignore_difficult_instances: Whether to ignore difficult instances.
+        `difficult` can be set inside `object` item in the annotation xml file.
+      num_shards: Number of shards for output file.
+      max_num_images: Max number of images to process. A falsy value (None or
+        0) means no limit.
+      cache_dir: The cache directory to save TFRecord and json file. When
+        cache_dir is not set, a temporary folder is created; it is not removed
+        automatically after training, so it can be reused later.
+
+    Returns:
+      A `DataLoader` object.
+
+    Raises:
+      ValueError: If no TFRecord file matches the cache pattern.
+    """
+    label_map = _get_label_map(label_map)
+    (is_cached, cache_prefix, tfrecord_files, ann_json_file,
+     meta_data_file) = _get_object_detector_cache_filenames(
+         cache_dir, images_dir, annotations_dir, annotations_list, num_shards)
+    # If not cached, write data into tfrecord_file_paths and
+    # annotations_json_file_path.
+    # If `num_shards` differs, it's still not cached.
+    # NOTE(review): the cache lookup does not receive `label_map`,
+    # `ignore_difficult_instances` or `max_num_images`, so changing only those
+    # reuses a previously written cache (including its stored label map).
+    if not is_cached:
+      cls._write_pascal_tfrecord(images_dir, annotations_dir, label_map,
+                                 annotations_list, ignore_difficult_instances,
+                                 num_shards, max_num_images, tfrecord_files,
+                                 ann_json_file, meta_data_file)
+
+    tfrecord_file_patten = cache_prefix + '-*-of-%05d.tfrecord' % num_shards
+    if not glob.glob(tfrecord_file_patten):
+      raise ValueError('TFRecord files are empty.')
+
+    # The meta data file is one this module wrote itself into the cache
+    # directory; do not point `cache_dir` at untrusted content.
+    with tf.io.gfile.GFile(meta_data_file, 'r') as f:
+      meta_data = yaml.load(f, Loader=yaml.FullLoader)
+    return DataLoader(tfrecord_file_patten, meta_data['size'],
+                      meta_data['label_map'], ann_json_file)
+
+  @classmethod
+  def _write_pascal_tfrecord(cls, images_dir, annotations_dir, label_map_dict,
+                             annotations_list, ignore_difficult_instances,
+                             num_shards, max_num_images, tfrecord_files,
+                             annotations_json_file, meta_data_file):
+    """Write TFRecord and json file for PASCAL VOC data.
+
+    Args:
+      images_dir: Path to directory that store raw images.
+      annotations_dir: Path to the annotations directory.
+      label_map_dict: Dict mapping integer label ids to label names.
+      annotations_list: Optional list of annotation names (without the '.xml'
+        suffix). When falsy, every '*.xml' file in `annotations_dir` is used.
+      ignore_difficult_instances: Forwarded to
+        `create_pascal_tfrecord.dict_to_tf_example`.
+      num_shards: Number of shards; examples are distributed round-robin.
+      max_num_images: Max number of annotation files to process; falsy means
+        no limit.
+      tfrecord_files: Output TFRecord paths, one per shard.
+      annotations_json_file: Output path of the annotations JSON file.
+      meta_data_file: Output path of the YAML file storing the dataset size
+        and the label map.
+    """
+    label_name2id_dict = {'background': 0}
+    for label_id, name in label_map_dict.items():
+      label_name2id_dict[name] = label_id
+    ann_json_dict = {'images': [], 'annotations': [], 'categories': []}
+    # Gets the paths to annotations.
+    if annotations_list:
+      ann_path_list = [
+          os.path.join(annotations_dir, annotation + '.xml')
+          for annotation in annotations_list
+      ]
+    else:
+      ann_path_list = list(tf.io.gfile.glob(annotations_dir + r'/*.xml'))
+
+    writers = [tf.io.TFRecordWriter(path) for path in tfrecord_files]
+    # Count the examples actually written. The loop index cannot be used for
+    # the size: it is one too large after the `max_num_images` break and is
+    # not set by this loop at all when there are no annotations.
+    num_examples = 0
+    try:
+      for idx, ann_path in enumerate(ann_path_list):
+        if max_num_images and idx >= max_num_images:
+          break
+        if idx % 100 == 0:
+          tf.compat.v1.logging.info('On image %d of %d', idx,
+                                    len(ann_path_list))
+        with tf.io.gfile.GFile(ann_path, 'r') as fid:
+          xml_str = fid.read()
+        xml = etree.fromstring(xml_str)
+        data = tfrecord_util.recursive_parse_xml_to_dict(xml)['annotation']
+        tf_example = create_pascal_tfrecord.dict_to_tf_example(
+            data,
+            images_dir,
+            label_name2id_dict,
+            ignore_difficult_instances,
+            ann_json_dict=ann_json_dict)
+        writers[idx % num_shards].write(tf_example.SerializeToString())
+        num_examples += 1
+    finally:
+      # Close the shard writers even when parsing or writing fails.
+      for writer in writers:
+        writer.close()
+
+    meta_data = {'size': num_examples, 'label_map': label_map_dict}
+    with tf.io.gfile.GFile(meta_data_file, 'w') as f:
+      yaml.dump(meta_data, f)
+
+    with tf.io.gfile.GFile(annotations_json_file, 'w') as f:
+      json.dump(ann_json_dict, f)
+
+  def gen_dataset(self,
+                  model_spec,
+                  batch_size=None,
+                  is_training=True,
+                  use_fake_data=False):
+    """Generate a batched tf.data.Dataset for training/evaluation.
+
+    The generated dataset is also stored on the instance as `self._dataset`.
+
+    Args:
+      model_spec: Specification for the model. Its `config` must provide
+        `max_instances_per_image`, `debug` and `as_dict()`.
+      batch_size: A integer, the returned dataset will be batched by this size.
+      is_training: A boolean, when True, the returned dataset will be optionally
+        shuffled and repeated as an endless dataset.
+      use_fake_data: Use fake input.
+
+    Returns:
+      A TF dataset ready to be consumed by Keras model.
+    """
+    reader = det_dataloader.InputReader(
+        self.tfrecord_file_patten,
+        is_training=is_training,
+        use_fake_data=use_fake_data,
+        max_instances_per_image=model_spec.config.max_instances_per_image,
+        debug=model_spec.config.debug)
+    self._dataset = reader(model_spec.config.as_dict(), batch_size=batch_size)
+    return self._dataset
@@ -0,0 +1,100 @@
+# Copyright 2020 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import os
+
+import numpy as np
+import PIL.Image
+import tensorflow as tf
+from tensorflow_examples.lite.model_maker.core import test_util
+
+try:
+  # pylint: disable=g-import-not-at-top
+  from tensorflow_examples.lite.model_maker.core.data_util import object_detector_dataloader
+  from efficientdet import hparams_config
+  from efficientdet import utils
+# pylint: enable=g-import-not-at-top
+except ImportError:
+  pass
+
+
+class MockDetectorModelSpec(object):
+  """Minimal stand-in for a detector model spec used by the tests below."""
+
+  def __init__(self, model_name):
+    """Loads the detection config for `model_name` and stores it.
+
+    Args:
+      model_name: Name passed to `hparams_config.get_detection_config`.
+    """
+    detection_config = hparams_config.get_detection_config(model_name)
+    parsed_size = utils.parse_image_size(detection_config.image_size)
+    detection_config.image_size = parsed_size
+    detection_config.update({'debug': False})
+
+    self.model_name = model_name
+    self.config = detection_config
+
+
+class ObjectDectectorDataLoaderTest(tf.test.TestCase):
+  """Tests for `object_detector_dataloader.DataLoader`."""
+
+  def _create_pascal_voc(self):
+    """Creates a one-image PASCAL VOC style dataset.
+
+    Returns:
+      A tuple `(images_dir, annotations_dir, label_map)`.
+    """
+    # Saves the image into images_dir.
+    image_file_name = '2012_12.jpg'
+    # Use 8-bit channels: a float array forced into 'RGB' mode would have its
+    # raw bytes reinterpreted as pixel data.
+    image_data = np.random.randint(0, 256, size=(256, 256, 3), dtype=np.uint8)
+    images_dir = os.path.join(self.get_temp_dir(), 'images')
+    os.mkdir(images_dir)
+    save_path = os.path.join(images_dir, image_file_name)
+    image = PIL.Image.fromarray(image_data)
+    image.save(save_path)
+
+    # Gets the annotation path.
+    annotations_path = test_util.get_test_data_path('2012_12.xml')
+    annotations_dir = os.path.dirname(annotations_path)
+
+    label_map = {
+        1: 'person',
+        2: 'notperson',
+    }
+    return images_dir, annotations_dir, label_map
+
+  def _assert_batch(self, model_spec, images, labels):
+    """Checks the image batch shape and the number of label entries."""
+    images_shape = tf.shape(images).numpy()
+    expected_shape = np.array([1, *model_spec.config.image_size, 3])
+    self.assertTrue((images_shape == expected_shape).all())
+    self.assertLen(labels, 15)
+
+  def test_from_pascal_voc(self):
+    if not object_detector_dataloader.HAS_OBJECT_DETECTION:
+      # Report the test as skipped rather than silently passing.
+      self.skipTest('Object detection dependencies are not available.')
+
+    images_dir, annotations_dir, label_map = self._create_pascal_voc()
+    model_spec = MockDetectorModelSpec('efficientdet-lite0')
+
+    data = object_detector_dataloader.DataLoader.from_pascal_voc(
+        images_dir, annotations_dir, label_map)
+
+    self.assertIsInstance(data, object_detector_dataloader.DataLoader)
+    self.assertLen(data, 1)
+    self.assertEqual(data.label_map, label_map)
+
+    # Evaluation mode: exactly one batch is expected.
+    ds = data.gen_dataset(model_spec, batch_size=1, is_training=False)
+    for i, (images, labels) in enumerate(ds):
+      self.assertEqual(i, 0)
+      self._assert_batch(model_spec, images, labels)
+
+    # Training mode: the dataset repeats forever, so only sample a few batches.
+    ds1 = data.gen_dataset(model_spec, batch_size=1, is_training=True)
+    self.assertEqual(ds1.cardinality(), tf.data.INFINITE_CARDINALITY)
+    for images, labels in ds1.take(10):
+      self._assert_batch(model_spec, images, labels)
+
+
+# Invoke tf.test.main() when this file is executed as a script.
+if __name__ == '__main__':
+  tf.test.main()