Add object_detector task in TFLite Model Maker

ziyeqinghan · copybara-github · commit a40bab43e6a2 · 2021-01-11T23:24:29.000-08:00
PiperOrigin-RevId: 351309014
diff --git a/tensorflow_examples/lite/model_maker/core/task/object_detector.py b/tensorflow_examples/lite/model_maker/core/task/object_detector.py
@@ -0,0 +1,119 @@
+# Copyright 2020 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""ObjectDetector class."""
+
+import tensorflow as tf
+from tensorflow_examples.lite.model_maker.core import compat
+from tensorflow_examples.lite.model_maker.core.task import custom_model
+from tensorflow_examples.lite.model_maker.core.task import model_spec as ms
+
+
+def create(train_data, model_spec, validation_data=None, epochs=None,
+           batch_size=None, do_train=True):
+  """Creates an ObjectDetector and, by default, trains it on `train_data`.
+
+  Args:
+    train_data: Training data; its `label_map` is handed to the detector.
+    model_spec: Specification for the model, resolved through `ms.get`.
+    validation_data: Validation data. If None, no validation dataset is built.
+    epochs: Number of epochs for training.
+    batch_size: Batch size for training.
+    do_train: Whether to run training. If False, only the model is created.
+
+  Returns:
+    The `ObjectDetector` instance.
+
+  Raises:
+    ValueError: If the TF behavior is not in `model_spec.compat_tf_versions`.
+  """
+  model_spec = ms.get(model_spec)
+  # Read the TF behavior once so the check and the message use one value.
+  tf_behavior = compat.get_tf_behavior()
+  if tf_behavior not in model_spec.compat_tf_versions:
+    raise ValueError('Incompatible versions. Expect {}, but got {}.'.format(
+        model_spec.compat_tf_versions, tf_behavior))
+
+  object_detector = ObjectDetector(model_spec, train_data.label_map)
+  if do_train:
+    tf.compat.v1.logging.info('Retraining the models...')
+    object_detector.train(train_data, validation_data, epochs, batch_size)
+  else:
+    object_detector.create_model()
+
+  return object_detector
+
+
+class ObjectDetector(custom_model.CustomModel):
+  """ObjectDetector class for inference and exporting to tflite."""
+
+  def __init__(self, model_spec, label_map):
+    """Writes `label_map` and its length into `model_spec.config`."""
+    super().__init__(model_spec, shuffle=None)
+    if model_spec.config.label_map and model_spec.config.label_map != label_map:
+      tf.compat.v1.logging.warn(
+          'Label map is not the same as the previous label_map in model_spec.')
+    # The label map given here always replaces the one held by the spec.
+    model_spec.config.label_map = label_map
+    model_spec.config.num_classes = len(label_map)
+
+  def create_model(self):
+    """Creates the model from the spec, keeps it on `self.model`, returns it."""
+    self.model = self.model_spec.create_model()
+    return self.model
+
+  def _get_dataset_and_steps(self, data, batch_size, is_training):
+    """Gets dataset, steps and annotations json file."""
+    if not data:  # E.g. `train` forwarding `validation_data=None`.
+      return None, 0, None
+    # TODO(b/171449557): Put this into DataLoader.
+    dataset = data.gen_dataset(
+        self.model_spec, batch_size, is_training=is_training)
+    return dataset, len(data) // batch_size, data.annotations_json_file
+
+  def train(self, train_data, validation_data=None, epochs=None,
+            batch_size=None):
+    """Trains the model. Raises ValueError if train_data is under one batch."""
+    batch_size = batch_size or self.model_spec.batch_size
+    # TODO(b/171449557): Upstream this to the parent class.
+    if len(train_data) < batch_size:
+      raise ValueError('The size of the train_data (%d) couldn\'t be smaller '
+                       'than batch_size (%d). To solve this problem, set '
+                       'the batch_size smaller or increase the size of the '
+                       'train_data.' % (len(train_data), batch_size))
+
+    with self.model_spec.ds_strategy.scope():
+      self.create_model()
+      train_ds, steps_per_epoch, _ = self._get_dataset_and_steps(
+          train_data, batch_size, is_training=True)
+      validation_ds, validation_steps, val_json_file = self._get_dataset_and_steps(
+          validation_data, batch_size, is_training=False)
+      return self.model_spec.train(self.model, train_ds, steps_per_epoch,
+                                   validation_ds, validation_steps, epochs,
+                                   batch_size, val_json_file)
+
+  def evaluate(self, data, batch_size=None):
+    """Evaluates the model. Raises ValueError if data is under one batch."""
+    batch_size = batch_size or self.model_spec.batch_size
+    steps = len(data) // batch_size
+    # TODO(b/171449557): Upstream this to the parent class.
+    # Checked before building the dataset so undersized input fails fast.
+    if steps <= 0:
+      raise ValueError('The size of the validation_data (%d) couldn\'t be '
+                       'smaller than batch_size (%d). To solve this problem, '
+                       'set the batch_size smaller or increase the size of the '
+                       'validation_data.' % (len(data), batch_size))
+
+    ds = data.gen_dataset(self.model_spec, batch_size, is_training=False)
+    return self.model_spec.evaluate(self.model, ds, steps,
+                                    data.annotations_json_file)
diff --git a/tensorflow_examples/lite/model_maker/core/task/object_detector_test.py b/tensorflow_examples/lite/model_maker/core/task/object_detector_test.py
@@ -0,0 +1,56 @@
+# Copyright 2020 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the 'License');
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an 'AS IS' BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import os
+
+import tensorflow.compat.v2 as tf
+from tensorflow_examples.lite.model_maker.core import compat
+from tensorflow_examples.lite.model_maker.core import test_util
+from tensorflow_examples.lite.model_maker.core.data_util import object_detector_dataloader
+from tensorflow_examples.lite.model_maker.core.task import object_detector
+from tensorflow_examples.lite.model_maker.core.task.model_spec import object_detector_spec
+
+
+class ObjectDetectorTest(tf.test.TestCase):
+  """Trains and evaluates an ObjectDetector end to end with batch size 1."""
+
+  def testEfficientDetLite0(self):
+    # Model spec pointing at the 'fake_effdet_lite0_hub' test-data path.
+    spec = object_detector_spec.EfficientDetModelSpec(
+        model_name='efficientdet-lite0',
+        uri=test_util.get_test_data_path('fake_effdet_lite0_hub'))
+
+    # Pascal VOC inputs come from test_util, given the test's temp directory.
+    images_dir, annotations_dir, label_map = test_util.create_pascal_voc(
+        self.get_temp_dir())
+    loader = object_detector_dataloader.DataLoader.from_pascal_voc(
+        images_dir, annotations_dir, label_map)
+
+    # Train for a single epoch, then evaluate on the very same data.
+    detector = object_detector.create(loader, spec, batch_size=1, epochs=1)
+    eval_metrics = detector.evaluate(loader, batch_size=1)
+
+    self.assertIsInstance(eval_metrics, dict)
+    self.assertGreaterEqual(eval_metrics['AP'], 0)
+
+
+if __name__ == '__main__':
+  # Set before the tests start so tensorflow_hub loads compressed models.
+  os.environ['TFHUB_MODEL_LOAD_FORMAT'] = 'COMPRESSED'
+  compat.setup_tf_behavior(tf_version=2)
+  tf.test.main()