Model Maker: Add audio classification demo.

wangtz · MarkDaoust · commit 5e90c6c3ca05 · 2021-01-19T09:32:27.000-08:00
PiperOrigin-RevId: 352510173
diff --git a/tensorflow_examples/lite/model_maker/core/test_util.py b/tensorflow_examples/lite/model_maker/core/test_util.py
@@ -45,7 +45,7 @@ def test_srcdir():
 
 def get_test_data_path(file_or_dirname):
   """Return full test data path."""
-  for directory, subdirs, files in tf.io.gfile.walk(test_srcdir()):
+  for (directory, subdirs, files) in tf.io.gfile.walk(test_srcdir()):
     for f in subdirs + files:
       if f.endswith(file_or_dirname):
         return os.path.join(directory, f)
diff --git a/tensorflow_examples/lite/model_maker/demo/audio_classification_demo.py b/tensorflow_examples/lite/model_maker/demo/audio_classification_demo.py
@@ -0,0 +1,103 @@
+# Copyright 2020 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""Audio classification demo code of Model Maker for TFLite.
+
+Example usage:
+python audio_classification_demo.py --export_dir=/tmp
+
+Sample output:
+Downloading data from
+https://storage.googleapis.com/download.tensorflow.org/data/mini_speech_commands.zip
+182083584/182082353 [==============================] - 4s 0us/step
+182091776/182082353 [==============================] - 4s 0us/step
+Dataset has been downloaded to
+/usr/local/google/home/wangtz/.keras/datasets/mini_speech_commands
+Processing audio files:
+8000/8000 [==============================] - 354s 44ms/file
+Cached 7178 audio samples.
+Training the model
+5742/5742 [==============================] - 29s 5ms/step - loss: 3.2289 - acc:
+0.8029 - val_loss: 0.6229 - val_acc: 0.9638
+Evaluating the model
+15/15 [==============================] - 2s 12ms/step - loss: 1.3569 - acc:
+0.9270
+Test accuracy: 0.927039
+"""
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+from absl import app
+from absl import flags
+from absl import logging
+
+import tensorflow as tf
+from tensorflow_examples.lite.model_maker.core.data_util import audio_dataloader
+from tensorflow_examples.lite.model_maker.core.task import audio_classifier
+from tensorflow_examples.lite.model_maker.core.task import model_spec
+
+FLAGS = flags.FLAGS
+
+
+def define_flags():  # Registers this demo's absl command-line flags.
+  flags.DEFINE_string(
+      'export_dir', None, 'The directory to save exported files.')
+  flags.DEFINE_string(
+      'spec', 'audio_browser_fft', 'Name of the model spec to use.')
+  flags.mark_flag_as_required('export_dir')  # It has no usable default.
+
+
+def download_dataset(**kwargs):
+  """Fetches the demo archive and returns the dataset directory path."""
+  tf.compat.v1.logging.info('Downloading mini speech command dataset.')
+  # `kwargs` are forwarded to `get_file`, e.g. `cache_dir` and `file_hash`.
+  archive_path = tf.keras.utils.get_file(
+      fname='mini_speech_commands.zip',
+      origin='https://storage.googleapis.com/download.tensorflow.org/data/mini_speech_commands.zip',
+      extract=True,
+      **kwargs)
+  # Path minus its extension, e.g. ${HOME}/.keras/datasets/mini_speech_commands
+  dataset_dir = archive_path.rsplit('.', 1)[0]
+  print(f'Dataset has been downloaded to {dataset_dir}')
+  return dataset_dir
+
+
+def run(data_dir, export_dir, spec='audio_browser_fft', **kwargs):
+  """Trains on `data_dir`, prints test accuracy, exports to `export_dir`.
+
+  `spec` is resolved with `model_spec.get`; `kwargs` go to the classifier.
+  """
+  model_spec_obj = model_spec.get(spec)
+  dataset = audio_dataloader.DataLoader.from_folder(model_spec_obj, data_dir)
+  train_split, holdout = dataset.split(0.8)
+  validation_split, test_split = holdout.split(0.5)
+  print('Training the model')
+  classifier = audio_classifier.create(
+      train_split, model_spec_obj, validation_split, **kwargs)
+  print('Evaluating the model')
+  _, accuracy = classifier.evaluate(test_split)
+  print('Test accuracy: %f' % accuracy)
+  classifier.export(export_dir)
+
+
+def main(_):
+  """Downloads the demo data, then runs the demo with --export_dir/--spec."""
+  logging.set_verbosity(logging.INFO)
+  run(download_dataset(), FLAGS.export_dir, spec=FLAGS.spec)
+
+
+if __name__ == '__main__':
+  define_flags()  # Register the flags before `app.run` starts `main`.
+  app.run(main)
diff --git a/tensorflow_examples/lite/model_maker/demo/audio_classification_demo_test.py b/tensorflow_examples/lite/model_maker/demo/audio_classification_demo_test.py
@@ -0,0 +1,80 @@
+# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the 'License');
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an 'AS IS' BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import os
+import tempfile
+import unittest
+
+import tensorflow as tf
+
+from tensorflow_examples.lite.model_maker.core import test_util
+from tensorflow_examples.lite.model_maker.core.data_util.audio_dataloader import DataLoader
+from tensorflow_examples.lite.model_maker.demo import audio_classification_demo
+
+
+from_folder_fn = DataLoader.from_folder  # Unpatched original, used below.
+
+
+def patch_data_loader():
+  """Returns a patcher making `DataLoader.from_folder` keep at most 10 items."""
+
+  def side_effect(*args, **kwargs):
+    tf.compat.v1.logging.info('Train on partial dataset')
+    # This takes around 8 mins as it caches all files in the folder.
+    # We should be able to address this issue once the dataset is lazily loaded.
+    data_loader = from_folder_fn(*args, **kwargs)
+    if len(data_loader) > 10:  # Trim dataset to at most 10.
+      data_loader._size = 10
+      # TODO(b/171449557): Change this once the dataset is lazily loaded.
+      data_loader._dataset = data_loader._dataset.take(10)
+    return data_loader
+
+  from unittest import mock  # Explicit: `import unittest` does not load it.
+  return mock.patch.object(DataLoader, 'from_folder', side_effect=side_effect)
+
+
+class AudioClassificationDemoTest(tf.test.TestCase):
+  """Runs the audio classification demo end to end on a trimmed dataset."""
+
+  def test_audio_classification_demo(self):
+    # Patch the loader and work inside a throwaway directory.
+    with patch_data_loader(), tempfile.TemporaryDirectory() as temp_dir:
+      # Use cached training data if exists.
+      cache_dir = test_util.get_cache_dir(temp_dir, 'mini_speech_commands.zip')
+      data_dir = audio_classification_demo.download_dataset(
+          cache_dir=cache_dir,
+          file_hash='4b8a67bae2973844e84fa7ac988d1a44')
+
+      # Train for a single epoch with batch size 1.
+      audio_classification_demo.run(
+          data_dir, temp_dir, spec='audio_browser_fft', epochs=1, batch_size=1)
+
+      # The export must produce a non-empty TFLite model file...
+      tflite_filename = os.path.join(temp_dir, 'model.tflite')
+      self.assertTrue(tf.io.gfile.exists(tflite_filename))
+      self.assertGreater(os.path.getsize(tflite_filename), 0)
+
+      # ...but no separate label file.
+      label_filename = os.path.join(temp_dir, 'labels.txt')
+      self.assertFalse(tf.io.gfile.exists(label_filename))
+
+
+if __name__ == '__main__':
+  # Set before `tf.test.main()` so tensorflow_hub loads compressed models.
+  os.environ['TFHUB_MODEL_LOAD_FORMAT'] = 'COMPRESSED'
+  tf.test.main()