Skip to content

Commit 9ee6190

Browse files
ziyeqinghan authored and copybara-github committed
Change optimizer for image classification in TFLite Model Maker
PiperOrigin-RevId: 306180023
1 parent ff7d01d commit 9ee6190

5 files changed

Lines changed: 293 additions & 31 deletions

File tree

Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,13 @@
1+
# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
Lines changed: 57 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,57 @@
1+
# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
14+
"""Functions and classes related to optimization (weight updates)."""
15+
16+
from __future__ import absolute_import
17+
from __future__ import division
18+
from __future__ import print_function
19+
20+
import tensorflow.compat.v2 as tf
21+
22+
23+
class WarmUp(tf.keras.optimizers.schedules.LearningRateSchedule):
  """Applies a warmup schedule on a given learning rate decay schedule.

  For the first `warmup_steps` training steps, the learning rate ramps up
  linearly from 0 to `initial_learning_rate`; after that, the wrapped
  `decay_schedule_fn` takes over.
  """

  def __init__(self,
               initial_learning_rate,
               decay_schedule_fn,
               warmup_steps,
               name=None):
    """Initializes the warmup schedule.

    Args:
      initial_learning_rate: Peak learning rate reached at the end of warmup.
      decay_schedule_fn: Schedule (a callable taking the step) applied once
        warmup has finished.
      warmup_steps: Number of steps over which to warm up linearly.
      name: Optional name for the op scope.
    """
    super(WarmUp, self).__init__()
    self.initial_learning_rate = initial_learning_rate
    self.warmup_steps = warmup_steps
    self.decay_schedule_fn = decay_schedule_fn
    self.name = name

  def __call__(self, step):
    with tf.name_scope(self.name or 'WarmUp') as name:
      # Linear warmup: while global_step < warmup_steps the learning rate is
      # `global_step / warmup_steps * initial_learning_rate`.
      step_f = tf.cast(step, tf.float32)
      warmup_f = tf.cast(self.warmup_steps, tf.float32)
      fraction_done = step_f / warmup_f
      warmup_lr = self.initial_learning_rate * fraction_done
      return tf.cond(
          step_f < warmup_f,
          lambda: warmup_lr,
          lambda: self.decay_schedule_fn(step),
          name=name)

  def get_config(self):
    """Returns the schedule's configuration for (de)serialization."""
    return {
        'initial_learning_rate': self.initial_learning_rate,
        'decay_schedule_fn': self.decay_schedule_fn,
        'warmup_steps': self.warmup_steps,
        'name': self.name
    }

tensorflow_examples/lite/model_maker/core/task/image_classifier.py

Lines changed: 58 additions & 30 deletions
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,7 @@
1717
from __future__ import division
1818
from __future__ import print_function
1919

20-
import tensorflow as tf
20+
import tensorflow.compat.v2 as tf
2121

2222
from tensorflow_examples.lite.model_maker.core import compat
2323
from tensorflow_examples.lite.model_maker.core import model_export_format as mef
@@ -26,8 +26,15 @@
2626
from tensorflow_examples.lite.model_maker.core.task import image_preprocessing
2727
from tensorflow_examples.lite.model_maker.core.task import metadata
2828
from tensorflow_examples.lite.model_maker.core.task import model_spec as ms
29+
from tensorflow_examples.lite.model_maker.core.task import train_image_classifier_lib
2930

30-
from tensorflow_hub.tools.make_image_classifier import make_image_classifier_lib as lib
31+
from tensorflow_hub.tools.make_image_classifier import make_image_classifier_lib as hub_lib
32+
33+
34+
def get_hub_lib_hparams(**kwargs):
35+
"""Gets the hyperparameters for the tensorflow hub's library."""
36+
hparams = hub_lib.get_default_hparams()
37+
return train_image_classifier_lib.add_params(hparams, **kwargs)
3138

3239

3340
def create(train_data,
@@ -41,7 +48,10 @@ def create(train_data,
4148
dropout_rate=None,
4249
learning_rate=None,
4350
momentum=None,
44-
use_augmentation=False):
51+
use_augmentation=False,
52+
use_hub_library=True,
53+
warmup_steps=None,
54+
model_dir=None):
4555
"""Loads data and retrains the model based on data for image classification.
4656
4757
Args:
@@ -50,36 +60,51 @@ def create(train_data,
5060
model_spec: Specification for the model.
5161
shuffle: Whether the data should be shuffled.
5262
validation_data: Validation data. If None, skips validation process.
53-
batch_size: Number of samples per training step.
63+
batch_size: Number of samples per training step. If `use_hub_library` is
64+
False, it represents the base learning rate when train batch size is 256
65+
and it's linear to the batch size.
5466
epochs: Number of epochs for training.
5567
train_whole_model: If true, the Hub module is trained together with the
5668
classification layer on top. Otherwise, only train the top classification
5769
layer.
58-
dropout_rate: the rate for dropout.
59-
learning_rate: a Python float forwarded to the optimizer.
60-
momentum: a Python float forwarded to the optimizer.
70+
dropout_rate: The rate for dropout.
71+
learning_rate: Base learning rate when train batch size is 256. Linear to
72+
the batch size.
73+
momentum: a Python float forwarded to the optimizer. Only used when
74+
`use_hub_library` is True.
6175
use_augmentation: Use data augmentation for preprocessing.
76+
use_hub_library: Use `make_image_classifier_lib` from tensorflow hub to
77+
retrain the model.
78+
warmup_steps: Number of warmup steps for warmup schedule on learning rate.
79+
If None, the default warmup_steps is used which is the total training
80+
steps in two epochs. Only used when `use_hub_library` is False.
81+
model_dir: The location of the model checkpoint files. Only used when
82+
`use_hub_library` is False.
83+
6284
Returns:
6385
An instance of ImageClassifier class.
6486
"""
6587
if compat.get_tf_behavior() not in model_spec.compat_tf_versions:
6688
raise ValueError('Incompatible versions. Expect {}, but got {}.'.format(
6789
model_spec.compat_tf_versions, compat.get_tf_behavior()))
6890

69-
# The hyperparameters for make_image_classifier by tensorflow hub.
70-
hparams = lib.get_default_hparams()
71-
if batch_size is not None:
72-
hparams = hparams._replace(batch_size=batch_size)
73-
if epochs is not None:
74-
hparams = hparams._replace(train_epochs=epochs)
75-
if train_whole_model is not None:
76-
hparams = hparams._replace(do_fine_tuning=train_whole_model)
77-
if dropout_rate is not None:
78-
hparams = hparams._replace(dropout_rate=dropout_rate)
79-
if learning_rate is not None:
80-
hparams = hparams._replace(learning_rate=learning_rate)
81-
if momentum is not None:
82-
hparams = hparams._replace(momentum=momentum)
91+
if use_hub_library:
92+
hparams = get_hub_lib_hparams(
93+
batch_size=batch_size,
94+
train_epochs=epochs,
95+
do_fine_tuning=train_whole_model,
96+
dropout_rate=dropout_rate,
97+
learning_rate=learning_rate,
98+
momentum=momentum)
99+
else:
100+
hparams = train_image_classifier_lib.HParams.get_hparams(
101+
batch_size=batch_size,
102+
train_epochs=epochs,
103+
do_fine_tuning=train_whole_model,
104+
dropout_rate=dropout_rate,
105+
learning_rate=learning_rate,
106+
warmup_steps=warmup_steps,
107+
model_dir=model_dir)
83108

84109
image_classifier = ImageClassifier(
85110
model_export_format,
@@ -105,7 +130,7 @@ def __init__(self,
105130
index_to_label,
106131
num_classes,
107132
shuffle=True,
108-
hparams=lib.get_default_hparams(),
133+
hparams=hub_lib.get_default_hparams(),
109134
use_augmentation=False):
110135
"""Init function for ImageClassifier class.
111136
@@ -118,6 +143,8 @@ def __init__(self,
118143
hparams: A namedtuple of hyperparameters. This function expects
119144
.dropout_rate: The fraction of the input units to drop, used in dropout
120145
layer.
146+
.do_fine_tuning: If true, the Hub module is trained together with the
147+
classification layer on top.
121148
use_augmentation: Use data augmentation for preprocessing.
122149
"""
123150
super(ImageClassifier,
@@ -138,21 +165,18 @@ def _create_model(self, hparams=None):
138165

139166
module_layer = hub_loader.HubKerasLayerV1V2(
140167
self.model_spec.uri, trainable=hparams.do_fine_tuning)
141-
return lib.build_model(module_layer, hparams,
142-
self.model_spec.input_image_shape, self.num_classes)
168+
return hub_lib.build_model(module_layer, hparams,
169+
self.model_spec.input_image_shape,
170+
self.num_classes)
143171

144172
def train(self, train_data, validation_data=None, hparams=None):
145173
"""Feeds the training data for training.
146174
147175
Args:
148176
train_data: Training data.
149177
validation_data: Validation data. If None, skips validation process.
150-
hparams: A namedtuple of hyperparameters. This function expects
151-
.train_epochs: a Python integer with the number of passes over the
152-
training dataset;
153-
.learning_rate: a Python float forwarded to the optimizer;
154-
.momentum: a Python float forwarded to the optimizer;
155-
.batch_size: a Python integer, number of samples per training step.
178+
hparams: An instance of hub_lib.HParams or
179+
train_image_classifier_lib.HParams. A namedtuple of hyperparameters.
156180
157181
Returns:
158182
The tf.keras.callbacks.History object returned by tf.keras.Model.fit*().
@@ -170,7 +194,11 @@ def train(self, train_data, validation_data=None, hparams=None):
170194
validation_data, hparams.batch_size, is_training=False)
171195
validation_size = validation_data.size
172196
validation_data_and_size = (validation_ds, validation_size)
197+
173198
# Trains the models.
199+
lib = hub_lib
200+
if isinstance(hparams, train_image_classifier_lib.HParams):
201+
lib = train_image_classifier_lib
174202
return lib.train_model(self.model, hparams, train_data_and_size,
175203
validation_data_and_size)
176204

tensorflow_examples/lite/model_maker/core/task/image_classifier_test.py

Lines changed: 14 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -20,7 +20,7 @@
2020
import os
2121

2222
import numpy as np
23-
import tensorflow as tf
23+
import tensorflow.compat.v2 as tf
2424
from tensorflow_examples.lite.model_maker.core import compat
2525
from tensorflow_examples.lite.model_maker.core import model_export_format as mef
2626
from tensorflow_examples.lite.model_maker.core import test_util
@@ -84,6 +84,19 @@ def test_mobilenetv2_model_create_v1_incompatible(self):
8484
_ = image_classifier.create(self.train_data, mef.ModelExportFormat.TFLITE,
8585
model_spec.mobilenet_v2_spec)
8686

87+
@test_util.test_in_tf_1and2
88+
def test_efficientnetlite0_model_with_model_maker_retraining_lib(self):
89+
model = image_classifier.create(
90+
self.train_data,
91+
mef.ModelExportFormat.TFLITE,
92+
model_spec.efficientnet_lite0_spec,
93+
epochs=2,
94+
batch_size=4,
95+
shuffle=True,
96+
use_hub_library=False)
97+
self._test_accuracy(model)
98+
self._test_export_to_tflite(model)
99+
87100
@test_util.test_in_tf_1and2
88101
def test_efficientnetlite0_model(self):
89102
model = image_classifier.create(

0 commit comments

Comments
 (0)