Open source model_maker/python/core/tasks and model_maker/python/vision/image_classifier

PiperOrigin-RevId: 481182271
2022-10-14 10:45:23 -07:00 · 2022-10-14 10:45:23 -07:00 · 0428550d75
commit 0428550d75
parent 6f3e8381ed
20 changed files with 1544 additions and 0 deletions
--- a/mediapipe/model_maker/python/core/tasks/BUILD
+++ b/mediapipe/model_maker/python/core/tasks/BUILD
@ -0,0 +1,64 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 # Placeholder for internal Python strict library and test compatibility macro.
 # Targets in this package default to being visible to every package under
 # //mediapipe.
 package(
    default_visibility = ["//mediapipe:__subpackages__"],
 )
 licenses(["notice"])
 # Library for custom_model.py; depends on the core dataset, model_util and
 # quantization targets.
 py_library(
    name = "custom_model",
    srcs = ["custom_model.py"],
    srcs_version = "PY3",
    deps = [
        "//mediapipe/model_maker/python/core/data:dataset",
        "//mediapipe/model_maker/python/core/utils:model_util",
        "//mediapipe/model_maker/python/core/utils:quantization",
    ],
 )
 # Unit test for :custom_model; test_util supplies the helper model builder.
 py_test(
    name = "custom_model_test",
    srcs = ["custom_model_test.py"],
    python_version = "PY3",
    srcs_version = "PY3",
    deps = [
        ":custom_model",
        "//mediapipe/model_maker/python/core/utils:test_util",
    ],
 )
 # Library for classifier.py, which builds on :custom_model.
 py_library(
    name = "classifier",
    srcs = ["classifier.py"],
    srcs_version = "PY3",
    deps = [
        ":custom_model",
        "//mediapipe/model_maker/python/core/data:dataset",
    ],
 )
 # Unit test for :classifier.
 py_test(
    name = "classifier_test",
    srcs = ["classifier_test.py"],
    python_version = "PY3",
    srcs_version = "PY3",
    deps = [
        ":classifier",
        "//mediapipe/model_maker/python/core/utils:test_util",
    ],
 )
--- a/mediapipe/model_maker/python/core/tasks/__init__.py
+++ b/mediapipe/model_maker/python/core/tasks/__init__.py
@ -0,0 +1,13 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
--- a/mediapipe/model_maker/python/core/tasks/classifier.py
+++ b/mediapipe/model_maker/python/core/tasks/classifier.py
@ -0,0 +1,77 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """Custom classifier."""
 from __future__ import absolute_import
 from __future__ import division
 from __future__ import print_function
 import os
 from typing import Any, List
 import tensorflow as tf
 from mediapipe.model_maker.python.core.data import dataset
 from mediapipe.model_maker.python.core.tasks import custom_model
 class Classifier(custom_model.CustomModel):
  """Abstract base class for TensorFlow classification models.

  On top of what `custom_model.CustomModel` stores, a classifier remembers the
  label names, the number of classes and whether the whole network is trained.
  """

  def __init__(self, model_spec: Any, index_to_label: List[str], shuffle: bool,
               full_train: bool):
    """Initializes a classifier with its specifications.

    Args:
      model_spec: Specification for the model.
      index_to_label: Label class names, ordered so that position `i` holds
        the name of class index `i`.
      shuffle: Whether the dataset should be shuffled.
      full_train: If true, train the model end-to-end including the backbone
        and the classification layers on top. Otherwise, only train the top
        classification layers.
    """
    super().__init__(model_spec, shuffle)
    self._full_train = full_train
    self._index_to_label = index_to_label
    # The class count is derived from the label list rather than passed in.
    self._num_classes = len(index_to_label)

  def evaluate(self, data: dataset.Dataset, batch_size: int = 32) -> Any:
    """Evaluates the classifier on the given dataset.

    Args:
      data: Evaluation dataset.
      batch_size: Number of samples per evaluation step.

    Returns:
      The result of `self._model.evaluate` on the batched dataset: the loss
      value and accuracy.
    """
    # Evaluation data is batched in non-training mode and run through the
    # classifier's own preprocessing callable.
    eval_ds = data.gen_tf_dataset(
        batch_size, is_training=False, preprocess=self._preprocess)
    return self._model.evaluate(eval_ds)

  def export_labels(self, export_dir: str, label_filename: str = 'labels.txt'):
    """Writes the label names to a text file, one label per line.

    Args:
      export_dir: The directory to save exported files. It is created when it
        does not exist yet.
      label_filename: File name of the label file. The full export path is
        {export_dir}/{label_filename}.
    """
    output_path = os.path.join(export_dir, label_filename)
    if not tf.io.gfile.exists(export_dir):
      tf.io.gfile.makedirs(export_dir)
    tf.compat.v1.logging.info('Saving labels in %s', output_path)
    with tf.io.gfile.GFile(output_path, 'w') as label_file:
      # Labels are newline-separated; no newline follows the last label.
      label_file.write('\n'.join(self._index_to_label))
--- a/mediapipe/model_maker/python/core/tasks/classifier_test.py
+++ b/mediapipe/model_maker/python/core/tasks/classifier_test.py
@ -0,0 +1,58 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the 'License');
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an 'AS IS' BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 import os
 # Dependency imports
 import tensorflow as tf
 from mediapipe.model_maker.python.core.tasks import classifier
 from mediapipe.model_maker.python.core.utils import test_util
 class MockClassifier(classifier.Classifier):
  """Concrete, do-nothing `classifier.Classifier` used only by these tests."""

  def train(self, train_data, validation_data=None, **kwargs):
    """Placeholder training step; does nothing."""
    return None

  def evaluate(self, data, **kwargs):
    """Placeholder evaluation step; does nothing."""
    return None
 class ClassifierTest(tf.test.TestCase):
  """Tests the label export of `classifier.Classifier` via `MockClassifier`."""

  def setUp(self):
    """Builds a two-class mock classifier backed by a small test model."""
    super().setUp()
    index_to_label = ['cat', 'dog']
    self.model = MockClassifier(
        model_spec=None,
        index_to_label=index_to_label,
        shuffle=False,
        full_train=False)
    # The classifier keeps its Keras model in `_model` (set to None by
    # `custom_model.CustomModel.__init__`). Assigning to a public `model`
    # attribute would leave `_model` as None.
    self.model._model = test_util.build_model(input_shape=[4], num_classes=2)

  def _check_nonempty_file(self, filepath):
    """Asserts that `filepath` is an existing file with a size above zero."""
    self.assertTrue(os.path.isfile(filepath))
    self.assertGreater(os.path.getsize(filepath), 0)

  def test_export_labels(self):
    """`export_labels` writes a non-empty labels.txt into the export dir."""
    export_path = os.path.join(self.get_temp_dir(), 'export/')
    self.model.export_labels(export_dir=export_path)
    self._check_nonempty_file(os.path.join(export_path, 'labels.txt'))
 # Run the test cases in this file when it is executed as a script.
 if __name__ == '__main__':
  tf.test.main()
--- a/mediapipe/model_maker/python/core/tasks/custom_model.py
+++ b/mediapipe/model_maker/python/core/tasks/custom_model.py
@ -0,0 +1,85 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """Interface to define a custom model."""
 from __future__ import absolute_import
 from __future__ import division
 from __future__ import print_function
 import abc
 import os
 from typing import Any, Callable, Optional
 # Dependency imports
 import tensorflow as tf
 from mediapipe.model_maker.python.core.data import dataset
 from mediapipe.model_maker.python.core.utils import model_util
 from mediapipe.model_maker.python.core.utils import quantization
 class CustomModel(abc.ABC):
  """Abstract base class for a custom TensorFlow model.

  Subclasses must implement `evaluate`. The underlying model lives in
  `self._model`, which starts out as None and is left for subclasses to set.
  """

  def __init__(self, model_spec: Any, shuffle: bool):
    """Initializes a custom model with model specs and other parameters.

    Args:
      model_spec: Specification for the model.
      shuffle: Whether the training data need be shuffled.
    """
    # Neither the model nor the preprocessing callable exists yet.
    self._model = None
    self._preprocess = None
    self._model_spec = model_spec
    self._shuffle = shuffle

  @abc.abstractmethod
  def evaluate(self, data: dataset.Dataset, **kwargs):
    """Evaluates the model with the provided data."""
    return None

  def summary(self):
    """Prints a summary of the model by delegating to `self._model.summary`."""
    self._model.summary()

  def export_tflite(
      self,
      export_dir: str,
      tflite_filename: str = 'model.tflite',
      quantization_config: Optional[quantization.QuantizationConfig] = None,
      preprocess: Optional[Callable[..., bool]] = None):
    """Exports the model as a TensorFlow Lite file.

    Args:
      export_dir: The directory to save exported files. It is created when it
        does not exist yet.
      tflite_filename: File name to save tflite model. The full export path is
        {export_dir}/{tflite_filename}.
      quantization_config: The configuration for model quantization.
      preprocess: A callable to preprocess the representative dataset for
        quantization. The callable takes three arguments in order: feature,
        label, and is_training.
    """
    if not tf.io.gfile.exists(export_dir):
      tf.io.gfile.makedirs(export_dir)
    output_path = os.path.join(export_dir, tflite_filename)
    # TODO: Populate metadata to the exported TFLite model.
    model_util.export_tflite(
        self._model, output_path, quantization_config, preprocess=preprocess)
    tf.compat.v1.logging.info(
        'TensorFlow Lite model exported successfully: %s', output_path)
--- a/mediapipe/model_maker/python/core/tasks/custom_model_test.py
+++ b/mediapipe/model_maker/python/core/tasks/custom_model_test.py
@ -0,0 +1,56 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the 'License');
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an 'AS IS' BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 from __future__ import absolute_import
 from __future__ import division
 from __future__ import print_function
 import os
 # Dependency imports
 import tensorflow as tf
 from mediapipe.model_maker.python.core.tasks import custom_model
 from mediapipe.model_maker.python.core.utils import test_util
 class MockCustomModel(custom_model.CustomModel):
  """Concrete, do-nothing `custom_model.CustomModel` used only by these tests."""

  def train(self, train_data, validation_data=None, **kwargs):
    """Placeholder training step; does nothing."""
    return None

  def evaluate(self, data, **kwargs):
    """Placeholder for the abstract `evaluate`; does nothing."""
    return None
 class CustomModelTest(tf.test.TestCase):
  """Tests the TFLite export of `custom_model.CustomModel`."""

  def setUp(self):
    """Creates a mock model backed by a small model from `test_util`."""
    super().setUp()
    mock_model = MockCustomModel(model_spec=None, shuffle=False)
    mock_model._model = test_util.build_model(input_shape=[4], num_classes=2)
    self.model = mock_model

  def _check_nonempty_file(self, filepath):
    """Asserts that `filepath` is an existing file with a size above zero."""
    self.assertTrue(os.path.isfile(filepath))
    file_size = os.path.getsize(filepath)
    self.assertGreater(file_size, 0)

  def test_export_tflite(self):
    """`export_tflite` writes a non-empty model.tflite into the export dir."""
    export_dir = os.path.join(self.get_temp_dir(), 'export/')
    self.model.export_tflite(export_dir=export_dir)
    exported_file = os.path.join(export_dir, 'model.tflite')
    self._check_nonempty_file(exported_file)
 # Run the test cases in this file when it is executed as a script.
 if __name__ == '__main__':
  tf.test.main()
--- a/mediapipe/model_maker/python/vision/BUILD
+++ b/mediapipe/model_maker/python/vision/BUILD
@ -0,0 +1,19 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 # Targets in this package default to being visible to every package under
 # //mediapipe. No build targets are declared here.
 package(
    default_visibility = ["//mediapipe:__subpackages__"],
 )
 licenses(["notice"])
--- a/mediapipe/model_maker/python/vision/__init__.py
+++ b/mediapipe/model_maker/python/vision/__init__.py
@ -0,0 +1,13 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
--- a/mediapipe/model_maker/python/vision/image_classifier/BUILD
+++ b/mediapipe/model_maker/python/vision/image_classifier/BUILD
@ -0,0 +1,111 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 # Placeholder for internal Python library rule.
 # Placeholder for internal Python strict library and test compatibility macro.
 licenses(["notice"])
 # Targets in this package default to being visible to every package under
 # //mediapipe.
 package(
    default_visibility = ["//mediapipe:__subpackages__"],
 )
 # The package's __init__.py together with the libraries it imports.
 py_library(
    name = "image_classifier_import",
    srcs = ["__init__.py"],
    deps = [
        ":dataset",
        ":hyperparameters",
        ":image_classifier",
        ":model_spec",
    ],
 )
 # Library for model_spec.py.
 py_library(
    name = "model_spec",
    srcs = ["model_spec.py"],
 )
 # Unit test for :model_spec.
 py_test(
    name = "model_spec_test",
    srcs = ["model_spec_test.py"],
    deps = [":model_spec"],
 )
 # Library for dataset.py; builds on the core classification dataset.
 py_library(
    name = "dataset",
    srcs = ["dataset.py"],
    deps = ["//mediapipe/model_maker/python/core/data:classification_dataset"],
 )
 # Unit test for :dataset.
 py_test(
    name = "dataset_test",
    srcs = ["dataset_test.py"],
    deps = [":dataset"],
 )
 # Library for hyperparameters.py (the HParams dataclass).
 py_library(
    name = "hyperparameters",
    srcs = ["hyperparameters.py"],
 )
 # Library for train_image_classifier_lib.py.
 py_library(
    name = "train_image_classifier_lib",
    srcs = ["train_image_classifier_lib.py"],
    deps = [
        ":hyperparameters",
        "//mediapipe/model_maker/python/core/utils:model_util",
    ],
 )
 # Library for image_classifier.py (the ImageClassifier class).
 py_library(
    name = "image_classifier",
    srcs = ["image_classifier.py"],
    deps = [
        ":hyperparameters",
        ":model_spec",
        ":train_image_classifier_lib",
        "//mediapipe/model_maker/python/core/data:classification_dataset",
        "//mediapipe/model_maker/python/core/tasks:classifier",
        "//mediapipe/model_maker/python/core/utils:image_preprocessing",
        "//mediapipe/model_maker/python/core/utils:model_util",
        "//mediapipe/model_maker/python/core/utils:quantization",
    ],
 )
 # Test-only library wrapping image_classifier_test.py; it is the single dep of
 # the image_classifier_test target below.
 py_library(
    name = "image_classifier_test_lib",
    testonly = 1,
    srcs = ["image_classifier_test.py"],
    deps = [":image_classifier_import"],
 )
 # Test target split into 2 shards and tagged "requires-net:external"
 # (presumably because it needs external network access -- confirm).
 py_test(
    name = "image_classifier_test",
    srcs = ["image_classifier_test.py"],
    shard_count = 2,
    tags = ["requires-net:external"],
    deps = [
        ":image_classifier_test_lib",
    ],
 )
 # Binary target for image_classifier_demo.py.
 py_binary(
    name = "image_classifier_demo",
    srcs = ["image_classifier_demo.py"],
    deps = [
        ":image_classifier_import",
        "//mediapipe/model_maker/python/core/utils:quantization",
    ],
 )
--- a/mediapipe/model_maker/python/vision/image_classifier/__init__.py
+++ b/mediapipe/model_maker/python/vision/image_classifier/__init__.py
@ -0,0 +1,25 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """MediaPipe Model Maker Python Public API For Image Classifier."""
 from mediapipe.model_maker.python.vision.image_classifier import dataset
 from mediapipe.model_maker.python.vision.image_classifier import hyperparameters
 from mediapipe.model_maker.python.vision.image_classifier import image_classifier
 from mediapipe.model_maker.python.vision.image_classifier import model_spec
 # Package-level aliases: expose the main classes of the submodules imported
 # above directly on this package.
 ImageClassifier = image_classifier.ImageClassifier
 HParams = hyperparameters.HParams
 Dataset = dataset.Dataset
 ModelSpec = model_spec.ModelSpec
 SupportedModels = model_spec.SupportedModels
--- a/mediapipe/model_maker/python/vision/image_classifier/dataset.py
+++ b/mediapipe/model_maker/python/vision/image_classifier/dataset.py
@ -0,0 +1,139 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """Image classifier dataset library."""
 import os
 import random
 from typing import List, Optional, Tuple
 import tensorflow as tf
 import tensorflow_datasets as tfds
 from mediapipe.model_maker.python.core.data import classification_dataset
 def _load_image(path: str) -> tf.Tensor:
  """Reads the file at `path` and decodes it into a 3-channel image tensor.

  Content recognized by `tf.image.is_jpeg` is decoded as JPEG; everything else
  is handed to the PNG decoder.

  Args:
    path: Path of the image file to read.

  Returns:
    The decoded image tensor.
  """
  raw_bytes = tf.io.read_file(path)

  def _decode_as_jpeg():
    return tf.image.decode_jpeg(raw_bytes, channels=3)

  def _decode_as_png():
    return tf.image.decode_png(raw_bytes, channels=3)

  return tf.cond(tf.image.is_jpeg(raw_bytes), _decode_as_jpeg, _decode_as_png)
 def _create_data(
    name: str, data: tf.data.Dataset, info: tfds.core.DatasetInfo,
    label_names: List[str]
 ) -> Optional[classification_dataset.ClassificationDataset]:
  """Builds a `Dataset` for one split of data loaded from tfds.

  Args:
    name: Name of the split to extract, e.g. 'train'.
    data: The loaded tfds data. It is looked up by split name (`data[name]`),
      so it is used as a mapping from split name to a dataset of examples.
    info: The tfds dataset info; supplies the number of examples of the split.
    label_names: Label class names passed on to the resulting `Dataset`.

  Returns:
    A `Dataset` of (image, label) pairs for the split, or None when `data` has
    no entry for `name`.
  """
  if name not in data:
    return None
  # Reduce every example to an (image, label) pair.
  split_ds = data[name].map(
      lambda example: (example['image'], example['label']))
  num_examples = info.splits[name].num_examples
  return Dataset(split_ds, num_examples, label_names)
 class Dataset(classification_dataset.ClassificationDataset):
  """Image classification dataset with folder and tfds loaders."""

  @classmethod
  def from_folder(
      cls,
      dirname: str,
      shuffle: bool = True) -> classification_dataset.ClassificationDataset:
    """Loads images and labels from the given directory.

    Every immediate subdirectory of `dirname` is one label, and the entries
    inside it are the images of that label. Label indices follow the sorted
    order of the subdirectory names.

    Args:
      dirname: Name of the directory containing the data files.
      shuffle: If true, the list of image paths is randomly shuffled before the
        dataset is built.

    Returns:
      Dataset containing images and labels and other related info.

    Raises:
      ValueError: if no entry matches `<dirname>/*/*`.
    """
    data_root = os.path.abspath(dirname)

    # Every entry one level below a label directory counts as an image.
    image_paths = list(tf.io.gfile.glob(data_root + r'/*/*'))
    num_images = len(image_paths)
    if not num_images:
      raise ValueError('Image size is zero')

    if shuffle:
      # Shuffle before labels are derived, so labels stay aligned with paths.
      random.shuffle(image_paths)

    label_names = sorted(
        entry for entry in os.listdir(data_root)
        if os.path.isdir(os.path.join(data_root, entry)))
    num_labels = len(label_names)
    label_to_index = {label: idx for idx, label in enumerate(label_names)}
    # The label of an image is the name of the directory that contains it.
    image_labels = [
        label_to_index[os.path.basename(os.path.dirname(image_path))]
        for image_path in image_paths
    ]

    image_ds = tf.data.Dataset.from_tensor_slices(image_paths).map(
        _load_image, num_parallel_calls=tf.data.AUTOTUNE)
    label_ds = tf.data.Dataset.from_tensor_slices(
        tf.cast(image_labels, tf.int64))
    # Pair every decoded image with its label index.
    image_label_ds = tf.data.Dataset.zip((image_ds, label_ds))

    tf.compat.v1.logging.info(
        'Load image with size: %d, num_label: %d, labels: %s.', num_images,
        num_labels, ', '.join(label_names))
    return Dataset(image_label_ds, num_images, label_names)

  @classmethod
  def load_tf_dataset(
      cls, name: str
  ) -> Tuple[Optional[classification_dataset.ClassificationDataset],
             Optional[classification_dataset.ClassificationDataset],
             Optional[classification_dataset.ClassificationDataset]]:
    """Loads data from tensorflow_datasets.

    Args:
      name: the registered name of the tfds.core.DatasetBuilder. Refer to the
        documentation of tfds.load for more details.

    Returns:
      A tuple of Datasets for the 'train', 'validation' and 'test' splits, in
      that order. The entry of a split that the loaded data does not contain
      is None.

    Raises:
      ValueError: if the features of the loaded dataset have no 'label' key.
    """
    data, info = tfds.load(name, with_info=True)
    if 'label' not in info.features:
      raise ValueError('info.features need to contain \'label\' key.')
    label_names = info.features['label'].names
    return tuple(
        _create_data(split, data, info, label_names)
        for split in ('train', 'validation', 'test'))
--- a/mediapipe/model_maker/python/vision/image_classifier/dataset_test.py
+++ b/mediapipe/model_maker/python/vision/image_classifier/dataset_test.py
@ -0,0 +1,108 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 import os
 import random
 import numpy as np
 import tensorflow as tf
 from mediapipe.model_maker.python.vision.image_classifier import dataset
 def _fill_image(rgb, image_size):
  r, g, b = rgb
  return np.broadcast_to(
      np.array([[[r, g, b]]], dtype=np.uint8),
      shape=(image_size, image_size, 3))
 def _write_filled_jpeg_file(path, rgb, image_size):
  """Saves a solid-color square image as a JPEG file at `path`.

  Args:
    path: Destination file path.
    rgb: Sequence of three channel values (red, green, blue).
    image_size: Height and width of the image in pixels.
  """
  solid_image = _fill_image(rgb, image_size)
  tf.keras.preprocessing.image.save_img(
      path, solid_image, data_format='channels_last', file_format='jpeg')
 class DatasetTest(tf.test.TestCase):
  """Tests for the image classifier `dataset.Dataset`."""

  def setUp(self):
    """Creates a two-class image folder with one JPEG per class."""
    super().setUp()
    self.image_path = os.path.join(self.get_temp_dir(), 'random_image_dir')
    # Reuse the fixture directory when it already exists.
    if os.path.exists(self.image_path):
      return
    os.mkdir(self.image_path)
    for class_name in ('daisy', 'tulips'):
      class_subdir = os.path.join(self.image_path, class_name)
      os.mkdir(class_subdir)
      # One solid, randomly colored 224x224 image per class.
      _write_filled_jpeg_file(
          os.path.join(class_subdir, '0.jpeg'),
          [random.uniform(0, 255) for _ in range(3)], 224)

  def test_split(self):
    """`split(0.5)` halves the data in order and keeps the label metadata."""
    ds = tf.data.Dataset.from_tensor_slices([[0, 1], [1, 1], [0, 0], [1, 0]])
    data = dataset.Dataset(ds, 4, ['pos', 'neg'])
    train_data, test_data = data.split(0.5)

    # The first half of the elements ends up in the training part.
    self.assertLen(train_data, 2)
    for i, elem in enumerate(train_data._dataset):
      self.assertTrue((elem.numpy() == np.array([i, 1])).all())
    self.assertEqual(train_data.num_classes, 2)
    self.assertEqual(train_data.index_to_label, ['pos', 'neg'])

    # The second half ends up in the test part.
    self.assertLen(test_data, 2)
    for i, elem in enumerate(test_data._dataset):
      self.assertTrue((elem.numpy() == np.array([i, 0])).all())
    self.assertEqual(test_data.num_classes, 2)
    self.assertEqual(test_data.index_to_label, ['pos', 'neg'])

  def test_from_folder(self):
    """`from_folder` yields one correctly labeled image per class folder."""
    data = dataset.Dataset.from_folder(self.image_path)

    self.assertLen(data, 2)
    self.assertEqual(data.num_classes, 2)
    self.assertEqual(data.index_to_label, ['daisy', 'tulips'])
    for image, label in data.gen_tf_dataset():
      self.assertTrue(label.numpy() == 1 or label.numpy() == 0)
      # Label 0 is 'daisy' and label 1 is 'tulips' (sorted folder names).
      if label.numpy() == 0:
        raw_image_tensor = dataset._load_image(
            os.path.join(self.image_path, 'daisy', '0.jpeg'))
      else:
        raw_image_tensor = dataset._load_image(
            os.path.join(self.image_path, 'tulips', '0.jpeg'))
      self.assertTrue((image.numpy() == raw_image_tensor.numpy()).all())

  def test_from_tfds(self):
    """Loading 'beans' from tfds gives the expected three splits."""
    # TODO: Remove this once tfds download error is fixed.
    self.skipTest('Temporarily skip the unittest due to tfds download error.')
    # `dataset.Dataset` exposes the tfds loader as `load_tf_dataset`.
    train_data, validation_data, test_data = (
        dataset.Dataset.load_tf_dataset('beans'))
    self.assertIsInstance(train_data.gen_tf_dataset(), tf.data.Dataset)
    self.assertLen(train_data, 1034)
    self.assertEqual(train_data.num_classes, 3)
    self.assertEqual(train_data.index_to_label,
                     ['angular_leaf_spot', 'bean_rust', 'healthy'])

    self.assertIsInstance(validation_data.gen_tf_dataset(), tf.data.Dataset)
    self.assertLen(validation_data, 133)
    self.assertEqual(validation_data.num_classes, 3)
    self.assertEqual(validation_data.index_to_label,
                     ['angular_leaf_spot', 'bean_rust', 'healthy'])

    self.assertIsInstance(test_data.gen_tf_dataset(), tf.data.Dataset)
    self.assertLen(test_data, 128)
    self.assertEqual(test_data.num_classes, 3)
    self.assertEqual(test_data.index_to_label,
                     ['angular_leaf_spot', 'bean_rust', 'healthy'])
 # Run the test cases in this file when it is executed as a script.
 if __name__ == '__main__':
  tf.test.main()
--- a/mediapipe/model_maker/python/vision/image_classifier/hyperparameters.py
+++ b/mediapipe/model_maker/python/vision/image_classifier/hyperparameters.py
@ -0,0 +1,74 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """Hyperparameters for training image classification models."""
 import dataclasses
 import tempfile
 from typing import Optional
 # TODO: Expose other hyperparameters, e.g. data augmentation
 # hyperparameters if requested.
@dataclasses.dataclass
class HParams:
  """The hyperparameters for training image classifiers.

  The hyperparameters include:
    # Parameters about training data.
    do_fine_tuning: If true, the base module is trained together with the
      classification layer on top.
    shuffle: A boolean controlling if shuffle the dataset. Default to false.
    # Parameters about training configuration
    train_epochs: Training will do this many iterations over the dataset.
    batch_size: Each training step samples a batch of this many images.
    learning_rate: The learning rate to use for gradient descent training.
    dropout_rate: The fraction of the input units to drop, used in dropout
      layer.
    l1_regularizer: A regularizer that applies a L1 regularization penalty.
    l2_regularizer: A regularizer that applies a L2 regularization penalty.
    label_smoothing: Amount of label smoothing to apply. See tf.keras.losses for
      more details.
    do_data_augmentation: A boolean controlling whether the training dataset is
      augmented by randomly distorting input images, including random cropping,
      flipping, etc. See utils.image_preprocessing documentation for details.
    steps_per_epoch: An optional integer indicating the number of training
      steps per epoch. If not set, the training pipeline calculates the default
      steps per epoch as the training dataset size divided by batch size.
    decay_samples: Number of training samples used to calculate the decay steps
      and create the training optimizer.
    warmup_epochs: Number of warmup epochs for a linearly increasing warmup
      schedule on learning rate. Used to set up warmup schedule by
      model_util.WarmUp.
    # Parameters about the saved checkpoint
    model_dir: The location of model checkpoint files and exported model files.
      Defaults to a new temporary directory created for each instance.
  """
  # Parameters about training data
  do_fine_tuning: bool = False
  shuffle: bool = False
  # Parameters about training configuration
  train_epochs: int = 5
  batch_size: int = 32
  learning_rate: float = 0.005
  dropout_rate: float = 0.2
  l1_regularizer: float = 0.0
  l2_regularizer: float = 0.0001
  label_smoothing: float = 0.1
  do_data_augmentation: bool = True
  steps_per_epoch: Optional[int] = None
  decay_samples: int = 10000 * 256
  warmup_epochs: int = 2
  # Parameters about the saved checkpoint
  # A default factory creates the temporary directory when an instance is
  # constructed without `model_dir`. A plain `tempfile.mkdtemp()` default would
  # run once at import time and make every instance share that one directory.
  model_dir: str = dataclasses.field(default_factory=tempfile.mkdtemp)
--- a/mediapipe/model_maker/python/vision/image_classifier/image_classifier.py
+++ b/mediapipe/model_maker/python/vision/image_classifier/image_classifier.py
@ -0,0 +1,172 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """APIs to train image classifier model."""
 from typing import Any, List, Optional
 import tensorflow as tf
 import tensorflow_hub as hub
 from mediapipe.model_maker.python.core.data import classification_dataset as classification_ds
 from mediapipe.model_maker.python.core.tasks import classifier
 from mediapipe.model_maker.python.core.utils import image_preprocessing
 from mediapipe.model_maker.python.core.utils import model_util
 from mediapipe.model_maker.python.core.utils import quantization
 from mediapipe.model_maker.python.vision.image_classifier import hyperparameters as hp
 from mediapipe.model_maker.python.vision.image_classifier import model_spec as ms
 from mediapipe.model_maker.python.vision.image_classifier import train_image_classifier_lib
 class ImageClassifier(classifier.Classifier):
  """ImageClassifier for building image classification model.

  The model is a TF Hub feature extractor followed by a dropout layer and a
  softmax dense head. Instances are normally obtained through `create`, which
  builds the model and trains it in one call.
  """

  def __init__(self, model_spec: ms.ModelSpec, index_to_label: List[Any],
               hparams: hp.HParams):
    """Initializes ImageClassifier class.

    Args:
      model_spec: Specification for the model.
      index_to_label: A list that maps from index to label class name.
      hparams: The hyperparameters for training image classifier.
    """
    super().__init__(
        model_spec=model_spec,
        index_to_label=index_to_label,
        shuffle=hparams.shuffle,
        full_train=hparams.do_fine_tuning)
    self._hparams = hparams
    # The same preprocessor is reused for training, validation and export.
    self._preprocess = image_preprocessing.Preprocessor(
        input_shape=self._model_spec.input_image_shape,
        num_classes=self._num_classes,
        mean_rgb=self._model_spec.mean_rgb,
        stddev_rgb=self._model_spec.stddev_rgb,
        use_augmentation=hparams.do_data_augmentation)
    self._history = None  # Training history returned from `keras_model.fit`.

  @classmethod
  def create(
      cls,
      model_spec: ms.SupportedModels,
      train_data: classification_ds.ClassificationDataset,
      validation_data: classification_ds.ClassificationDataset,
      hparams: Optional[hp.HParams] = None,
  ) -> 'ImageClassifier':
    """Creates and trains an image classifier.

    Loads data and trains the model based on data for image classification.

    Args:
      model_spec: Specification for the model.
      train_data: Training data.
      validation_data: Validation data.
      hparams: Hyperparameters for training image classifier. When None, a
        default-constructed `hp.HParams` is used.

    Returns:
      An instance based on ImageClassifier.
    """
    if hparams is None:
      hparams = hp.HParams()

    spec = ms.SupportedModels.get(model_spec)
    image_classifier = cls(
        model_spec=spec,
        index_to_label=train_data.index_to_label,
        hparams=hparams)

    image_classifier._create_model()

    # `_train` logs the start of training itself, so it is not logged here.
    image_classifier._train(
        train_data=train_data, validation_data=validation_data)

    return image_classifier

  def _train(self, train_data: classification_ds.ClassificationDataset,
             validation_data: classification_ds.ClassificationDataset):
    """Trains the model with input train_data.

    The training results are recorded by a self._history object returned by
    tf.keras.Model.fit().

    Args:
      train_data: Training data.
      validation_data: Validation data.

    Raises:
      ValueError: If train_data holds fewer examples than one batch.
    """
    tf.compat.v1.logging.info('Training the models...')
    hparams = self._hparams
    if len(train_data) < hparams.batch_size:
      raise ValueError('The size of the train_data (%d) couldn\'t be smaller '
                       'than batch_size (%d). To solve this problem, set '
                       'the batch_size smaller or increase the size of the '
                       'train_data.' % (len(train_data), hparams.batch_size))

    train_dataset = train_data.gen_tf_dataset(
        batch_size=hparams.batch_size,
        is_training=True,
        shuffle=self._shuffle,
        preprocess=self._preprocess)
    # NOTE: the resolved value is written back onto the shared hparams object
    # because `train_model` reads `hparams.steps_per_epoch`.
    hparams.steps_per_epoch = model_util.get_steps_per_epoch(
        steps_per_epoch=hparams.steps_per_epoch,
        batch_size=hparams.batch_size,
        train_data=train_data)
    train_dataset = train_dataset.take(count=hparams.steps_per_epoch)

    validation_dataset = validation_data.gen_tf_dataset(
        batch_size=hparams.batch_size,
        is_training=False,
        preprocess=self._preprocess)

    # Train the model.
    self._history = train_image_classifier_lib.train_model(
        model=self._model,
        hparams=hparams,
        train_ds=train_dataset,
        validation_ds=validation_dataset)

  def _create_model(self):
    """Creates the classifier model from TFHub pretrained models."""
    module_layer = hub.KerasLayer(
        handle=self._model_spec.uri, trainable=self._hparams.do_fine_tuning)

    image_size = self._model_spec.input_image_shape

    self._model = tf.keras.Sequential([
        tf.keras.Input(shape=(image_size[0], image_size[1], 3)), module_layer,
        tf.keras.layers.Dropout(rate=self._hparams.dropout_rate),
        tf.keras.layers.Dense(
            units=self._num_classes,
            activation='softmax',
            kernel_regularizer=tf.keras.regularizers.l1_l2(
                l1=self._hparams.l1_regularizer,
                l2=self._hparams.l2_regularizer))
    ])
    # `summary()` prints the table itself and returns None; wrapping it in
    # `print` would emit an extra "None" line.
    self._model.summary()

  def export_model(
      self,
      model_name: str = 'model.tflite',
      quantization_config: Optional[quantization.QuantizationConfig] = None):
    """Converts the model to the requested formats and exports to a file.

    Args:
      model_name: File name to save tflite model. It is passed to
        `export_tflite` together with `hparams.model_dir` as the export
        directory.
      quantization_config: The configuration for model quantization.
    """
    super().export_tflite(
        self._hparams.model_dir,
        model_name,
        quantization_config,
        preprocess=self._preprocess)
--- a/mediapipe/model_maker/python/vision/image_classifier/image_classifier_demo.py
+++ b/mediapipe/model_maker/python/vision/image_classifier/image_classifier_demo.py
@ -0,0 +1,106 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """Demo for making an image classifier model by MediaPipe Model Maker."""
 import os
 # Dependency imports
 from absl import app
 from absl import flags
 from absl import logging
 import tensorflow as tf
 from mediapipe.model_maker.python.core.utils import quantization
 from mediapipe.model_maker.python.vision import image_classifier
 FLAGS = flags.FLAGS
 def define_flags() -> None:
  """Registers the command-line flags used by the image classifier demo.

  `export_dir` is the only required flag; the others have defaults.
  """
  flags.DEFINE_string(
      name='export_dir',
      default=None,
      help='The directory to save exported files.')
  flags.DEFINE_string(
      name='input_data_dir',
      default=None,
      help="""The directory with input training data. If the training data is not
      specified, the pipeline will download a default training dataset.""")
  flags.DEFINE_enum_class(
      name='spec',
      default=image_classifier.SupportedModels.EFFICIENTNET_LITE0,
      enum_class=image_classifier.SupportedModels,
      help='The image classifier to run.')
  flags.DEFINE_enum(
      name='quantization',
      default=None,
      enum_values=['dynamic', 'int8', 'float16'],
      help='The quantization method to use when exporting the model.')
  flags.mark_flag_as_required('export_dir')
 def download_demo_data() -> str:
  """Fetches the flower photos demo archive and returns the image folder path.

  Returns:
    Path of the `flower_photos` folder located next to the path returned by
    `tf.keras.utils.get_file`.
  """
  downloaded_path = tf.keras.utils.get_file(
      fname='flower_photos.tgz',
      origin='https://storage.googleapis.com/download.tensorflow.org/example_images/flower_photos.tgz',
      extract=True)
  parent_dir = os.path.dirname(downloaded_path)
  return os.path.join(parent_dir, 'flower_photos')  # folder name
 def run(data_dir: str, export_dir: str,
        model_spec: image_classifier.SupportedModels,
        quantization_option: str) -> None:
  """Runs demo.

  Trains an image classifier on the images under `data_dir`, prints the test
  accuracy, then exports the model and its labels.

  Args:
    data_dir: Folder passed to `image_classifier.Dataset.from_folder`.
    export_dir: Used both as the model directory of the hyperparameters and as
      the destination of the exported labels.
    model_spec: Which supported model to train.
    quantization_option: One of 'dynamic', 'int8', 'float16', or None for no
      quantization.

  Raises:
    ValueError: If `quantization_option` is not one of the values above.
  """
  data = image_classifier.Dataset.from_folder(data_dir)
  # Successive splits: `split(0.8)` for training, then `split(0.5)` of the
  # remainder for validation and test.
  train_data, rest_data = data.split(0.8)
  validation_data, test_data = rest_data.split(0.5)

  model = image_classifier.ImageClassifier.create(
      model_spec=model_spec,
      train_data=train_data,
      validation_data=validation_data,
      hparams=image_classifier.HParams(model_dir=export_dir))

  _, acc = model.evaluate(test_data)
  print('Test accuracy: %f' % acc)

  if quantization_option is None:
    quantization_config = None
  elif quantization_option == 'dynamic':
    quantization_config = quantization.QuantizationConfig.for_dynamic()
  elif quantization_option == 'int8':
    quantization_config = quantization.QuantizationConfig.for_int8(train_data)
  elif quantization_option == 'float16':
    quantization_config = quantization.QuantizationConfig.for_float16()
  else:
    # Report the offending option value, not the imported `quantization`
    # module.
    raise ValueError(
        f'Quantization: {quantization_option} is not recognized')

  model.export_model(quantization_config=quantization_config)
  model.export_labels(export_dir)
 def main(_) -> None:
  """Entry point for `app.run`: resolves the flags and runs the demo."""
  logging.set_verbosity(logging.INFO)

  # Fall back to the downloadable demo dataset when no input folder is given.
  data_dir = FLAGS.input_data_dir
  if data_dir is None:
    data_dir = download_demo_data()

  run(
      data_dir=data_dir,
      export_dir=os.path.expanduser(FLAGS.export_dir),
      model_spec=FLAGS.spec,
      quantization_option=FLAGS.quantization)
 # Script entry point.
 if __name__ == '__main__':
  # Flags are registered before `app.run` is called, so they exist by the time
  # `main` reads them from FLAGS.
  define_flags()
  app.run(main)
--- a/mediapipe/model_maker/python/vision/image_classifier/image_classifier_test.py
+++ b/mediapipe/model_maker/python/vision/image_classifier/image_classifier_test.py
@ -0,0 +1,122 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the 'License');
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an 'AS IS' BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 import os
 from absl.testing import parameterized
 import numpy as np
 import tensorflow as tf
 from mediapipe.model_maker.python.vision import image_classifier
 def _fill_image(rgb, image_size):
  r, g, b = rgb
  return np.broadcast_to(
      np.array([[[r, g, b]]], dtype=np.uint8),
      shape=(image_size, image_size, 3))
 class ImageClassifierTest(tf.test.TestCase, parameterized.TestCase):
  """Trains each supported model on a tiny synthetic three-colour dataset."""

  IMAGE_SIZE = 24
  IMAGES_PER_CLASS = 2
  CMY_NAMES_AND_RGB_VALUES = (
      ('cyan', (0, 255, 255)),
      ('magenta', (255, 0, 255)),
      ('yellow', (255, 255, 0)),
  )
  # Test case names; upper-cased they are the `SupportedModels` member names.
  _MODEL_NAMES = (
      'mobilenet_v2',
      'resnet_50',
      'efficientnet_lite0',
      'efficientnet_lite1',
      'efficientnet_lite2',
      'efficientnet_lite3',
      'efficientnet_lite4',
  )

  def _gen(self):
    """Yields (image, label index) pairs, IMAGES_PER_CLASS per colour."""
    for label_index, (_, rgb) in enumerate(self.CMY_NAMES_AND_RGB_VALUES):
      for _ in range(self.IMAGES_PER_CLASS):
        yield (_fill_image(rgb, self.IMAGE_SIZE), label_index)

  def _gen_cmy_data(self):
    """Wraps the generated images in an `image_classifier.Dataset`."""
    image_shape = tf.TensorShape([self.IMAGE_SIZE, self.IMAGE_SIZE, 3])
    label_shape = tf.TensorShape([])
    ds = tf.data.Dataset.from_generator(
        self._gen,
        output_types=(tf.uint8, tf.int64),
        output_shapes=(image_shape, label_shape))
    label_names = [name for name, _ in self.CMY_NAMES_AND_RGB_VALUES]
    num_examples = self.IMAGES_PER_CLASS * len(self.CMY_NAMES_AND_RGB_VALUES)
    return image_classifier.Dataset(ds, num_examples, label_names)

  def setUp(self):
    super().setUp()
    # 90/10 split between training data and held-out data.
    self.train_data, self.test_data = self._gen_cmy_data().split(0.9)

  @parameterized.named_parameters(*[
      dict(
          testcase_name=spec_name,
          model_spec=getattr(image_classifier.SupportedModels,
                             spec_name.upper()),
          hparams=image_classifier.HParams(
              train_epochs=1, batch_size=1, shuffle=True))
      for spec_name in _MODEL_NAMES
  ])
  def test_create_and_train_model(self,
                                  model_spec: image_classifier.SupportedModels,
                                  hparams: image_classifier.HParams):
    trained = image_classifier.ImageClassifier.create(
        model_spec=model_spec,
        train_data=self.train_data,
        hparams=hparams,
        validation_data=self.test_data)
    self._test_accuracy(trained)

  def test_efficientnetlite0_model_with_model_maker_retraining_lib(self):
    trained = image_classifier.ImageClassifier.create(
        model_spec=image_classifier.SupportedModels.EFFICIENTNET_LITE0,
        train_data=self.train_data,
        hparams=image_classifier.HParams(
            train_epochs=1, batch_size=1, shuffle=True),
        validation_data=self.test_data)
    self._test_accuracy(trained)

  def _test_accuracy(self, model, threshold=0.0):
    """Asserts that the accuracy on the held-out data reaches `threshold`."""
    metrics = model.evaluate(self.test_data)
    _, accuracy = metrics
    self.assertGreaterEqual(accuracy, threshold)
 # Entry point when the test file is executed directly.
 if __name__ == '__main__':
  # Load compressed models from tensorflow_hub. The variable is set before the
  # test runner starts.
  os.environ['TFHUB_MODEL_LOAD_FORMAT'] = 'COMPRESSED'
  tf.test.main()
--- a/mediapipe/model_maker/python/vision/image_classifier/model_spec.py
+++ b/mediapipe/model_maker/python/vision/image_classifier/model_spec.py
@ -0,0 +1,104 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """Image classifier model specification."""
 import enum
 import functools
 from typing import List, Optional
 class ModelSpec:
  """Specification of image classifier model.

  Attributes:
    uri: URI to the pretrained model.
    name: Model spec name.
    input_image_shape: Input image shape as a list of two ints.
    mean_rgb: Class-level default passed as `mean_rgb` to the image
      preprocessor.
    stddev_rgb: Class-level default passed as `stddev_rgb` to the image
      preprocessor.
  """

  mean_rgb = [0.0]
  stddev_rgb = [255.0]

  def __init__(self,
               uri: str,
               input_image_shape: Optional[List[int]] = None,
               name: str = ''):
    """Initializes a new instance of the `ModelSpec` class.

    Args:
      uri: str, URI to the pretrained model.
      input_image_shape: list of int, input image shape. Default: [224, 224].
      name: str, model spec name.
    """
    self.uri = uri
    self.name = name
    if input_image_shape is None:
      input_image_shape = [224, 224]
    # Store a private copy: the predefined `functools.partial` specs pass the
    # same list object on every call, so keeping a reference would make all
    # instances (and the partial itself) share one mutable list.
    self.input_image_shape = list(input_image_shape)
 # Predefined model spec factories. Each one is a `functools.partial` over
 # `ModelSpec`, so calling it with no arguments builds a new `ModelSpec`.
 # Factories that do not pass `input_image_shape` use the `ModelSpec` default
 # of [224, 224].
 mobilenet_v2_spec = functools.partial(
    ModelSpec,
    uri='https://tfhub.dev/google/tf2-preview/mobilenet_v2/feature_vector/4',
    name='mobilenet_v2')
 resnet_50_spec = functools.partial(
    ModelSpec,
    uri='https://tfhub.dev/google/imagenet/resnet_v2_50/feature_vector/4',
    name='resnet_50')
 efficientnet_lite0_spec = functools.partial(
    ModelSpec,
    uri='https://tfhub.dev/tensorflow/efficientnet/lite0/feature-vector/2',
    name='efficientnet_lite0')
 # The remaining EfficientNet-Lite variants set their input shape explicitly.
 efficientnet_lite1_spec = functools.partial(
    ModelSpec,
    uri='https://tfhub.dev/tensorflow/efficientnet/lite1/feature-vector/2',
    input_image_shape=[240, 240],
    name='efficientnet_lite1')
 efficientnet_lite2_spec = functools.partial(
    ModelSpec,
    uri='https://tfhub.dev/tensorflow/efficientnet/lite2/feature-vector/2',
    input_image_shape=[260, 260],
    name='efficientnet_lite2')
 efficientnet_lite3_spec = functools.partial(
    ModelSpec,
    uri='https://tfhub.dev/tensorflow/efficientnet/lite3/feature-vector/2',
    input_image_shape=[280, 280],
    name='efficientnet_lite3')
 efficientnet_lite4_spec = functools.partial(
    ModelSpec,
    uri='https://tfhub.dev/tensorflow/efficientnet/lite4/feature-vector/2',
    input_image_shape=[300, 300],
    name='efficientnet_lite4')
 # TODO: Document the exposed models.
@enum.unique
class SupportedModels(enum.Enum):
  """Image classifier model supported by model maker.

  Each member's value is a `functools.partial` factory; `get` calls it to
  build the corresponding `ModelSpec`.
  """
  # NOTE(review): Python 3.13 emits a FutureWarning for `functools.partial`
  # objects assigned in a class body; confirm whether these members need
  # wrapping in `enum.member` once the minimum Python version allows it.
  MOBILENET_V2 = mobilenet_v2_spec
  RESNET_50 = resnet_50_spec
  EFFICIENTNET_LITE0 = efficientnet_lite0_spec
  EFFICIENTNET_LITE1 = efficientnet_lite1_spec
  EFFICIENTNET_LITE2 = efficientnet_lite2_spec
  EFFICIENTNET_LITE3 = efficientnet_lite3_spec
  EFFICIENTNET_LITE4 = efficientnet_lite4_spec

  @classmethod
  def get(cls, spec: 'SupportedModels') -> 'ModelSpec':
    """Gets model spec from the input enum and initializes it.

    Args:
      spec: A member of this enum.

    Returns:
      A newly constructed `ModelSpec` for the requested model.

    Raises:
      TypeError: If `spec` is not a member of this enum.
    """
    # Use isinstance rather than `spec not in cls`: a containment check on an
    # Enum class raises its own TypeError for non-enum operands on Python
    # 3.8-3.11 and accepts raw member values on 3.12+, so it does not reliably
    # produce the error below.
    if not isinstance(spec, cls):
      raise TypeError('Unsupported image classifier spec: {}'.format(spec))

    return spec.value()
--- a/mediapipe/model_maker/python/vision/image_classifier/model_spec_test.py
+++ b/mediapipe/model_maker/python/vision/image_classifier/model_spec_test.py
@ -0,0 +1,93 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the 'License');
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an 'AS IS' BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 import os
 from typing import Callable, List
 from absl.testing import parameterized
 import tensorflow as tf
 from mediapipe.model_maker.python.vision.image_classifier import model_spec as ms
 class ModelSpecTest(tf.test.TestCase, parameterized.TestCase):
  """Checks the predefined spec factories and direct `ModelSpec` creation."""

  @parameterized.named_parameters(
      {
          'testcase_name': 'mobilenet_v2_spec_test',
          'model_spec': ms.mobilenet_v2_spec,
          'expected_uri': 'https://tfhub.dev/google/tf2-preview/mobilenet_v2/feature_vector/4',
          'expected_name': 'mobilenet_v2',
          'expected_input_image_shape': [224, 224],
      },
      {
          'testcase_name': 'resnet_50_spec_test',
          'model_spec': ms.resnet_50_spec,
          'expected_uri': 'https://tfhub.dev/google/imagenet/resnet_v2_50/feature_vector/4',
          'expected_name': 'resnet_50',
          'expected_input_image_shape': [224, 224],
      },
      {
          'testcase_name': 'efficientnet_lite0_spec_test',
          'model_spec': ms.efficientnet_lite0_spec,
          'expected_uri': 'https://tfhub.dev/tensorflow/efficientnet/lite0/feature-vector/2',
          'expected_name': 'efficientnet_lite0',
          'expected_input_image_shape': [224, 224],
      },
      {
          'testcase_name': 'efficientnet_lite1_spec_test',
          'model_spec': ms.efficientnet_lite1_spec,
          'expected_uri': 'https://tfhub.dev/tensorflow/efficientnet/lite1/feature-vector/2',
          'expected_name': 'efficientnet_lite1',
          'expected_input_image_shape': [240, 240],
      },
      {
          'testcase_name': 'efficientnet_lite2_spec_test',
          'model_spec': ms.efficientnet_lite2_spec,
          'expected_uri': 'https://tfhub.dev/tensorflow/efficientnet/lite2/feature-vector/2',
          'expected_name': 'efficientnet_lite2',
          'expected_input_image_shape': [260, 260],
      },
      {
          'testcase_name': 'efficientnet_lite3_spec_test',
          'model_spec': ms.efficientnet_lite3_spec,
          'expected_uri': 'https://tfhub.dev/tensorflow/efficientnet/lite3/feature-vector/2',
          'expected_name': 'efficientnet_lite3',
          'expected_input_image_shape': [280, 280],
      },
      {
          'testcase_name': 'efficientnet_lite4_spec_test',
          'model_spec': ms.efficientnet_lite4_spec,
          'expected_uri': 'https://tfhub.dev/tensorflow/efficientnet/lite4/feature-vector/2',
          'expected_name': 'efficientnet_lite4',
          'expected_input_image_shape': [300, 300],
      },
  )
  def test_predefiend_spec(self, model_spec: Callable[..., ms.ModelSpec],
                           expected_uri: str, expected_name: str,
                           expected_input_image_shape: List[int]):
    # Each predefined spec is a factory; calling it builds the ModelSpec.
    built = model_spec()
    self.assertIsInstance(built, ms.ModelSpec)
    self.assertEqual(built.uri, expected_uri)
    self.assertEqual(built.name, expected_name)
    self.assertEqual(built.input_image_shape, expected_input_image_shape)

  def test_create_spec(self):
    uri = 'https://custom_model'
    name = 'custom_model'
    custom = ms.ModelSpec(uri=uri, input_image_shape=[128, 128], name=name)
    self.assertEqual(custom.uri, 'https://custom_model')
    self.assertEqual(custom.name, 'custom_model')
    self.assertEqual(custom.input_image_shape, [128, 128])
 # Entry point when the test file is executed directly.
 if __name__ == '__main__':
  # Load compressed models from tensorflow_hub. The variable is set before the
  # test runner starts.
  os.environ['TFHUB_MODEL_LOAD_FORMAT'] = 'COMPRESSED'
  tf.test.main()
--- a/mediapipe/model_maker/python/vision/image_classifier/train_image_classifier_lib.py
+++ b/mediapipe/model_maker/python/vision/image_classifier/train_image_classifier_lib.py
@ -0,0 +1,103 @@
 # Copyright 2022 The MediaPipe Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """Library to train model."""
 import os
 from typing import List
 import tensorflow as tf
 from mediapipe.model_maker.python.core.utils import model_util
 from mediapipe.model_maker.python.vision.image_classifier import hyperparameters as hp
 def _create_optimizer(init_lr: float, decay_steps: int,
                      warmup_steps: int) -> tf.keras.optimizers.Optimizer:
  """Builds the RMSprop optimizer together with its learning rate schedule.

  The schedule is a Keras CosineDecay; when `warmup_steps` is non-zero it is
  wrapped in `model_util.WarmUp`.

  Args:
    init_lr: Initial learning rate.
    decay_steps: Number of steps to decay over.
    warmup_steps: Number of steps to do warmup for.

  Returns:
    A tf.keras.optimizers.Optimizer for model training.
  """
  schedule = tf.keras.experimental.CosineDecay(
      initial_learning_rate=init_lr, decay_steps=decay_steps, alpha=0.0)
  if warmup_steps:
    schedule = model_util.WarmUp(
        initial_learning_rate=init_lr,
        decay_schedule_fn=schedule,
        warmup_steps=warmup_steps)
  return tf.keras.optimizers.RMSprop(
      learning_rate=schedule, rho=0.9, momentum=0.9, epsilon=0.001)
 def _get_default_callbacks(model_dir: str) -> List[tf.keras.callbacks.Callback]:
  """Gets default callbacks.

  Args:
    model_dir: Directory under which the 'summaries' folder and the
      'checkpoint' path are placed.

  Returns:
    A list holding the TensorBoard callback followed by the checkpoint
    callback.
  """
  tensorboard = tf.keras.callbacks.TensorBoard(
      os.path.join(model_dir, 'summaries'))
  # Save checkpoint every 20 epochs.
  checkpointer = tf.keras.callbacks.ModelCheckpoint(
      os.path.join(model_dir, 'checkpoint'),
      save_weights_only=True,
      period=20)
  return [tensorboard, checkpointer]
 def train_model(model: tf.keras.Model, hparams: hp.HParams,
                train_ds: tf.data.Dataset,
                validation_ds: tf.data.Dataset) -> tf.keras.callbacks.History:
  """Compiles `model` and fits it with the given data and hyperparameters.

  Args:
    model: Input tf.keras.Model.
    hparams: Hyperparameters for training image classifier.
      `hparams.steps_per_epoch` is used in arithmetic here, so it must already
      be set to a number.
    train_ds: tf.data.Dataset, training data to be fed in tf.keras.Model.fit().
    validation_ds: tf.data.Dataset, validation data to be fed in
      tf.keras.Model.fit().

  Returns:
    The tf.keras.callbacks.History object returned by tf.keras.Model.fit().
  """
  steps_per_epoch = hparams.steps_per_epoch
  batch_size = hparams.batch_size

  # Learning rate is linear to batch size.
  scaled_lr = hparams.learning_rate * batch_size / 256

  # Decay over whichever is longer: the whole training run or the default
  # derived from `decay_samples`.
  decay_steps = max(steps_per_epoch * hparams.train_epochs,
                    hparams.decay_samples // batch_size)

  model.compile(
      optimizer=_create_optimizer(
          init_lr=scaled_lr,
          decay_steps=decay_steps,
          warmup_steps=hparams.warmup_epochs * steps_per_epoch),
      loss=tf.keras.losses.CategoricalCrossentropy(
          label_smoothing=hparams.label_smoothing),
      metrics=['accuracy'])

  # Train the model.
  return model.fit(
      x=train_ds,
      epochs=hparams.train_epochs,
      steps_per_epoch=steps_per_epoch,
      validation_data=validation_ds,
      callbacks=_get_default_callbacks(hparams.model_dir))
--- a/mediapipe/model_maker/requirements.txt
+++ b/mediapipe/model_maker/requirements.txt
@ -2,3 +2,5 @@ absl-py
 numpy
 opencv-contrib-python
 tensorflow
 tensorflow-datasets
 tensorflow-hub