Create a Keras AutoEnsemble API. #1
This API is under development, which means it is experimental and subject to change.

PiperOrigin-RevId: 275293435
csvillalta authored and cweill committed Oct 17, 2019
1 parent 4d34947 commit b57e43a
Showing 11 changed files with 242 additions and 0 deletions.
1 change: 1 addition & 0 deletions RELEASE.md
@@ -17,6 +17,7 @@ limitations under the License.
* Under development.
* Introduce support for `AutoEnsembleTPUEstimator`.
* Introduce experimental `adanet.keras.Model` API.
* Introduce experimental `adanet.keras.AutoEnsemble` API.

# Release 0.8.0
* Add support for TensorFlow 2.0.
1 change: 1 addition & 0 deletions adanet/__init__.py
@@ -23,6 +23,7 @@
from adanet import keras
from adanet import replay
from adanet import subnetwork
from adanet.autoensemble import AutoEnsemble
from adanet.autoensemble import AutoEnsembleEstimator
from adanet.autoensemble import AutoEnsembleSubestimator
from adanet.core import Estimator
2 changes: 2 additions & 0 deletions adanet/adanet_test.py
@@ -28,6 +28,7 @@ class AdaNetTest(tf.test.TestCase):

def test_public(self):
self.assertIsNotNone(adanet.__version__)
self.assertIsNotNone(adanet.AutoEnsemble)
self.assertIsNotNone(adanet.AutoEnsembleEstimator)
self.assertIsNotNone(adanet.AutoEnsembleSubestimator)
self.assertIsNotNone(adanet.distributed.PlacementStrategy)
@@ -50,6 +51,7 @@ def test_public(self):
self.assertIsNotNone(adanet.Estimator)
self.assertIsNotNone(adanet.Evaluator)
self.assertIsNotNone(adanet.keras.Model)
self.assertIsNotNone(adanet.keras.AutoEnsemble)
self.assertIsNotNone(adanet.Model)
self.assertIsNotNone(adanet.MixtureWeightType)
self.assertIsNotNone(adanet.replay.Config)
21 changes: 21 additions & 0 deletions adanet/autoensemble/BUILD
@@ -11,6 +11,16 @@ py_library(
visibility = ["//adanet:__subpackages__"],
deps = [
":estimator",
":keras",
],
)

py_library(
name = "keras",
srcs = ["keras.py"],
deps = [
":estimator",
"//adanet/keras:model",
],
)

@@ -26,6 +36,17 @@ py_library(
],
)

py_test(
name = "keras_test",
size = "medium",
srcs = ["keras_test.py"],
deps = [
":keras",
"//adanet/tf_compat",
"@absl_py//absl/testing:parameterized",
],
)

py_test(
name = "estimator_test",
size = "large",
2 changes: 2 additions & 0 deletions adanet/autoensemble/__init__.py
@@ -22,9 +22,11 @@
from adanet.autoensemble.estimator import AutoEnsembleEstimator
from adanet.autoensemble.estimator import AutoEnsembleSubestimator
from adanet.autoensemble.estimator import AutoEnsembleTPUEstimator
from adanet.autoensemble.keras import AutoEnsemble

__all__ = [
"AutoEnsembleEstimator",
"AutoEnsembleSubestimator",
"AutoEnsembleTPUEstimator",
"AutoEnsemble",
]
122 changes: 122 additions & 0 deletions adanet/autoensemble/keras.py
@@ -0,0 +1,122 @@
"""A Keras model that learns to ensemble.
Copyright 2019 The AdaNet Authors. All Rights Reserved.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

from absl import logging
from adanet.autoensemble.estimator import _GeneratorFromCandidatePool
from adanet.keras.model import Model


class AutoEnsemble(Model):
"""A :class:`tf.keras.Model` that learns to ensemble models."""

def __init__(self,
candidate_pool,
max_iteration_steps,
logits_dimension=1,
ensemblers=None,
ensemble_strategies=None,
evaluator=None,
adanet_loss_decay=.9,
filepath=None,
logits_fn=None,
last_layer_fn=None):
"""Instantiates an `adanet.AutoEnsemble`.
Args:
candidate_pool: List of :class:`tf.estimator.Estimator` and
:class:`AutoEnsembleSubestimator` objects, or dict of string name to
:class:`tf.estimator.Estimator` and :class:`AutoEnsembleSubestimator`
objects that are candidate subestimators to ensemble at each iteration.
The order does not directly affect which candidates will be included in
the final ensemble, but will affect the name of the candidate. When
using a dict, the string key becomes the candidate subestimator's name.
Alternatively, this argument can be a function that takes a `config`
argument and returns the aforementioned values in case the
objects need to be re-instantiated at each adanet iteration.
max_iteration_steps: Total number of steps for which to train candidates
per iteration. If :class:`OutOfRange` or :class:`StopIteration` occurs
in the middle, training stops before `max_iteration_steps` steps. When
:code:`None`, it will train the current iteration forever.
logits_dimension: The dimension of the final layer of any subnetworks.
ensemblers: An iterable of :class:`adanet.ensemble.Ensembler` objects that
define how to ensemble a group of subnetworks. If there are multiple,
each should have a different `name` property.
ensemble_strategies: An iterable of :class:`adanet.ensemble.Strategy`
objects that define the candidate ensembles of subnetworks to explore at
each iteration.
evaluator: An :class:`adanet.Evaluator` for candidate selection after all
subnetworks are done training. When :code:`None`, candidate selection
uses a moving average of their :class:`adanet.Ensemble` AdaNet loss
during training instead. In order to use the *AdaNet algorithm* as
described in [Cortes et al., '17], the given :class:`adanet.Evaluator`
must be created with the same dataset partition used during training.
Otherwise, this framework will perform *AdaNet.HoldOut* which uses a
holdout set for candidate selection, but does not benefit from learning
guarantees.
adanet_loss_decay: Float decay for the exponential moving average of the
AdaNet objective throughout training. This moving average is a data-driven
way of tracking the best candidate with only the training set.
filepath: Directory in which to save model parameters, graph, etc. This can
also be used to load checkpoints from the directory into an estimator to
continue training a previously saved model.
logits_fn: A function for fetching the subnetwork logits from a
:class:`tf.estimator.EstimatorSpec`, which should obey the
following signature:
- `Args`: Can only have the following argument:
- estimator_spec: The candidate's
:class:`tf.estimator.EstimatorSpec`.
- `Returns`: Logits :class:`tf.Tensor` or dict of string to logits
:class:`tf.Tensor` (for multi-head) for the candidate subnetwork
extracted from the given `estimator_spec`. When `None`, it will
default to returning `estimator_spec.predictions` when they are a
:class:`tf.Tensor` or the :class:`tf.Tensor` for the key 'logits'
when they are a dict of string to :class:`tf.Tensor`.
last_layer_fn: An optional function for fetching the subnetwork last_layer
from a :class:`tf.estimator.EstimatorSpec`, which should obey the
following signature:
- `Args`: Can only have the following argument:
- estimator_spec: The candidate's
:class:`tf.estimator.EstimatorSpec`.
- `Returns`: Last layer :class:`tf.Tensor` or dict of string to last
layer :class:`tf.Tensor` (for multi-head) for the candidate
subnetwork extracted from the given `estimator_spec`. The last_layer
can be used for learning ensembles or exporting them as embeddings.
When `None`, it will default to using the logits as the last_layer.
"""

logging.warning("The AdaNet AutoEnsemble API is currently experimental.")

subnetwork_generator = _GeneratorFromCandidatePool(candidate_pool,
logits_fn, last_layer_fn)

super(AutoEnsemble, self).__init__(
subnetwork_generator=subnetwork_generator,
max_iteration_steps=max_iteration_steps,
logits_dimension=logits_dimension,
ensemblers=ensemblers,
ensemble_strategies=ensemble_strategies,
evaluator=evaluator,
adanet_loss_decay=adanet_loss_decay,
filepath=filepath)




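For context, a minimal usage sketch of the new `adanet.keras.AutoEnsemble` API, assembled from the lifecycle test added in keras_test.py below; the candidate estimators, toy dataset, and hyperparameters are illustrative only.

import adanet
import tensorflow as tf

# Hypothetical toy setup mirroring the regression lifecycle in keras_test.py.
feature_columns = [tf.feature_column.numeric_column("x", shape=[2])]
head = tf.estimator.RegressionHead()
optimizer = lambda: tf.keras.optimizers.SGD(lr=.01)

# Candidate subestimators to ensemble; a dict maps candidate names to estimators.
model = adanet.keras.AutoEnsemble(
    candidate_pool={
        "dnn": tf.estimator.DNNEstimator(
            head=head,
            feature_columns=feature_columns,
            optimizer=optimizer,
            hidden_units=[3]),
        "linear": tf.estimator.LinearEstimator(
            head=head,
            feature_columns=feature_columns,
            optimizer=optimizer),
    },
    max_iteration_steps=10)
model.compile(loss="mse")

# Train, evaluate, and predict with the standard Keras lifecycle.
train_data = tf.data.Dataset.from_tensors(([[1., 0.]], [[1.]])).repeat()
model.fit(train_data, epochs=1, steps_per_epoch=10)
eval_results = model.evaluate(train_data, steps=3)
predictions = model.predict(tf.data.Dataset.from_tensors(([[1., 0.]])))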
75 changes: 75 additions & 0 deletions adanet/autoensemble/keras_test.py
@@ -0,0 +1,75 @@
"""A Keras model that learns to ensemble.
Copyright 2019 The AdaNet Authors. All Rights Reserved.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
https://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

from absl.testing import parameterized
from adanet.autoensemble.keras import AutoEnsemble
import tensorflow as tf


class KerasTest(parameterized.TestCase, tf.test.TestCase):

# pylint: disable=g-long-lambda
@parameterized.named_parameters(
{
"testcase_name": "dict_candidate_pool",
"candidate_pool":
lambda head, feature_columns, optimizer: {
"dnn":
tf.estimator.DNNEstimator(
head=head,
feature_columns=feature_columns,
optimizer=optimizer,
hidden_units=[3]),
"linear":
tf.estimator.LinearEstimator(
head=head,
feature_columns=feature_columns,
optimizer=optimizer),
},
})
# pylint: enable=g-long-lambda

def test_auto_ensemble_lifecycle(self,
candidate_pool):

optimizer = lambda: tf.keras.optimizers.SGD(lr=.01)
feature_columns = [tf.feature_column.numeric_column("x", shape=[2])]

keras_model = AutoEnsemble(
candidate_pool=candidate_pool(tf.estimator.RegressionHead(),
feature_columns, optimizer),
max_iteration_steps=10)
keras_model.compile(loss="mse")
self.assertEqual(["loss"], keras_model.metrics_names)

train_data = tf.data.Dataset.from_tensors(([[1., 0.]], [[1.]])).repeat()
keras_model.fit(train_data, epochs=1, steps_per_epoch=1)

eval_results = keras_model.evaluate(train_data, steps=3)
# TODO: Rewrite this test to be deterministic.
self.assertIsNotNone(eval_results["loss"])

predict_data = tf.data.Dataset.from_tensors(([[1., 0.]]))
predictions = keras_model.predict(predict_data)
self.assertLen(predictions, 1)

if __name__ == "__main__":
tf.test.main()
1 change: 1 addition & 0 deletions adanet/keras/BUILD
@@ -13,6 +13,7 @@ py_library(
visibility = whitelist,
deps = [
":model",
"//adanet/autoensemble",
],
)

2 changes: 2 additions & 0 deletions adanet/keras/__init__.py
@@ -21,8 +21,10 @@
from __future__ import division
from __future__ import print_function

from adanet.autoensemble.keras import AutoEnsemble
from adanet.keras.model import Model

__all__ = [
"AutoEnsemble",
"Model",
]
8 changes: 8 additions & 0 deletions docs/source/adanet.keras.rst
@@ -13,6 +13,14 @@ Keras
**Experimental** Keras API for training, evaluating, predicting, and serving
AdaNet models.

:hidden:`AutoEnsemble`
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~

.. autoclass:: AutoEnsemble
:members:
:show-inheritance:
:inherited-members:

:hidden:`Model`
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~

7 changes: 7 additions & 0 deletions docs/source/adanet.rst
@@ -61,6 +61,13 @@ Keras
**Experimental** Keras API for training, evaluating, predicting, and serving
AdaNet models.

:hidden:`AutoEnsemble`
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~

.. autoclass:: AutoEnsemble
:members:
:show-inheritance:
:inherited-members:

:hidden:`Model`
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~