Add subpackage for RNN related code. (#189)

qlzh727 · seanpmorgan · commit 4e0aefe53754 · 2019-04-18T14:24:10.000-04:00
* Update .gitignore to include intellij project file (*.iml).

* Add package for customized RNN cell.

* Add package for customized RNN cell.

* Update the unit test for rnn cell.

* Fix more code and test.
1. The test case was missing test.main, which means the test wasn't executed at all.
2. Add initializer params for user to control how weights are initialized.
3. Update the tests with the fix.

* Fix code format.

* Fix more lint errors.

* Address the PR review comments.
1. Update the addon init/build/README
2. Add README for rnn.

* Fix annotation in doc.

* Update CODEOWNERS for rnn package.
diff --git a/.github/CODEOWNERS b/.github/CODEOWNERS
@@ -5,6 +5,7 @@
 
 
 # Subpackage Owners
+/tensorflow_addons/rnn/ @qlzh727
 /tensorflow_addons/seq2seq/ @qlzh727
 /tensorflow_addons/custom_ops/seq2seq/ @qlzh727
 
diff --git a/BUILD b/BUILD
@@ -11,6 +11,7 @@ sh_binary(
         "//tensorflow_addons/layers",
         "//tensorflow_addons/losses",
         "//tensorflow_addons/optimizers",
+        "//tensorflow_addons/rnn",
         "//tensorflow_addons/seq2seq",
         "//tensorflow_addons/text",
     ],
diff --git a/README.md b/README.md
@@ -34,7 +34,8 @@ developments that cannot be integrated into core TensorFlow
 | [tfa.layers](tensorflow_addons/layers/README.md) | SIG-Addons |     addons@tensorflow.org |
 | [tfa.losses](tensorflow_addons/losses/README.md) | SIG-Addons |     addons@tensorflow.org |
 | [tfa.optimizers](tensorflow_addons/optimizers/README.md) | SIG-Addons | addons@tensorflow.org |
-| [tfa.seq2seq](tensorflow_addons/seq2seq/README.md) | Google | @qlzh727 | 
+| [tfa.rnn](tensorflow_addons/rnn/README.md) | Google | @qlzh727 |
+| [tfa.seq2seq](tensorflow_addons/seq2seq/README.md) | Google | @qlzh727 |
 | [tfa.text](tensorflow_addons/text/README.md) |  |  |
 
 ## Core Concepts
diff --git a/tensorflow_addons/__init__.py b/tensorflow_addons/__init__.py
@@ -76,6 +76,7 @@ def _ensure_tf_install():
 from tensorflow_addons import layers
 from tensorflow_addons import losses
 from tensorflow_addons import optimizers
+from tensorflow_addons import rnn
 from tensorflow_addons import seq2seq
 from tensorflow_addons import text
 
diff --git a/tensorflow_addons/rnn/BUILD b/tensorflow_addons/rnn/BUILD
@@ -0,0 +1,24 @@
+licenses(["notice"])  # Apache 2.0
+
+package(default_visibility = ["//visibility:public"])
+
+# Library target for the rnn subpackage. It bundles the package initializer
+# and the cell implementations, and depends on the shared utils package
+# (cell.py imports keras_utils from it).
+py_library(
+    name = "rnn",
+    srcs = [
+        "__init__.py",
+        "cell.py",
+    ],
+    srcs_version = "PY2AND3",
+    deps = [
+        "//tensorflow_addons/utils",
+    ],
+)
+
+# Unit tests for the cells in cell.py; runs cell_test.py against the :rnn
+# library target declared in this BUILD file.
+py_test(
+    name = "cell_test",
+    size = "small",
+    srcs = ["cell_test.py"],
+    deps = [
+        ":rnn",
+    ],
+)
diff --git a/tensorflow_addons/rnn/README.md b/tensorflow_addons/rnn/README.md
@@ -0,0 +1,37 @@
+# Addons - RNN
+
+## Maintainers
+| Submodule  | Maintainers  | Contact Info  |
+|:---------- |:------------ |:------------- |
+| cell       | Google       | @qlzh727      |
+
+## Components
+| Submodule | Class   | Reference |
+|:----------|:------- |:--------- |
+| cell      | NASCell | https://arxiv.org/abs/1611.01578  |
+
+
+## Contribution Guidelines
+#### Prerequisites
+ * For any cell based on a research paper, the original paper has to be well recognized.
+   The criterion here is >= 100 citations on Google Scholar. If the contributor feels
+   this requirement needs to be overruled, please specify the detailed justification in
+   the PR.
+
+#### Standard API
+In order to conform with the current API standard, all cells must:
+ * Inherit from either `keras.layers.AbstractRNNCell` or `keras.layers.Layer` with
+   required properties.
+ * [Register as a Keras global object](https://github.com/tensorflow/addons/blob/master/tensorflow_addons/utils/python/keras_utils.py)
+  so it can be serialized properly.
+ * Add the addon to the `py_library` in this sub-package's BUILD file.
+
+#### Testing Requirements
+ * When applicable, run all tests with TensorFlow's
+   `@run_in_graph_and_eager_modes` (for test method)
+   or `@run_all_in_graph_and_eager_modes` (for TestCase subclass)
+   decorator.
+ * Add a `py_test` to this sub-package's BUILD file.
+
+#### Documentation Requirements
+ * Update the table of contents in this sub-package's README.
diff --git a/tensorflow_addons/rnn/__init__.py b/tensorflow_addons/rnn/__init__.py
@@ -0,0 +1,21 @@
+# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+"""Customized RNN cells."""
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+from tensorflow_addons.rnn.cell import NASCell
diff --git a/tensorflow_addons/rnn/cell.py b/tensorflow_addons/rnn/cell.py
@@ -0,0 +1,210 @@
+# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+"""Module for RNN Cells."""
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import tensorflow as tf
+import tensorflow.keras as keras
+from tensorflow_addons.utils import keras_utils
+
+
+@keras_utils.register_keras_custom_object
+class NASCell(keras.layers.AbstractRNNCell):
+    """Neural Architecture Search (NAS) recurrent network cell.
+
+    This implements the recurrent cell from the paper:
+
+      https://arxiv.org/abs/1611.01578
+
+    Barret Zoph and Quoc V. Le.
+    "Neural Architecture Search with Reinforcement Learning" Proc. ICLR 2017.
+
+    The class uses an optional projection layer.
+
+    The cell carries two state tensors, `[c, m]`. `c` always has width
+    `units`; `m` (which is also the cell output) has width `projection`
+    when a projection is configured and `units` otherwise.
+    """
+
+    # NAS cell's architecture base: the number of parallel branches that the
+    # input and the recurrent pre-activations are each split into.
+    _NAS_BASE = 8
+
+    def __init__(self,
+                 units,
+                 projection=None,
+                 use_bias=False,
+                 kernel_initializer="glorot_uniform",
+                 recurrent_initializer="glorot_uniform",
+                 projection_initializer="glorot_uniform",
+                 bias_initializer="zeros",
+                 **kwargs):
+        """Initialize the parameters for a NAS cell.
+
+        All initializer arguments accept any identifier understood by
+        `keras.initializers.get` (a string name, a serialized config dict or
+        an initializer instance).
+
+        Args:
+          units: int, The number of units in the NAS cell.
+          projection: (optional) int, The output dimensionality for the
+            projection matrices.  If None, no projection is performed.
+          use_bias: (optional) bool, If True then use biases within the cell.
+            This is False by default.
+          kernel_initializer: Initializer for kernel weight.
+          recurrent_initializer: Initializer for recurrent kernel weight.
+          projection_initializer: Initializer for projection weight, used when
+            projection is not None.
+          bias_initializer: Initializer for bias, used when use_bias is True.
+          **kwargs: Additional keyword arguments.
+        """
+        super(NASCell, self).__init__(**kwargs)
+        self.units = units
+        self.projection = projection
+        self.use_bias = use_bias
+        # Resolve every identifier to an initializer object up front so that
+        # get_config() can serialize them uniformly, whatever form the caller
+        # used (name, config dict or instance).
+        self.kernel_initializer = keras.initializers.get(kernel_initializer)
+        self.recurrent_initializer = keras.initializers.get(
+            recurrent_initializer)
+        self.projection_initializer = keras.initializers.get(
+            projection_initializer)
+        self.bias_initializer = keras.initializers.get(bias_initializer)
+
+        # State is [c, m]; m doubles as the output, so its width follows the
+        # projection size when one is configured.
+        if projection is not None:
+            self._state_size = [units, projection]
+            self._output_size = projection
+        else:
+            self._state_size = [units, units]
+            self._output_size = units
+
+    @property
+    def state_size(self):
+        """Sizes of the two state tensors, as `[c_size, m_size]`."""
+        return self._state_size
+
+    @property
+    def output_size(self):
+        """Width of the output: `projection` if set, `units` otherwise."""
+        return self._output_size
+
+    def build(self, inputs_shape):
+        """Create the cell's weights from the static input shape.
+
+        Args:
+          inputs_shape: Shape of the inputs. It is constrained to rank 2 and
+            its second dimension is used as the input size.
+
+        Raises:
+          ValueError: If the input size (second dimension of
+            `inputs_shape`) is not statically known.
+        """
+        input_size = tf.compat.dimension_value(
+            tf.TensorShape(inputs_shape).with_rank(2)[1])
+        if input_size is None:
+            raise ValueError(
+                "Could not infer input size from inputs.get_shape()[-1]")
+
+        # Variables for the NAS cell. `recurrent_kernel` is all matrices
+        # multiplying the hidden state and `kernel` is all matrices multiplying
+        # the inputs. Each packs the weights of all `_NAS_BASE` branches side
+        # by side along the last axis.
+        self.recurrent_kernel = self.add_weight(
+            name="recurrent_kernel",
+            shape=[self.output_size, self._NAS_BASE * self.units],
+            initializer=self.recurrent_initializer)
+        self.kernel = self.add_weight(
+            name="kernel",
+            shape=[input_size, self._NAS_BASE * self.units],
+            initializer=self.kernel_initializer)
+
+        if self.use_bias:
+            self.bias = self.add_weight(
+                name="bias",
+                shape=[self._NAS_BASE * self.units],
+                initializer=self.bias_initializer)
+        # Projection layer if specified
+        if self.projection is not None:
+            self.projection_weights = self.add_weight(
+                name="projection_weights",
+                shape=[self.units, self.projection],
+                initializer=self.projection_initializer)
+
+        self.built = True
+
+    def call(self, inputs, state):
+        """Run one step of NAS Cell.
+
+        Args:
+          inputs: input Tensor, `2-D`, `[batch x input_size]`.
+          state: This must be a list of two state Tensors `[c_prev, m_prev]`,
+            both `2-D`, with column sizes matching `state_size`.
+
+        Returns:
+          A tuple containing:
+          - A `2-D, [batch x output_dim]`, Tensor representing the output of
+            the NAS Cell after reading `inputs` when previous state was
+            `state`.
+            Here output_dim is:
+               projection if projection was set, units otherwise.
+          - A list `[new_c, new_m]` representing the new state of NAS Cell
+            after reading `inputs` when the previous state was `state`.
+            Same type and shape(s) as `state`.
+        """
+        sigmoid = tf.math.sigmoid
+        tanh = tf.math.tanh
+        relu = tf.nn.relu
+
+        c_prev, m_prev = state
+
+        m_matrix = tf.matmul(m_prev, self.recurrent_kernel)
+        inputs_matrix = tf.matmul(inputs, self.kernel)
+
+        # The bias is applied to the recurrent pre-activations only.
+        if self.use_bias:
+            m_matrix = tf.nn.bias_add(m_matrix, self.bias)
+
+        # The NAS cell branches into 8 different splits for both the hidden
+        # state and the input
+        m_matrix_splits = tf.split(
+            axis=1, num_or_size_splits=self._NAS_BASE, value=m_matrix)
+        inputs_matrix_splits = tf.split(
+            axis=1, num_or_size_splits=self._NAS_BASE, value=inputs_matrix)
+
+        # First layer. Branch 3 combines its two operands by multiplication;
+        # every other branch adds them.
+        layer1_0 = sigmoid(inputs_matrix_splits[0] + m_matrix_splits[0])
+        layer1_1 = relu(inputs_matrix_splits[1] + m_matrix_splits[1])
+        layer1_2 = sigmoid(inputs_matrix_splits[2] + m_matrix_splits[2])
+        layer1_3 = relu(inputs_matrix_splits[3] * m_matrix_splits[3])
+        layer1_4 = tanh(inputs_matrix_splits[4] + m_matrix_splits[4])
+        layer1_5 = sigmoid(inputs_matrix_splits[5] + m_matrix_splits[5])
+        layer1_6 = tanh(inputs_matrix_splits[6] + m_matrix_splits[6])
+        layer1_7 = sigmoid(inputs_matrix_splits[7] + m_matrix_splits[7])
+
+        # Second layer
+        l2_0 = tanh(layer1_0 * layer1_1)
+        l2_1 = tanh(layer1_2 + layer1_3)
+        l2_2 = tanh(layer1_4 * layer1_5)
+        l2_3 = sigmoid(layer1_6 + layer1_7)
+
+        # Inject the cell
+        l2_0 = tanh(l2_0 + c_prev)
+
+        # Third layer. Its first node is also the new cell state.
+        new_c = l2_0 * l2_1
+        l3_1 = tanh(l2_2 + l2_3)
+
+        # Final layer
+        new_m = tanh(new_c * l3_1)
+
+        # Projection layer if specified
+        if self.projection is not None:
+            new_m = tf.matmul(new_m, self.projection_weights)
+
+        return new_m, [new_c, new_m]
+
+    def get_config(self):
+        """Return the constructor arguments of this cell as a dict.
+
+        Initializers are emitted in their serialized form, so the result
+        contains no initializer objects and can be passed back to the
+        constructor (which resolves them via `keras.initializers.get`).
+        """
+        serialize = keras.initializers.serialize
+        config = {
+            "units": self.units,
+            "projection": self.projection,
+            "use_bias": self.use_bias,
+            "kernel_initializer": serialize(self.kernel_initializer),
+            "recurrent_initializer": serialize(self.recurrent_initializer),
+            "bias_initializer": serialize(self.bias_initializer),
+            "projection_initializer": serialize(self.projection_initializer),
+        }
+        base_config = super(NASCell, self).get_config()
+        return dict(list(base_config.items()) + list(config.items()))
diff --git a/tensorflow_addons/rnn/cell_test.py b/tensorflow_addons/rnn/cell_test.py