Raising errors for humans:

* optimize_loss expects 0d Tensor. * Estimator.get_eval_ops requires to have `targets` not None. * Adding asserts for shapes in rnn_cells. * Added error check in rnn.rnn. Change: 125425807

Raising errors for humans:
* optimize_loss expects 0d Tensor. * Estimator.get_eval_ops requires to have `targets` not None. * Adding asserts for shapes in rnn_cells. * Added error check in rnn.rnn. Change: 125425807
54d915b1 · Illia Polosukhin · TensorFlower Gardener · 7498d9b2 · 54d915b1 · 54d915b1
8 changed file
--- a/tensorflow/contrib/layers/python/layers/optimizers.py
+++ b/tensorflow/contrib/layers/python/layers/optimizers.py
@@ -92,8 +92,11 @@ def optimize_loss(loss,
    Training op.

  Raises:
-    ValueError: if optimizer is wrong type.
+    ValueError: if `optimizer` is wrong type or `loss` is not 0d Tensor.
  """
+  if not isinstance(loss, ops.Tensor) or loss.get_shape().ndims > 0:
+    raise ValueError("optimize_loss expects loss to be 0d Tensor, "
+                     "got %s" % loss)
  with vs.variable_op_scope([loss, global_step], name, "OptimizeLoss"):
    # Update ops take UPDATE_OPS collection if not provided.
    update_ops = (set(update_ops or []) or

--- a/tensorflow/contrib/layers/python/layers/optimizers_test.py
+++ b/tensorflow/contrib/layers/python/layers/optimizers_test.py
@@ -63,6 +63,21 @@ class OptimizersTest(tf.test.TestCase):
                                            learning_rate=0.1,
                                            optimizer=optimizer)

+  def testWrongLoss(self):
+    with tf.Graph().as_default() as g:
+      with self.test_session(graph=g):
+        _, _, _, global_step = _setup_model()
+        with self.assertRaises(ValueError):
+          tf.contrib.layers.optimize_loss(None,
+                                          global_step,
+                                          learning_rate=0.1,
+                                          optimizer="SGD")
+        with self.assertRaises(ValueError):
+          tf.contrib.layers.optimize_loss([[1.0]],
+                                          global_step,
+                                          learning_rate=0.1,
+                                          optimizer="SGD")
+
  def testGradientNoise(self):
    tf.set_random_seed(42)
    with self.test_session() as session:

--- a/tensorflow/contrib/learn/python/learn/estimators/estimator.py
+++ b/tensorflow/contrib/learn/python/learn/estimators/estimator.py
@@ -729,6 +729,9 @@ class Estimator(BaseEstimator):
    Raises:
      ValueError: if `metrics` don't match `targets`.
    """
+    if targets is None:
+      raise ValueError('Metrics %s in Estimator.evaluate requires targets '
+                       'not be None.' % metrics)
    predictions, loss, _ = self._call_model_fn(features, targets, ModeKeys.EVAL)
    result = {'loss': loss}
    metrics = metrics or {}

--- a/tensorflow/contrib/learn/python/learn/estimators/estimator_test.py
+++ b/tensorflow/contrib/learn/python/learn/estimators/estimator_test.py
@@ -213,6 +213,13 @@ class EstimatorTest(tf.test.TestCase):
    est.fit(input_fn=boston_input_fn, steps=1)
    _ = est.evaluate(input_fn=boston_eval_fn, steps=1)

+  def testEvalNoTarget(self):
+    boston = tf.contrib.learn.datasets.load_boston()
+    est = tf.contrib.learn.Estimator(model_fn=linear_model_fn)
+    est.fit(input_fn=boston_input_fn, steps=1)
+    with self.assertRaises(ValueError):
+      _ = est.evaluate(x=boston.data, steps=1)
+
  def testPredict(self):
    est = tf.contrib.learn.Estimator(model_fn=linear_model_fn)
    boston = tf.contrib.learn.datasets.load_boston()

--- a/tensorflow/python/kernel_tests/rnn_cell_test.py
+++ b/tensorflow/python/kernel_tests/rnn_cell_test.py
@@ -83,6 +83,18 @@ class RNNCellTest(tf.test.TestCase):
        # Smoke test
        self.assertAllClose(res[0], [[0.156736, 0.156736]])

+  def testGRUCellMismatch(self):
+    with self.test_session():
+      with tf.variable_scope("root", initializer=tf.constant_initializer(0.5)):
+        x = tf.zeros([1, 2])
+        x_incorrect = tf.zeros([1, 2, 3])
+        m = tf.zeros([1, 2])
+        m_incorrect = tf.zeros([1, 2, 3])
+        with self.assertRaises(ValueError):
+          tf.nn.rnn_cell.GRUCell(2)(x_incorrect, m)
+        with self.assertRaises(ValueError):
+          tf.nn.rnn_cell.GRUCell(2)(x, m_incorrect)
+
  def testBasicLSTMCell(self):
    with self.test_session() as sess:
      with tf.variable_scope("root", initializer=tf.constant_initializer(0.5)):

--- a/tensorflow/python/kernel_tests/rnn_test.py
+++ b/tensorflow/python/kernel_tests/rnn_test.py
@@ -1025,6 +1025,20 @@ class LSTMTest(tf.test.TestCase):
    self._testDynamicEquivalentToStaticRNN(
        use_gpu=True, use_sequence_length=True)

+  def testRNNWrongInputs(self):
+    cell = tf.nn.rnn_cell.GRUCell(2)
+    inputs = tf.constant([[1., 2.], [1., 2.]])
+    inputs_wrong = tf.constant([[[1., 2.], [1., 2.]], [[1., 2.], [1., 2.]]])
+    state_wrong = tf.constant([[1., 2.], [1., 2.]])
+    with self.assertRaises(TypeError):
+      tf.nn.rnn(None, inputs)
+    with self.assertRaises(TypeError):
+      tf.nn.rnn(cell, None)
+    with self.assertRaises(TypeError):
+      tf.nn.rnn(cell, inputs_wrong)
+    with self.assertRaises(TypeError):
+      tf.nn.rnn(cell, inputs, state_wrong)
+

 class BidirectionalRNNTest(tf.test.TestCase):


--- a/tensorflow/python/ops/rnn.py
+++ b/tensorflow/python/ops/rnn.py
@@ -91,11 +91,19 @@ def rnn(cell, inputs, initial_state=None, dtype=None,
  """

  if not isinstance(cell, rnn_cell.RNNCell):
-    raise TypeError("cell must be an instance of RNNCell")
+    raise TypeError("Rnn expects cell to be an instance of RNNCell, "
+                    "got %s" % cell)
  if not isinstance(inputs, list):
-    raise TypeError("inputs must be a list")
+    raise TypeError("Rnn expects inputs to be a list, got %s" % inputs)
  if not inputs:
-    raise ValueError("inputs must not be empty")
+    raise ValueError("Rnn expects inputs not to be empty, got %s" % inputs)
+  first_el_shape = inputs[0].get_shape()
+  for i, inp in enumerate(inputs):
+    if not inp.get_shape().is_compatible_with(first_el_shape):
+      raise ValueError("Rnn expectes inputs to be list of compatible Tensors. "
+                       "Received %s, where inputs[%d].shape == %s doesn't "
+                       "match inputs[0].shape == %s" % (
+                           inputs, i, inp.get_shape(), first_el_shape))

  outputs = []
  # Create a new scope in which the caching device is either
@@ -127,7 +135,7 @@ def rnn(cell, inputs, initial_state=None, dtype=None,
    else:
      if not dtype:
        raise ValueError("If no initial_state is provided, "
-                           "dtype must be specified")
+                         "dtype must be specified")
      state = cell.zero_state(batch_size, dtype)

    if sequence_length is not None:  # Prepare variables

--- a/tensorflow/python/ops/rnn_cell.py
+++ b/tensorflow/python/ops/rnn_cell.py
@@ -171,6 +171,30 @@ class RNNCell(object):
    return zeros


+def _assert_rnn_cell_input_shapes(inputs, state, state_is_tuple):
+  inputs = ops.convert_to_tensor(inputs)
+  if inputs.get_shape().ndims is not None and inputs.get_shape().ndims != 2:
+    raise ValueError("RNN cells expects inputs to be 2D Tensor, "
+                     "got inputs with %s shape." % inputs.get_shape())
+  # If state is None, don't check.
+  if state is None:
+    return
+  if state_is_tuple:
+    c, h = state
+    c = ops.convert_to_tensor(c)
+    h = ops.convert_to_tensor(h)
+    if ((c.get_shape().ndims is not None and c.get_shape().ndims != 2) or
+        (h.get_shape().ndims is not None and h.get_shape().ndims != 2)):
+      raise ValueError("RNN cells expects state to be tuple of 2D Tensors, "
+                       "got state tuple with shape: (%s, %s)." % (
+                           c.get_shape(), h.get_shape()))
+  else:
+    state = ops.convert_to_tensor(state)
+    if state.get_shape().ndims is not None and state.get_shape().ndims != 2:
+      raise ValueError("RNN cells expect state to be 2D Tensor, "
+                       "got state with sahpe: %s." % state.get_shape())
+
+
 class BasicRNNCell(RNNCell):
  """The most basic RNN cell."""

@@ -189,7 +213,19 @@ class BasicRNNCell(RNNCell):
    return self._num_units

  def __call__(self, inputs, state, scope=None):
-    """Most basic RNN: output = new_state = activation(W * input + U * state + B)."""
+    """Most basic RNN.
+
+    output = new_state = activation(W * input + U * state + B).
+
+    Args:
+      inputs: 2D `Tensor`.
+      state: `tuple` of `Tensor`s or 2D `Tensor`.
+      scope: name of `VariableScope` object.
+
+    Returns:
+      `tuple` of output and state `Tensor`, where they are equal for this cell.
+    """
+    _assert_rnn_cell_input_shapes(inputs, state, False)
    with vs.variable_scope(scope or type(self).__name__):  # "BasicRNNCell"
      output = self._activation(_linear([inputs, state], self._num_units, True))
    return output, output
@@ -214,6 +250,7 @@ class GRUCell(RNNCell):

  def __call__(self, inputs, state, scope=None):
    """Gated recurrent unit (GRU) with nunits cells."""
+    _assert_rnn_cell_input_shapes(inputs, state, False)
    with vs.variable_scope(scope or type(self).__name__):  # "GRUCell"
      with vs.variable_scope("Gates"):  # Reset gate and update gate.
        # We start with bias of 1.0 to not reset and not update.
@@ -289,6 +326,7 @@ class BasicLSTMCell(RNNCell):

  def __call__(self, inputs, state, scope=None):
    """Long short-term memory cell (LSTM)."""
+    _assert_rnn_cell_input_shapes(inputs, state, self._state_is_tuple)
    with vs.variable_scope(scope or type(self).__name__):  # "BasicLSTMCell"
      # Parameters of gates are concatenated into one multiply for efficiency.
      if self._state_is_tuple:
@@ -460,6 +498,8 @@ class LSTMCell(RNNCell):
      ValueError: If input size cannot be inferred from inputs via
        static shape inference.
    """
+    _assert_rnn_cell_input_shapes(inputs, state, self._state_is_tuple)
+
    num_proj = self._num_units if self._num_proj is None else self._num_proj

    if self._state_is_tuple:
@@ -564,6 +604,7 @@ class OutputProjectionWrapper(RNNCell):
    """Run the cell and output projection on inputs, starting from state."""
    output, res_state = self._cell(inputs, state)
    # Default scope: "OutputProjectionWrapper"
+    _assert_rnn_cell_input_shapes(inputs, None, None)
    with vs.variable_scope(scope or type(self).__name__):
      projected = _linear(output, self._output_size, True)
    return projected, res_state
@@ -606,6 +647,7 @@ class InputProjectionWrapper(RNNCell):
  def __call__(self, inputs, state, scope=None):
    """Run the input projection and then the cell."""
    # Default scope: "InputProjectionWrapper"
+    _assert_rnn_cell_input_shapes(inputs, None, None)
    with vs.variable_scope(scope or type(self).__name__):
      projected = _linear(inputs, self._num_proj, True)
    return self._cell(projected, state)
@@ -657,6 +699,7 @@ class DropoutWrapper(RNNCell):

  def __call__(self, inputs, state, scope=None):
    """Run the cell with the declared dropouts."""
+    _assert_rnn_cell_input_shapes(inputs, None, None)
    if (not isinstance(self._input_keep_prob, float) or
        self._input_keep_prob < 1):
      inputs = nn_ops.dropout(inputs, self._input_keep_prob, seed=self._seed)
@@ -767,6 +810,7 @@ class MultiRNNCell(RNNCell):

  def __call__(self, inputs, state, scope=None):
    """Run this multi-layer cell on inputs, starting from state."""
+    _assert_rnn_cell_input_shapes(inputs, state, self._state_is_tuple)
    with vs.variable_scope(scope or type(self).__name__):  # "MultiRNNCell"
      cur_state_pos = 0
      cur_inp = inputs