Create op ReverseV2 that takes indices for reversing rather than a bool array

aselle · tensorflower-gardener · commit 7aa95633c19c · 2016-10-19T21:04:26.000-07:00
This does not implement the Python API change yet for forward compatibility.
e.g. eventually tf.reverse(a, [0,1,-1]) will be the same as the old API of
tf.reverse(a, [True, True, False, False, False, True]) for a 6 dimensional
tensor a.
Change: 136675570
diff --git a/tensorflow/core/kernels/reverse_op.cc b/tensorflow/core/kernels/reverse_op.cc
@@ -24,6 +24,7 @@ limitations under the License.
 #include "tensorflow/core/framework/tensor.h"
 #include "tensorflow/core/framework/tensor_shape.h"
 #include "tensorflow/core/framework/types.h"
+#include "tensorflow/core/kernels/bounds_check.h"
 #include "tensorflow/core/lib/core/status.h"
 #include "tensorflow/core/platform/logging.h"
 
@@ -32,6 +33,19 @@ namespace tensorflow {
 typedef Eigen::ThreadPoolDevice CPUDevice;
 typedef Eigen::GpuDevice GPUDevice;
 
+// Copies the per-dimension flags in `dims` (entries 0 .. NDIMS - 1) into a
+// fixed-size Eigen array and runs functor::Reverse on input 0 of `context`,
+// writing the reversed data into `result`.
+template <typename Device, typename T, int NDIMS>
+void HandleReverseCase(OpKernelContext* context,
+                       typename TTypes<bool, 1>::ConstTensor dims,
+                       Tensor* result) {
+  Eigen::array<bool, NDIMS> reverse_flags;
+  for (int d = 0; d != NDIMS; ++d) {
+    reverse_flags[d] = dims(d);
+  }
+  const Device& device = context->eigen_device<Device>();
+  auto source = context->input(0).tensor<T, NDIMS>();
+  auto target = result->tensor<T, NDIMS>();
+  functor::Reverse<Device, T, NDIMS> reverse;
+  reverse(device, source, reverse_flags, target);
+}
+
 template <typename Device, typename T>
 class ReverseOp : public OpKernel {
  public:
@@ -67,11 +81,9 @@ class ReverseOp : public OpKernel {
       OP_REQUIRES_OK(context,
                      context->allocate_output(0, input.shape(), &output));
 
-#define HANDLE_REVERSE(NDIMS)                                      \
-  case NDIMS:                                                      \
-    functor::Reverse<Device, T, NDIMS>()(                          \
-        context->eigen_device<Device>(), input.tensor<T, NDIMS>(), \
-        dims.vec<bool>(), output->tensor<T, NDIMS>());             \
+#define HANDLE_REVERSE(NDIMS)                                               \
+  case NDIMS:                                                               \
+    HandleReverseCase<Device, T, NDIMS>(context, dims.vec<bool>(), output); \
     return;
 
       switch (input_dims) {
@@ -90,15 +102,97 @@ class ReverseOp : public OpKernel {
   }
 };
 
-#define REGISTER_KERNEL(T)                            \
-  REGISTER_KERNEL_BUILDER(Name("Reverse")             \
-                              .Device(DEVICE_CPU)     \
-                              .TypeConstraint<T>("T") \
-                              .HostMemory("dims"),    \
-                          ReverseOp<CPUDevice, T>)
+// Dense-flag variant used by ReverseV2Op: `axes[i]` tells whether dimension i
+// of input 0 is reversed. The flags are copied into an Eigen array of static
+// size NDIMS before functor::Reverse is invoked to fill `result`.
+template <typename Device, typename T, int NDIMS>
+void HandleReverseV2Case(OpKernelContext* context,
+                         const gtl::ArraySlice<bool>& axes, Tensor* result) {
+  Eigen::array<bool, NDIMS> flip;
+  int dim = 0;
+  while (dim < NDIMS) {
+    flip[dim] = axes[dim];
+    ++dim;
+  }
+  functor::Reverse<Device, T, NDIMS> reverse;
+  reverse(context->eigen_device<Device>(),
+          context->input(0).tensor<T, NDIMS>(), flip,
+          result->tensor<T, NDIMS>());
+}
+
+// Kernel for ReverseV2: reverses input 0 along the dimensions listed in
+// input 1 (`axis`). Entries of `axis` may be negative, in which case they are
+// counted from the last dimension. The index list is expanded into one flag
+// per input dimension and handed to HandleReverseV2Case.
+//
+// Fails with InvalidArgument if `axis` is not a vector, if an entry is out of
+// range, or if a dimension is listed more than once; fails with Unimplemented
+// for inputs of rank > 8.
+template <typename Device, typename T>
+class ReverseV2Op : public OpKernel {
+ public:
+  explicit ReverseV2Op(OpKernelConstruction* context) : OpKernel(context) {}
+
+  void Compute(OpKernelContext* context) override {
+    const Tensor& input = context->input(0);
+    const Tensor& sparse_dims = context->input(1);
+
+    if (TensorShapeUtils::IsScalar(input.shape())) {
+      // A scalar has no dimension to reverse: copy it through. `axis` is not
+      // validated on this path.
+      Tensor* output = nullptr;
+      OP_REQUIRES_OK(context,
+                     context->allocate_output(0, input.shape(), &output));
+      output->scalar<T>() = input.scalar<T>();
+    } else {
+      const int input_dims = input.dims();
+      const TensorShape& sparse_dims_shape = sparse_dims.shape();
+      const auto& axes_sparse_flat = sparse_dims.flat<int32>();
+
+      OP_REQUIRES(context, TensorShapeUtils::IsVector(sparse_dims_shape),
+                  errors::InvalidArgument("'axis' must be 1-dimension, not ",
+                                          sparse_dims.dims()));
+      // Expand the list of axis indices into one flag per input dimension.
+      gtl::InlinedVector<bool, 8> axes_dense(input_dims, false);
+      for (int i = 0; i < axes_sparse_flat.size(); i++) {
+        int32 axis = internal::SubtleMustCopy<int32>(axes_sparse_flat(i));
+        // Negative indices count from the last dimension, so the accepted
+        // range for `axis` is [-input_dims, input_dims - 1].
+        int32 canonical_axis = axis < 0 ? input_dims + axis : axis;
+        OP_REQUIRES(context, canonical_axis >= 0 && canonical_axis < input_dims,
+                    errors::InvalidArgument("'axis'[", i, "] = ", axis,
+                                            " is out of valid range [",
+                                            -input_dims, ", ", input_dims - 1,
+                                            "]"));
+        OP_REQUIRES(context, !axes_dense[canonical_axis],
+                    errors::InvalidArgument("axis ", canonical_axis,
+                                            " specified more than once."));
+        axes_dense[canonical_axis] = true;
+      }
 
-TF_CALL_POD_TYPES(REGISTER_KERNEL);
-#undef REGISTER_KERNEL
+      OP_REQUIRES(context, input_dims <= 8,
+                  errors::Unimplemented(
+                      "reverse is not implemented for tensors of rank > 8."));
+
+      Tensor* output = nullptr;
+      OP_REQUIRES_OK(context,
+                     context->allocate_output(0, input.shape(), &output));
+
+#define HANDLE_REVERSE(NDIMS)                                           \
+  case NDIMS:                                                           \
+    HandleReverseV2Case<Device, T, NDIMS>(context, axes_dense, output); \
+    return;
+
+      // Rank 0 never reaches this switch (scalars are handled above); the
+      // rank check above guarantees one of the cases matches.
+      switch (input_dims) {
+        HANDLE_REVERSE(0);
+        HANDLE_REVERSE(1);
+        HANDLE_REVERSE(2);
+        HANDLE_REVERSE(3);
+        HANDLE_REVERSE(4);
+        HANDLE_REVERSE(5);
+        HANDLE_REVERSE(6);
+        HANDLE_REVERSE(7);
+        HANDLE_REVERSE(8);
+      }
+#undef HANDLE_REVERSE
+    }
+  }
+};
+
+#define REGISTER_KERNELS(T)                                  \
+  REGISTER_KERNEL_BUILDER(Name("Reverse")                    \
+                              .Device(DEVICE_CPU)            \
+                              .TypeConstraint<T>("T")        \
+                              .HostMemory("dims"),           \
+                          ReverseOp<CPUDevice, T>)           \
+  REGISTER_KERNEL_BUILDER(Name("ReverseV2")                  \
+                              .Device(DEVICE_CPU)            \
+                              .TypeConstraint<T>("T")        \
+                              .TypeConstraint<int32>("Tidx") \
+                              .HostMemory("axis"),           \
+                          ReverseV2Op<CPUDevice, T>)
+TF_CALL_POD_TYPES(REGISTER_KERNELS);  // CPU kernels: Reverse and ReverseV2 (int32 axis only)
+#undef REGISTER_KERNELS
 
 #if GOOGLE_CUDA
 
@@ -109,7 +203,7 @@ namespace functor {
   template <>                                                         \
   void Reverse<GPUDevice, T, DIM>::operator()(                        \
       const GPUDevice& d, typename TTypes<T, DIM>::ConstTensor input, \
-      typename TTypes<bool, 1>::ConstTensor dims,                     \
+      const Eigen::array<bool, DIM>& reverse_dims,                    \
       typename TTypes<T, DIM>::Tensor output);                        \
   extern template struct Reverse<GPUDevice, T, DIM>;
 #define DECLARE_GPU_SPEC(T)  \
@@ -136,21 +230,27 @@ TF_CALL_complex128(DECLARE_GPU_SPEC);
 }  // namespace functor
 
 // Registration of the GPU implementations.
-#define REGISTER_GPU_KERNEL(T)                        \
-  REGISTER_KERNEL_BUILDER(Name("Reverse")             \
-                              .Device(DEVICE_GPU)     \
-                              .TypeConstraint<T>("T") \
-                              .HostMemory("dims"),    \
-                          ReverseOp<GPUDevice, T>)
-TF_CALL_uint8(REGISTER_GPU_KERNEL);
-TF_CALL_int8(REGISTER_GPU_KERNEL);
+// Registers ReverseOp and ReverseV2Op (int32 `axis` only) on GPU for type T.
+// `dims` / `axis` are pinned to host memory because the kernels read them in
+// host code before launching the device computation.
+#define REGISTER_GPU_KERNELS(T)                              \
+  REGISTER_KERNEL_BUILDER(Name("Reverse")                    \
+                              .Device(DEVICE_GPU)            \
+                              .TypeConstraint<T>("T")        \
+                              .HostMemory("dims"),           \
+                          ReverseOp<GPUDevice, T>)           \
+  REGISTER_KERNEL_BUILDER(Name("ReverseV2")                  \
+                              .Device(DEVICE_GPU)            \
+                              .TypeConstraint<T>("T")        \
+                              .TypeConstraint<int32>("Tidx") \
+                              .HostMemory("axis"),           \
+                          ReverseV2Op<GPUDevice, T>)
+TF_CALL_uint8(REGISTER_GPU_KERNELS);
+TF_CALL_int8(REGISTER_GPU_KERNELS);
 // TODO decide whether we want to enable the bool kernel.
-// TF_CALL_bool(REGISTER_GPU_KERNEL);
-TF_CALL_half(REGISTER_GPU_KERNEL);
-TF_CALL_float(REGISTER_GPU_KERNEL);
-TF_CALL_double(REGISTER_GPU_KERNEL);
-TF_CALL_complex64(REGISTER_GPU_KERNEL);
-TF_CALL_complex128(REGISTER_GPU_KERNEL);
+// TF_CALL_bool(REGISTER_GPU_KERNELS);
+TF_CALL_half(REGISTER_GPU_KERNELS);
+TF_CALL_float(REGISTER_GPU_KERNELS);
+TF_CALL_double(REGISTER_GPU_KERNELS);
+TF_CALL_complex64(REGISTER_GPU_KERNELS);
+TF_CALL_complex128(REGISTER_GPU_KERNELS);
-#undef REGISTER_GPU_KERNEL
+#undef REGISTER_GPU_KERNELS
 
 // A special GPU kernel for int32.
@@ -163,7 +263,14 @@ REGISTER_KERNEL_BUILDER(Name("Reverse")
                             .HostMemory("dims")
                             .HostMemory("output"),
                         ReverseOp<CPUDevice, int32>);
-
+REGISTER_KERNEL_BUILDER(Name("ReverseV2")  // int32 data on a GPU device
+                            .Device(DEVICE_GPU)
+                            .TypeConstraint<int32>("T")
+                            .TypeConstraint<int32>("Tidx")
+                            .HostMemory("tensor")  // both inputs and the output live in host memory,
+                            .HostMemory("axis")
+                            .HostMemory("output"),
+                        ReverseV2Op<CPUDevice, int32>);  // so the CPU implementation is registered here
 #endif  // GOOGLE_CUDA
 
 }  // namespace tensorflow
diff --git a/tensorflow/core/kernels/reverse_op.h b/tensorflow/core/kernels/reverse_op.h
@@ -22,25 +22,20 @@ limitations under the License.
 namespace tensorflow {
 namespace functor {
 
-// Functor used by MirrorOp to do the computations.
+// Functor used by ReverseOp and ReverseV2Op to do the computations.
 template <typename Device, typename T, int Dims>
 struct Reverse {
   void operator()(const Device& d, typename TTypes<T, Dims>::ConstTensor input,
-                  typename TTypes<bool, 1>::ConstTensor dims,
+                  const Eigen::array<bool, Dims>& reverse_dims,  // true => reverse that dimension
                   typename TTypes<T, Dims>::Tensor output) {
-    // mirror is in host memory
-    Eigen::array<bool, Dims> reverse_dims;
-    for (int i = 0; i < Dims; ++i) {
-      reverse_dims[i] = dims(i);
-    }
     output.device(d) = input.reverse(reverse_dims);
   }
 };
 
 template <typename Device, typename T>
 struct Reverse<Device, T, 0> {
   void operator()(const Device& d, typename TTypes<T, 0>::ConstTensor input,
-                  typename TTypes<bool, 1>::ConstTensor,
+                  const Eigen::array<bool, 0>& reverse_dims,
                   typename TTypes<T, 0>::Tensor output) {
     // Reversing a scalar is copying it.
     output.device(d) = input;
diff --git a/tensorflow/core/ops/array_ops.cc b/tensorflow/core/ops/array_ops.cc
@@ -791,6 +791,79 @@ dims: 1-D. The dimensions to reverse.
 output: The same shape as `tensor`.
 )Doc");
 
+// --------------------------------------------------------------------------
+REGISTER_OP("ReverseV2")
+    .Input("tensor: T")
+    .Input("axis: Tidx")
+    .Output("output: T")
+    .Attr("Tidx: {int32, int64} = DT_INT32")
+    .Attr(
+        "T: {uint8, int8, int32, int64, bool, half, float, double, complex64, "
+        "complex128}")
+    .SetShapeFn([](InferenceContext* c) {
+      // The output has exactly the shape of `tensor`; `axis` only has to be
+      // a vector. Inputs of known rank greater than 8 are rejected.
+      ShapeHandle input = c->input(0);
+      ShapeHandle axis;
+      TF_RETURN_IF_ERROR(c->WithRank(c->input(1), 1, &axis));
+      // TODO(aselle): if input(0)'s dimension is known we could validate axis
+      if (c->Rank(input) > 8) {
+        return errors::InvalidArgument(
+            "reverse does not work on tensors with more than 8 dimensions");
+      }
+      c->set_output(0, input);
+      return Status::OK();
+    })
+    .Doc(R"Doc(
+Reverses specific dimensions of a tensor.
+
+Given a `tensor` and an `int32` tensor `axis` representing the set of
+dimensions of `tensor` to reverse, this operation reverses each dimension
+`i` for which there exists `j` s.t. `axis[j] == i`. A negative entry counts
+from the last dimension, i.e. `-1` refers to the innermost dimension.
+
+`tensor` can have up to 8 dimensions. `axis` may contain 0 or more entries.
+If an index is specified more than once, an InvalidArgument error is raised.
+
+For example:
+
+```prettyprint
+# tensor 't' is [[[[ 0,  1,  2,  3],
+#                  [ 4,  5,  6,  7],
+#                  [ 8,  9, 10, 11]],
+#                 [[12, 13, 14, 15],
+#                  [16, 17, 18, 19],
+#                  [20, 21, 22, 23]]]]
+# tensor 't' shape is [1, 2, 3, 4]
+
+# 'axis' is '[3]' (or 'axis' is '[-1]')
+reverse(t, axis) ==> [[[[ 3,  2,  1,  0],
+                        [ 7,  6,  5,  4],
+                        [11, 10,  9,  8]],
+                       [[15, 14, 13, 12],
+                        [19, 18, 17, 16],
+                        [23, 22, 21, 20]]]]
+
+# 'axis' is '[1]' (or 'axis' is '[-3]')
+reverse(t, axis) ==> [[[[12, 13, 14, 15],
+                        [16, 17, 18, 19],
+                        [20, 21, 22, 23]],
+                       [[ 0,  1,  2,  3],
+                        [ 4,  5,  6,  7],
+                        [ 8,  9, 10, 11]]]]
+
+# 'axis' is '[2]' (or 'axis' is '[-2]')
+reverse(t, axis) ==> [[[[ 8,  9, 10, 11],
+                        [ 4,  5,  6,  7],
+                        [ 0,  1,  2,  3]],
+                       [[20, 21, 22, 23],
+                        [16, 17, 18, 19],
+                        [12, 13, 14, 15]]]]
+```
+
+tensor: Up to 8-D.
+axis: 1-D. The indices of the dimensions to reverse.
+output: The same shape as `tensor`.
+)Doc");
+
 // --------------------------------------------------------------------------
 REGISTER_OP("EditDistance")
     .Input("hypothesis_indices: int64")
diff --git a/tensorflow/core/ops/array_ops_test.cc b/tensorflow/core/ops/array_ops_test.cc
@@ -203,6 +203,18 @@ TEST(ArrayOpsTest, Reverse_ShapeFn) {
   INFER_OK(op, "[1,2,3,?,5,6,7,8];[8]", "in0");
 }
 
+TEST(ArrayOpsTest, ReverseV2_ShapeFn) {
+  ShapeInferenceTestOp op("ReverseV2");
+  INFER_OK(op, "?;?", "in0");  // unknown shapes: output is input 0 unchanged
+  INFER_ERROR("Shape must be rank 1 but is rank 0", op, "?;[]");  // axis must be a vector
+  INFER_ERROR("Shape must be rank 1 but is rank 2", op, "?;[?,2]");
+  INFER_OK(op, "[1,2,3];[2]", "in0");
+  INFER_ERROR("reverse does not work on tensors with more than 8 dimensions",
+              op, "[1,2,3,4,5,6,7,8,9];[9]");  // rank 9 input is rejected
+  INFER_OK(op, "[1,2,3,?];[4]", "in0");  // an unknown dimension is passed through
+  INFER_OK(op, "[1,2,3,?,5,6,7,8];[8]", "in0");  // rank 8 is accepted
+}
+
 TEST(ArrayOpsTest, Fill_ShapeFn) {
   ShapeInferenceTestOp op("Fill");
   op.input_tensors.resize(2);
diff --git a/tensorflow/python/kernel_tests/array_ops_test.py b/tensorflow/python/kernel_tests/array_ops_test.py
diff --git a/tensorflow/python/ops/array_ops.py b/tensorflow/python/ops/array_ops.py