pythonAI
diff --git a/tensorflow/core/kernels/segment_reduction_ops.cc b/tensorflow/core/kernels/segment_reduction_ops.cc
Lines changed: 68 additions & 11 deletions
diff --git a/tensorflow/core/ops/math_grad.cc b/tensorflow/core/ops/math_grad.cc
Lines changed: 1 addition & 0 deletions
diff --git a/tensorflow/core/ops/math_ops.cc b/tensorflow/core/ops/math_ops.cc
Lines changed: 43 additions & 0 deletions
diff --git a/tensorflow/core/ops/ops.pbtxt b/tensorflow/core/ops/ops.pbtxt
Lines changed: 73 additions & 0 deletions
@@ -250,8 +250,8 @@ template <typename Device, class T>
 class SparseSegmentReductionOpBase : public OpKernel {
  public:
   explicit SparseSegmentReductionOpBase(OpKernelConstruction* context,
-                                        bool is_mean)
-      : OpKernel(context), is_mean_(is_mean) {}
+                                        bool is_mean, bool is_sqrtn)
+      : OpKernel(context), is_mean_(is_mean), is_sqrtn_(is_sqrtn) {}
 
   void Compute(OpKernelContext* context) override {
     const Tensor& input = context->input(0);
@@ -309,7 +309,13 @@ class SparseSegmentReductionOpBase : public OpKernel {
         out = I(0);
       } else {
         int r = num % 8;
-        T m = (is_mean_ && (num < 10)) ? num : 1;
+        T m = 1;
+        if (is_mean_ && (num < 10)) {
+          m = num;
+        }
+        if (is_sqrtn_ && (num < 10)) {
+          m = sqrt(num);
+        }
         switch (r) {
           case 2:
             out = (I(0) + I(1)) / m;
@@ -348,30 +354,45 @@ class SparseSegmentReductionOpBase : public OpKernel {
         if (is_mean_ && num >= 10) {
           out = out / static_cast<T>(num);
         }
+        if (is_sqrtn_ && num >= 10) {
+          out = out / static_cast<T>(sqrt(num));
+        }
       }
       start = end;
       ++end;
     }
   }
 
  private:
-  bool is_mean_;
+  const bool is_mean_;
+  const bool is_sqrtn_;
 };
 
 template <typename Device, class T>
 class SparseSegmentReductionMeanOp
     : public SparseSegmentReductionOpBase<Device, T> {
  public:
   explicit SparseSegmentReductionMeanOp(OpKernelConstruction* context)
-      : SparseSegmentReductionOpBase<Device, T>(context, true /*is_mean*/) {}
+      : SparseSegmentReductionOpBase<Device, T>(context, true /*is_mean*/,
+                                                false /*is_sqrtn*/) {}
+};
+
+template <typename Device, class T>
+class SparseSegmentReductionSqrtNOp
+    : public SparseSegmentReductionOpBase<Device, T> {
+ public:
+  explicit SparseSegmentReductionSqrtNOp(OpKernelConstruction* context)
+      : SparseSegmentReductionOpBase<Device, T>(context, false /*is_mean*/,
+                                                true /*is_sqrtn*/) {}
 };
 
 template <typename Device, class T>
 class SparseSegmentReductionSumOp
     : public SparseSegmentReductionOpBase<Device, T> {
  public:
   explicit SparseSegmentReductionSumOp(OpKernelConstruction* context)
-      : SparseSegmentReductionOpBase<Device, T>(context, false /*is_mean*/) {}
+      : SparseSegmentReductionOpBase<Device, T>(context, false /*is_mean*/,
+                                                false /*is_sqrtn*/) {}
 };
 
 #define REGISTER_CPU_SPARSE_KERNELS(type)                                    \
@@ -390,11 +411,19 @@ REGISTER_CPU_SPARSE_KERNELS(float);
 REGISTER_CPU_SPARSE_KERNELS(double);
 #undef REGISTER_CPU_SPARSE_KERNELS
 
+#define REGISTER_CPU_SPARSE_KERNELS(type)                                      \
+  REGISTER_KERNEL_BUILDER(                                                     \
+      Name("SparseSegmentSqrtN").Device(DEVICE_CPU).TypeConstraint<type>("T"), \
+      SparseSegmentReductionSqrtNOp<CPUDevice, type>);
+REGISTER_CPU_SPARSE_KERNELS(float);
+REGISTER_CPU_SPARSE_KERNELS(double);
+#undef REGISTER_CPU_SPARSE_KERNELS
+
 template <class T>
-class SparseSegmentMeanGradOp : public OpKernel {
+class SparseSegmentGradOpBase : public OpKernel {
  public:
-  explicit SparseSegmentMeanGradOp(OpKernelConstruction* context)
-      : OpKernel(context) {}
+  explicit SparseSegmentGradOpBase(OpKernelConstruction* context, bool is_sqrtn)
+      : OpKernel(context), is_sqrtn_(is_sqrtn) {}
 
   void Compute(OpKernelContext* context) override {
     const Tensor& input = context->input(0);
@@ -437,7 +466,11 @@ class SparseSegmentMeanGradOp : public OpKernel {
       scaling[segment_vec(i)] += 1;
     }
     for (int i = 0; i < scaling.size(); ++i) {
-      scaling[i] = 1.0 / std::max(scaling[i], 1.0);
+      if (is_sqrtn_) {
+        scaling[i] = 1.0 / sqrt(std::max(scaling[i], 1.0));
+      } else {
+        scaling[i] = 1.0 / std::max(scaling[i], 1.0);
+      }
     }
 
     auto output_flat = output->flat_outer_dims<T>();
@@ -468,16 +501,40 @@ class SparseSegmentMeanGradOp : public OpKernel {
       is_modified[output_idx] = true;
     }
   }
+
+ private:
+  const bool is_sqrtn_;
+};
+
+template <class T>
+class SparseSegmentMeanGradOp : public SparseSegmentGradOpBase<T> {
+ public:
+  explicit SparseSegmentMeanGradOp(OpKernelConstruction* context)
+      : SparseSegmentGradOpBase<T>(context, false /*is_sqrtn*/) {}
+};
+
+template <class T>
+class SparseSegmentSqrtNGradOp : public SparseSegmentGradOpBase<T> {
+ public:
+  explicit SparseSegmentSqrtNGradOp(OpKernelConstruction* context)
+      : SparseSegmentGradOpBase<T>(context, true /*is_sqrtn*/) {}
 };
 
 #define REGISTER_CPU_SPARSE_KERNELS(type)                 \
   REGISTER_KERNEL_BUILDER(Name("SparseSegmentMeanGrad")   \
                               .Device(DEVICE_CPU)         \
                               .TypeConstraint<type>("T"), \
                           SparseSegmentMeanGradOp<type>);
-
 REGISTER_CPU_SPARSE_KERNELS(float);
 REGISTER_CPU_SPARSE_KERNELS(double);
+#undef REGISTER_CPU_SPARSE_KERNELS
 
+#define REGISTER_CPU_SPARSE_KERNELS(type)                 \
+  REGISTER_KERNEL_BUILDER(Name("SparseSegmentSqrtNGrad")  \
+                              .Device(DEVICE_CPU)         \
+                              .TypeConstraint<type>("T"), \
+                          SparseSegmentSqrtNGradOp<type>);
+REGISTER_CPU_SPARSE_KERNELS(float);
+REGISTER_CPU_SPARSE_KERNELS(double);
 #undef REGISTER_CPU_SPARSE_KERNELS
 }  // namespace tensorflow
@@ -468,6 +468,7 @@ REGISTER_OP_GRADIENT("Mean", MeanGrad);
 // REGISTER_OP_GRADIENT("SegmentMean", SegmentMeanGrad);
 // REGISTER_OP_GRADIENT("SparseSegmentSum", SparseSegmentSumGrad);
 // REGISTER_OP_GRADIENT("SparseSegmentMean", SparseSegmentMeanGrad);
+// REGISTER_OP_GRADIENT("SparseSegmentSqrtN", SparseSegmentSqrtNGrad);
 // REGISTER_OP_GRADIENT("SegmentMin", SegmentMinGrad);
 // REGISTER_OP_GRADIENT("SegmentMax", SegmentMaxGrad);
 // REGISTER_OP_GRADIENT("UnsortedSegmentSum", UnsortedSegmentSumGrad);
 
@@ -921,6 +921,49 @@ segment_ids: segment_ids passed to the corresponding SparseSegmentMean op.
 output_dim0: dimension 0 of "data" passed to SparseSegmentMean op.
 )doc");
 
+REGISTER_OP("SparseSegmentSqrtN")
+    .Input("data: T")
+    .Input("indices: int32")
+    .Input("segment_ids: int32")
+    .Output("output: T")
+    .Attr("T: {float, double}")
+    .Doc(R"doc(
+Computes the sum along sparse segments of a tensor divided by the sqrt of N.
+
+N is the size of the segment being reduced.
+
+Read [the section on
+Segmentation](../../api_docs/python/math_ops.md#segmentation) for an explanation
+of segments.
+
+indices: A 1-D tensor. Has same rank as `segment_ids`.
+
+segment_ids: A 1-D tensor. Values should be sorted and can be repeated.
+
+output: Has same shape as data, except for dimension 0 which
+has size `k`, the number of segments.
+
+)doc");
+
+REGISTER_OP("SparseSegmentSqrtNGrad")
+    .Input("grad: T")
+    .Input("indices: int32")
+    .Input("segment_ids: int32")
+    .Input("output_dim0: int32")
+    .Output("output: T")
+    .Attr("T: {float, double}")
+    .Doc(R"doc(
+Computes gradients for SparseSegmentSqrtN.
+
+Returns tensor "output" with same shape as grad, except for dimension 0 whose
+value is output_dim0.
+
+grad: gradient propagated to the SparseSegmentSqrtN op.
+indices: indices passed to the corresponding SparseSegmentSqrtN op.
+segment_ids: segment_ids passed to the corresponding SparseSegmentSqrtN op.
+output_dim0: dimension 0 of "data" passed to SparseSegmentSqrtN op.
+)doc");
+
 REGISTER_OP("All")
     .Input("input: bool")
     .Input("reduction_indices: int32")
 
@@ -7894,6 +7894,79 @@ op {
   summary: "Computes gradients for SparseSegmentMean."
   description: "Returns tensor \"output\" with same shape as grad, except for dimension 0 whose\nvalue is output_dim0."
 }
+op {
+  name: "SparseSegmentSqrtN"
+  input_arg {
+    name: "data"
+    type_attr: "T"
+  }
+  input_arg {
+    name: "indices"
+    description: "A 1-D tensor. Has same rank as `segment_ids`."
+    type: DT_INT32
+  }
+  input_arg {
+    name: "segment_ids"
+    description: "A 1-D tensor. Values should be sorted and can be repeated."
+    type: DT_INT32
+  }
+  output_arg {
+    name: "output"
+    description: "Has same shape as data, except for dimension 0 which\nhas size `k`, the number of segments."
+    type_attr: "T"
+  }
+  attr {
+    name: "T"
+    type: "type"
+    allowed_values {
+      list {
+        type: DT_FLOAT
+        type: DT_DOUBLE
+      }
+    }
+  }
+  summary: "Computes the sum along sparse segments of a tensor divided by the sqrt of N."
+  description: "N is the size of the segment being reduced.\n\nRead [the section on\nSegmentation](../../api_docs/python/math_ops.md#segmentation) for an explanation\nof segments."
+}
+op {
+  name: "SparseSegmentSqrtNGrad"
+  input_arg {
+    name: "grad"
+    description: "gradient propagated to the SparseSegmentSqrtN op."
+    type_attr: "T"
+  }
+  input_arg {
+    name: "indices"
+    description: "indices passed to the corresponding SparseSegmentSqrtN op."
+    type: DT_INT32
+  }
+  input_arg {
+    name: "segment_ids"
+    description: "segment_ids passed to the corresponding SparseSegmentSqrtN op."
+    type: DT_INT32
+  }
+  input_arg {
+    name: "output_dim0"
+    description: "dimension 0 of \"data\" passed to SparseSegmentSqrtN op."
+    type: DT_INT32
+  }
+  output_arg {
+    name: "output"
+    type_attr: "T"
+  }
+  attr {
+    name: "T"
+    type: "type"
+    allowed_values {
+      list {
+        type: DT_FLOAT
+        type: DT_DOUBLE
+      }
+    }
+  }
+  summary: "Computes gradients for SparseSegmentSqrtN."
+  description: "Returns tensor \"output\" with same shape as grad, except for dimension 0 whose\nvalue is output_dim0."
+}
 op {
   name: "SparseSegmentSum"
   input_arg {