Skip to content

Commit 82b5705

Browse files
James Reed authored and facebook-github-bot committed
Move abs, frac, reciprocal, and neg to TensorIterator (#19041)
Summary: I've been messing around with vectorizing the fusion compiler in JIT, and noticed that these ops were pathologically slow. I moved them to use TensorIterator + Vec256<> and got some speed wins. Benchmark script: ``` import torch, time ops = ['abs', 'neg', 'reciprocal', 'frac'] x = torch.rand(1024, 1024) NITER = 10000 print('op', 'time per iter (ms)', 'gops/s', 'GB/s', sep='\t') for op in ops: s = time.time() for i in range(NITER): getattr(x, op)() elapsed_sec = ((time.time() - s) / NITER) print(op, elapsed_sec * 1000, (1024*1024/elapsed_sec)/1e9, (1024*1024*4*2) / elapsed_sec / 1e9, sep='\t') ``` Before this change (on my mac with a skylake): ``` op time per iter (ms) gops/s GB/s abs 0.9730974197387695 1.0775652866097343 8.620522292877874 neg 1.0723679780960083 0.9778136063534356 7.822508850827485 reciprocal 1.2610594034194946 0.8315040490215421 6.6520323921723366 frac 1.1681334018707275 0.8976509004200546 7.181207203360437 ``` After this change: ``` op time per iter (ms) gops/s GB/s abs 0.5031076192855835 2.084198210889721 16.673585687117768 neg 0.4433974027633667 2.3648672578256087 18.91893806260487 reciprocal 0.47145988941192624 2.2241043693195985 17.79283495455679 frac 0.5036592721939087 2.0819154096627024 16.65532327730162 ``` So, after this change it looks like we are hitting machine peak for bandwidth and are bandwidth bound. Pull Request resolved: #19041 Differential Revision: D14862037 Pulled By: jamesr66a fbshipit-source-id: e2032ac0ca962dbf4120bb36812277c260e22912
1 parent 56b18ea commit 82b5705

File tree

15 files changed

+178
-117
lines changed

15 files changed

+178
-117
lines changed

aten/src/ATen/Declarations.cwrap

Lines changed: 0 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -879,7 +879,6 @@
879879
name: _th_abs
880880
cname: abs
881881
backends:
882-
- CPU
883882
- CUDA
884883
variants: function
885884
return: argument 0
@@ -1353,7 +1352,6 @@
13531352
types:
13541353
- floating_point
13551354
backends:
1356-
- CPU
13571355
- CUDA
13581356
cname: frac
13591357
variants: function
@@ -1368,7 +1366,6 @@
13681366
types:
13691367
- floating_point
13701368
backends:
1371-
- CPU
13721369
- CUDA
13731370
variants:
13741371
- function
@@ -1506,7 +1503,6 @@
15061503
types:
15071504
- floating_point
15081505
backends:
1509-
- CPU
15101506
- CUDA
15111507
variants:
15121508
- function
@@ -1523,7 +1519,6 @@
15231519
types:
15241520
- floating_point
15251521
backends:
1526-
- CPU
15271522
- CUDA
15281523
variants: function
15291524
options:
@@ -1536,7 +1531,6 @@
15361531
[[
15371532
name: _th_neg
15381533
backends:
1539-
- CPU
15401534
- CUDA
15411535
variants:
15421536
- function
@@ -1551,7 +1545,6 @@
15511545
[[
15521546
name: _th_neg_
15531547
backends:
1554-
- CPU
15551548
- CUDA
15561549
variants: function
15571550
options:

aten/src/ATen/core/Tensor.h

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -408,6 +408,8 @@ class CAFFE2_API Tensor {
408408
Tensor & fill_(const Tensor & value);
409409
Tensor floor() const;
410410
Tensor & floor_();
411+
Tensor frac() const;
412+
Tensor & frac_();
411413
Tensor ger(const Tensor & vec2) const;
412414
Tensor fft(int64_t signal_ndim, bool normalized=false) const;
413415
Tensor ifft(int64_t signal_ndim, bool normalized=false) const;
@@ -465,6 +467,10 @@ class CAFFE2_API Tensor {
465467
Tensor permute(IntArrayRef dims) const;
466468
Tensor pin_memory() const;
467469
Tensor pinverse(double rcond=1e-15) const;
470+
Tensor reciprocal() const;
471+
Tensor & reciprocal_();
472+
Tensor neg() const;
473+
Tensor & neg_();
468474
Tensor repeat(IntArrayRef repeats) const;
469475
Tensor repeat_interleave(const Tensor & repeats, c10::optional<int64_t> dim=c10::nullopt) const;
470476
Tensor repeat_interleave(int64_t repeats, c10::optional<int64_t> dim=c10::nullopt) const;
@@ -648,10 +654,7 @@ class CAFFE2_API Tensor {
648654
Tensor & digamma_();
649655
Tensor & polygamma_(int64_t n);
650656
Tensor & erfinv_();
651-
Tensor & frac_();
652657
Tensor & renorm_(Scalar p, int64_t dim, Scalar maxnorm);
653-
Tensor & reciprocal_();
654-
Tensor & neg_();
655658
Tensor & pow_(Scalar exponent);
656659
Tensor & pow_(const Tensor & exponent);
657660
Tensor & lerp_(const Tensor & end, Scalar weight);
@@ -718,10 +721,7 @@ class CAFFE2_API Tensor {
718721
Tensor digamma() const;
719722
Tensor polygamma(int64_t n) const;
720723
Tensor erfinv() const;
721-
Tensor frac() const;
722724
Tensor dist(const Tensor & other, Scalar p=2) const;
723-
Tensor reciprocal() const;
724-
Tensor neg() const;
725725
Tensor atan2(const Tensor & other) const;
726726
Tensor lerp(const Tensor & end, Scalar weight) const;
727727
Tensor lerp(const Tensor & end, const Tensor & weight) const;

aten/src/ATen/core/TensorMethods.h

Lines changed: 18 additions & 18 deletions
Original file line numberDiff line numberDiff line change
@@ -280,6 +280,12 @@ inline Tensor Tensor::floor() const {
280280
inline Tensor & Tensor::floor_() {
281281
return dispatch_type().floor_(*this);
282282
}
283+
inline Tensor Tensor::frac() const {
284+
return dispatch_type().frac(*this);
285+
}
286+
inline Tensor & Tensor::frac_() {
287+
return dispatch_type().frac_(*this);
288+
}
283289
inline Tensor Tensor::ger(const Tensor & vec2) const {
284290
return dispatch_type().ger(*this, vec2);
285291
}
@@ -451,6 +457,18 @@ inline Tensor Tensor::pin_memory() const {
451457
inline Tensor Tensor::pinverse(double rcond) const {
452458
return dispatch_type().pinverse(*this, rcond);
453459
}
460+
inline Tensor Tensor::reciprocal() const {
461+
return dispatch_type().reciprocal(*this);
462+
}
463+
inline Tensor & Tensor::reciprocal_() {
464+
return dispatch_type().reciprocal_(*this);
465+
}
466+
inline Tensor Tensor::neg() const {
467+
return dispatch_type().neg(*this);
468+
}
469+
inline Tensor & Tensor::neg_() {
470+
return dispatch_type().neg_(*this);
471+
}
454472
inline Tensor Tensor::repeat(IntArrayRef repeats) const {
455473
return dispatch_type().repeat(*this, repeats);
456474
}
@@ -1000,18 +1018,9 @@ inline Tensor & Tensor::polygamma_(int64_t n) {
10001018
inline Tensor & Tensor::erfinv_() {
10011019
return dispatch_type().erfinv_(*this);
10021020
}
1003-
inline Tensor & Tensor::frac_() {
1004-
return dispatch_type().frac_(*this);
1005-
}
10061021
inline Tensor & Tensor::renorm_(Scalar p, int64_t dim, Scalar maxnorm) {
10071022
return dispatch_type().renorm_(*this, p, dim, maxnorm);
10081023
}
1009-
inline Tensor & Tensor::reciprocal_() {
1010-
return dispatch_type().reciprocal_(*this);
1011-
}
1012-
inline Tensor & Tensor::neg_() {
1013-
return dispatch_type().neg_(*this);
1014-
}
10151024
inline Tensor & Tensor::pow_(Scalar exponent) {
10161025
return dispatch_type().pow_(*this, exponent);
10171026
}
@@ -1210,18 +1219,9 @@ inline Tensor Tensor::polygamma(int64_t n) const {
12101219
inline Tensor Tensor::erfinv() const {
12111220
return dispatch_type().erfinv(*this);
12121221
}
1213-
inline Tensor Tensor::frac() const {
1214-
return dispatch_type().frac(*this);
1215-
}
12161222
inline Tensor Tensor::dist(const Tensor & other, Scalar p) const {
12171223
return dispatch_type().dist(*this, other, p);
12181224
}
1219-
inline Tensor Tensor::reciprocal() const {
1220-
return dispatch_type().reciprocal(*this);
1221-
}
1222-
inline Tensor Tensor::neg() const {
1223-
return dispatch_type().neg(*this);
1224-
}
12251225
inline Tensor Tensor::atan2(const Tensor & other) const {
12261226
return dispatch_type().atan2(*this, other);
12271227
}

aten/src/ATen/core/Type.h

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -282,6 +282,8 @@ struct CAFFE2_API Type {
282282
virtual Tensor & fill_(Tensor & self, const Tensor & value) const = 0;
283283
virtual Tensor floor(const Tensor & self) const = 0;
284284
virtual Tensor & floor_(Tensor & self) const = 0;
285+
virtual Tensor frac(const Tensor & self) const = 0;
286+
virtual Tensor & frac_(Tensor & self) const = 0;
285287
virtual Tensor ger(const Tensor & self, const Tensor & vec2) const = 0;
286288
virtual Tensor fft(const Tensor & self, int64_t signal_ndim, bool normalized) const = 0;
287289
virtual Tensor ifft(const Tensor & self, int64_t signal_ndim, bool normalized) const = 0;
@@ -339,6 +341,10 @@ struct CAFFE2_API Type {
339341
virtual Tensor permute(const Tensor & self, IntArrayRef dims) const = 0;
340342
virtual Tensor pin_memory(const Tensor & self) const = 0;
341343
virtual Tensor pinverse(const Tensor & self, double rcond) const = 0;
344+
virtual Tensor reciprocal(const Tensor & self) const = 0;
345+
virtual Tensor & reciprocal_(Tensor & self) const = 0;
346+
virtual Tensor neg(const Tensor & self) const = 0;
347+
virtual Tensor & neg_(Tensor & self) const = 0;
342348
virtual Tensor repeat(const Tensor & self, IntArrayRef repeats) const = 0;
343349
virtual Tensor repeat_interleave(const Tensor & repeats) const = 0;
344350
virtual Tensor repeat_interleave(const Tensor & self, const Tensor & repeats, c10::optional<int64_t> dim) const = 0;
@@ -523,10 +529,7 @@ struct CAFFE2_API Type {
523529
virtual Tensor & digamma_(Tensor & self) const = 0;
524530
virtual Tensor & polygamma_(Tensor & self, int64_t n) const = 0;
525531
virtual Tensor & erfinv_(Tensor & self) const = 0;
526-
virtual Tensor & frac_(Tensor & self) const = 0;
527532
virtual Tensor & renorm_(Tensor & self, Scalar p, int64_t dim, Scalar maxnorm) const = 0;
528-
virtual Tensor & reciprocal_(Tensor & self) const = 0;
529-
virtual Tensor & neg_(Tensor & self) const = 0;
530533
virtual Tensor & pow_(Tensor & self, Scalar exponent) const = 0;
531534
virtual Tensor & pow_(Tensor & self, const Tensor & exponent) const = 0;
532535
virtual Tensor & lerp_(Tensor & self, const Tensor & end, Scalar weight) const = 0;
@@ -593,10 +596,7 @@ struct CAFFE2_API Type {
593596
virtual Tensor digamma(const Tensor & self) const = 0;
594597
virtual Tensor polygamma(int64_t n, const Tensor & self) const = 0;
595598
virtual Tensor erfinv(const Tensor & self) const = 0;
596-
virtual Tensor frac(const Tensor & self) const = 0;
597599
virtual Tensor dist(const Tensor & self, const Tensor & other, Scalar p) const = 0;
598-
virtual Tensor reciprocal(const Tensor & self) const = 0;
599-
virtual Tensor neg(const Tensor & self) const = 0;
600600
virtual Tensor atan2(const Tensor & self, const Tensor & other) const = 0;
601601
virtual Tensor lerp(const Tensor & self, const Tensor & end, Scalar weight) const = 0;
602602
virtual Tensor lerp(const Tensor & self, const Tensor & end, const Tensor & weight) const = 0;

aten/src/ATen/cpu/vec256/vec256_base.h

Lines changed: 7 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -194,6 +194,9 @@ struct Vec256 {
194194
Vec256<T> expm1() const {
195195
return map(std::expm1);
196196
}
197+
Vec256<T> frac() const {
198+
return *this - this->trunc();
199+
}
197200
Vec256<T> log() const {
198201
return map(std::log);
199202
}
@@ -219,7 +222,10 @@ struct Vec256 {
219222
return map(std::floor);
220223
}
221224
Vec256<T> neg() const {
222-
return map([](T x) { return -x; });
225+
// NB: the trailing return type is needed because we need to coerce the
226+
// return value back to T in the case of unary operator- incuring a
227+
// promotion
228+
return map([](T x) -> T { return -x; });
223229
}
224230
Vec256<T> round() const {
225231
return map(std::nearbyint);

aten/src/ATen/cpu/vec256/vec256_double.h

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -141,6 +141,7 @@ template <> class Vec256<double> {
141141
Vec256<double> floor() const {
142142
return _mm256_floor_pd(values);
143143
}
144+
Vec256<double> frac() const;
144145
Vec256<double> neg() const {
145146
return _mm256_xor_pd(_mm256_set1_pd(-0.), values);
146147
}
@@ -216,6 +217,11 @@ Vec256<double> inline operator/(const Vec256<double>& a, const Vec256<double>& b
216217
return _mm256_div_pd(a, b);
217218
}
218219

220+
// frac. Implement this here so we can use subtraction.
221+
Vec256<double> Vec256<double>::frac() const {
222+
return *this - this->trunc();
223+
}
224+
219225
// Implements the IEEE 754 201X `maximum` operation, which propagates NaN if
220226
// either input is a NaN.
221227
template <>

aten/src/ATen/cpu/vec256/vec256_float.h

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -131,6 +131,7 @@ template <> class Vec256<float> {
131131
Vec256<float> log1p() const {
132132
return Vec256<float>(Sleef_log1pf8_u10(values));
133133
}
134+
Vec256<float> frac() const;
134135
Vec256<float> sin() const {
135136
return map(std::sin);
136137
}
@@ -224,6 +225,11 @@ Vec256<float> inline operator/(const Vec256<float>& a, const Vec256<float>& b) {
224225
return _mm256_div_ps(a, b);
225226
}
226227

228+
// frac. Implement this here so we can use subtraction
229+
Vec256<float> Vec256<float>::frac() const {
230+
return *this - this->trunc();
231+
}
232+
227233
// Implements the IEEE 754 201X `maximum` operation, which propagates NaN if
228234
// either input is a NaN.
229235
template <>

aten/src/ATen/cpu/vec256/vec256_int.h

Lines changed: 19 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -96,6 +96,8 @@ struct Vec256<int64_t> : public Vec256i {
9696
auto inverse = _mm256_xor_si256(values, is_larger);
9797
return _mm256_sub_epi64(inverse, is_larger);
9898
}
99+
Vec256<int64_t> frac() const;
100+
Vec256<int64_t> neg() const;
99101
Vec256<int64_t> operator==(const Vec256<int64_t>& other) const {
100102
return _mm256_cmpeq_epi64(values, other.values);
101103
}
@@ -185,6 +187,8 @@ struct Vec256<int32_t> : public Vec256i {
185187
Vec256<int32_t> abs() const {
186188
return _mm256_abs_epi32(values);
187189
}
190+
Vec256<int32_t> frac() const;
191+
Vec256<int32_t> neg() const;
188192
Vec256<int32_t> operator==(const Vec256<int32_t>& other) const {
189193
return _mm256_cmpeq_epi32(values, other.values);
190194
}
@@ -369,6 +373,8 @@ struct Vec256<int16_t> : public Vec256i {
369373
Vec256<int16_t> abs() const {
370374
return _mm256_abs_epi16(values);
371375
}
376+
Vec256<int16_t> frac() const;
377+
Vec256<int16_t> neg() const;
372378
Vec256<int16_t> operator==(const Vec256<int16_t>& other) const {
373379
return _mm256_cmpeq_epi16(values, other.values);
374380
}
@@ -419,6 +425,19 @@ Vec256<int16_t> inline operator-(const Vec256<int16_t>& a, const Vec256<int16_t>
419425
return _mm256_sub_epi16(a, b);
420426
}
421427

428+
// Negation. Defined here so we can utilize operator-
429+
Vec256<int64_t> Vec256<int64_t>::neg() const {
430+
return Vec256<int64_t>(0) - *this;
431+
}
432+
433+
Vec256<int32_t> Vec256<int32_t>::neg() const {
434+
return Vec256<int32_t>(0) - *this;
435+
}
436+
437+
Vec256<int16_t> Vec256<int16_t>::neg() const {
438+
return Vec256<int16_t>(0) - *this;
439+
}
440+
422441
// Emulate operations with no native 64-bit support in avx,
423442
// by extracting each element, performing the operation pointwise,
424443
// then combining the results into a vector.

aten/src/ATen/native/LegacyDefinitions.cpp

Lines changed: 0 additions & 36 deletions
Original file line numberDiff line numberDiff line change
@@ -162,22 +162,10 @@ Tensor & erfinv_(Tensor& self) {
162162
return at::legacy::th::_th_erfinv_(self);
163163
}
164164

165-
Tensor & frac_(Tensor& self) {
166-
return at::legacy::th::_th_frac_(self);
167-
}
168-
169165
Tensor & renorm_(Tensor& self, Scalar p, int64_t dim, Scalar maxnorm) {
170166
return at::legacy::th::_th_renorm_(self, p, dim, maxnorm);
171167
}
172168

173-
Tensor & reciprocal_(Tensor& self) {
174-
return at::legacy::th::_th_reciprocal_(self);
175-
}
176-
177-
Tensor & neg_(Tensor& self) {
178-
return at::legacy::th::_th_neg_(self);
179-
}
180-
181169
Tensor & pow_(Tensor& self, Scalar exponent) {
182170
return at::legacy::th::_th_pow_(self, exponent);
183171
}
@@ -563,34 +551,10 @@ Tensor erfinv(const Tensor & self) {
563551
return at::legacy::th::_th_erfinv(self);
564552
}
565553

566-
Tensor & frac_out(Tensor & result, const Tensor & self) {
567-
return at::legacy::th::_th_frac_out(result, self);
568-
}
569-
570-
Tensor frac(const Tensor & self) {
571-
return at::legacy::th::_th_frac(self);
572-
}
573-
574554
Tensor dist(const Tensor & self, const Tensor & other, Scalar p) {
575555
return at::legacy::th::_th_dist(self, other, p);
576556
}
577557

578-
Tensor & reciprocal_out(Tensor & result, const Tensor & self) {
579-
return at::legacy::th::_th_reciprocal_out(result, self);
580-
}
581-
582-
Tensor reciprocal(const Tensor & self) {
583-
return at::legacy::th::_th_reciprocal(self);
584-
}
585-
586-
Tensor & neg_out(Tensor & result, const Tensor & self) {
587-
return at::legacy::th::_th_neg_out(result, self);
588-
}
589-
590-
Tensor neg(const Tensor & self) {
591-
return at::legacy::th::_th_neg(self);
592-
}
593-
594558
Tensor & atan2_out(Tensor & result, const Tensor & self, const Tensor & other) {
595559
return at::legacy::th::_th_atan2_out(result, self, other);
596560
}

0 commit comments

Comments
 (0)