pytorch
diff --git a/‎aten/src/ATen/Context.cpp‎
Lines changed: 4 additions & 1 deletion b/‎aten/src/ATen/Context.cpp‎
Lines changed: 4 additions & 1 deletion
diff --git a/‎aten/src/ATen/OpaqueTensorImpl.h‎
Lines changed: 54 additions & 29 deletions b/‎aten/src/ATen/OpaqueTensorImpl.h‎
Lines changed: 54 additions & 29 deletions
diff --git a/‎aten/src/ATen/SparseTensorImpl.h‎
Lines changed: 49 additions & 26 deletions b/‎aten/src/ATen/SparseTensorImpl.h‎
Lines changed: 49 additions & 26 deletions
diff --git a/‎aten/src/ATen/native/Activation.cpp‎
Lines changed: 2 additions & 2 deletions b/‎aten/src/ATen/native/Activation.cpp‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎aten/src/ATen/native/LegacyDefinitions.cpp‎
Lines changed: 1 addition & 1 deletion b/‎aten/src/ATen/native/LegacyDefinitions.cpp‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎aten/src/ATen/quantized/QTensorImpl.h‎
Lines changed: 46 additions & 6 deletions b/‎aten/src/ATen/quantized/QTensorImpl.h‎
Lines changed: 46 additions & 6 deletions
diff --git a/‎aten/src/TH/THTensor.cpp‎
Lines changed: 1 addition & 2 deletions b/‎aten/src/TH/THTensor.cpp‎
Lines changed: 1 addition & 2 deletions
diff --git a/‎c10/core/TensorImpl.cpp‎
Lines changed: 1 addition & 0 deletions b/‎c10/core/TensorImpl.cpp‎
Lines changed: 1 addition & 0 deletions
@@ -112,9 +112,12 @@ bool Context::setFlushDenormal(bool on) {
   return at::cpu::set_flush_denormal(on);
 }
 
+// NOTE: We also check `at::NonVariableTypeMode`, and if it's enabled we always
+// return non-Variable type in this function.
+// See NOTE [ Treating Variables as non-Variables in type dispatch ]
 TypeExtendedInterface& getType(TensorOptions options) {
   return globalContext().getType(
-            options.backend(), typeMetaToScalarType(options.dtype()), options.is_variable());
+            options.backend(), typeMetaToScalarType(options.dtype()), options.is_variable() && !at::NonVariableTypeMode::is_enabled());
 }
 
 // NOTE: We also check `at::NonVariableTypeMode`, and if it's enabled we always
 
@@ -77,41 +77,66 @@ struct CAFFE2_API OpaqueTensorImpl : public TensorImpl {
     AT_ERROR("opaque tensors do not have storage");
   }
 
-// NOTE: `shallow_copy_and_detach()` does not copy the following TensorImpl fields:
-// 1. the AutogradMeta pointer, because it is unique for each Variable.
-// 2. the version counter, because it is set to the passed in `version_counter`.
-//    See NOTE [ Version Counter Sharing ] for details.
-//
-// NOTE: `allow_tensor_metadata_change` determines whether the TensorImpl shallow-copy
-// allows changes to its metadata (e.g. sizes / strides / storage / storage_offset).
-// See NOTE [ Metadata Change for a Detached Tensor ] for details.
-c10::intrusive_ptr<TensorImpl> shallow_copy_and_detach(
-    const c10::VariableVersion& version_counter,
-    bool allow_tensor_metadata_change) const override {
-  //AT_ASSERT(false);
-  auto impl = c10::make_intrusive<OpaqueTensorImpl<OpaqueHandle>>(
-    type_id(), dtype(), device(), opaque_handle_, sizes_);
-  // TensorImpl general fields
-  // Note that some of these fields are not used in opaque tensor code,
-  // and we copy them here only for completeness.
-  impl->sizes_ = sizes_;
-  impl->strides_ = strides_;
-  impl->storage_offset_ = storage_offset_;
-  impl->is_contiguous_ = is_contiguous_;
-  impl->is_wrapped_number_ = is_wrapped_number_;
-  impl->reserved_ = reserved_;
-  impl->set_version_counter(version_counter);
-  impl->set_allow_tensor_metadata_change(allow_tensor_metadata_change);
-
-  // OpaqueTensorImpl-specific fields (none currently).
-  return impl;
-}
+  /**
+   * Return a TensorImpl that is a shallow-copy of this TensorImpl.
+   *
+   * For usage of `version_counter` and `allow_tensor_metadata_change`,
+   * see NOTE [ TensorImpl Shallow-Copying ].
+   */
+  c10::intrusive_ptr<TensorImpl> shallow_copy_and_detach(
+      const c10::VariableVersion& version_counter,
+      bool allow_tensor_metadata_change) const override {
+    auto impl = c10::make_intrusive<OpaqueTensorImpl<OpaqueHandle>>(
+      type_id(), dtype(), device(), opaque_handle_, sizes_);
+    copy_tensor_data(
+      /*src_impl=*/this,
+      /*dest_impl=*/impl.get(),
+      /*version_counter=*/version_counter,
+      /*allow_tensor_metadata_change=*/allow_tensor_metadata_change);
+    impl->refresh_numel();
+    return impl;
+  }
+
+  /**
+   * Shallow-copies data from another TensorImpl into this TensorImpl.
+   *
+   * For why this function doesn't check this TensorImpl's `allow_tensor_metadata_change_`,
+   * see NOTE [ TensorImpl Shallow-Copying ].
+   */
+  void shallow_copy_from(const c10::intrusive_ptr<TensorImpl>& impl) override {
+    AT_ASSERT(typeid(*(impl.get())) == typeid(OpaqueTensorImpl<OpaqueHandle>));
+    auto opaque_impl = static_cast<const OpaqueTensorImpl<OpaqueHandle>*>(impl.get());
+    copy_tensor_data(
+      /*src_impl=*/opaque_impl,
+      /*dest_impl=*/this,
+      /*version_counter=*/version_counter(),
+      /*allow_tensor_metadata_change=*/allow_tensor_metadata_change());
+    refresh_numel();
+  }
+
   OpaqueHandle& unsafe_opaque_handle() {
     return opaque_handle_;
   }
 
 private:
   OpaqueHandle opaque_handle_;
+
+  /**
+   * Copy the storage pointer and the tensor metadata fields (e.g. sizes / strides / storage_offset)
+   * from one TensorImpl to another TensorImpl.
+   *
+   * For usage of `version_counter` and `allow_tensor_metadata_change`, see NOTE [ TensorImpl Shallow-Copying ].
+   */
+  static void copy_tensor_data(
+      const OpaqueTensorImpl<OpaqueHandle>* src_opaque_impl,
+      OpaqueTensorImpl<OpaqueHandle>* dest_opaque_impl,
+      const c10::VariableVersion& version_counter,
+      bool allow_tensor_metadata_change) {
+    TensorImpl::copy_tensor_data(src_opaque_impl, dest_opaque_impl, version_counter, allow_tensor_metadata_change);
+
+    // OpaqueTensorImpl-specific fields.
+    dest_opaque_impl->opaque_handle_ = src_opaque_impl->opaque_handle_;
+  }
 };
 
 } // namespace at
@@ -183,41 +183,64 @@ struct CAFFE2_API SparseTensorImpl : public TensorImpl {
   // make it happen
   void set_indices_and_values_unsafe(const Tensor& indices, const Tensor& values);
 
-  // NOTE: `shallow_copy_and_detach()` does not copy the following TensorImpl fields:
-  // 1. the AutogradMeta pointer, because it is unique for each Variable.
-  // 2. the version counter, because it is set to the passed in `version_counter`.
-  //    See NOTE [ Version Counter Sharing ] for details.
-  //
-  // NOTE: `allow_tensor_metadata_change` determines whether the TensorImpl shallow-copy
-  // allows changes to its metadata (e.g. sizes / strides / storage / storage_offset).
-  // See NOTE [ Metadata Change for a Detached Tensor ] for details.
+  /**
+   * Return a TensorImpl that is a shallow-copy of this TensorImpl.
+   *
+   * For usage of `version_counter` and `allow_tensor_metadata_change`,
+   * see NOTE [ TensorImpl Shallow-Copying ].
+   */
   c10::intrusive_ptr<TensorImpl> shallow_copy_and_detach(
       const c10::VariableVersion& version_counter,
       bool allow_tensor_metadata_change) const override {
     auto impl = c10::make_intrusive<SparseTensorImpl>(type_id(), dtype());
-    // TensorImpl general fields
-    // Note that these fields are not used in sparse tensor code, and we copy them here only for completeness.
-    impl->sizes_ = sizes_;
-    impl->strides_ = strides_;
-    impl->storage_offset_ = storage_offset_;
-    impl->is_contiguous_ = is_contiguous_;
-    impl->is_wrapped_number_ = is_wrapped_number_;
-    impl->reserved_ = reserved_;
-    impl->set_version_counter(version_counter);
-    impl->set_allow_tensor_metadata_change(allow_tensor_metadata_change);
-
-    // Sparse-specific fields
-    impl->sparse_dim_ = sparse_dim();
-    impl->dense_dim_ = dense_dim();
-    impl->indices_ = indices();
-    impl->values_ = values();
-    impl->device_opt_ = device();
-    impl->coalesced_ = coalesced();
+    copy_tensor_data(
+      /*src_impl=*/this,
+      /*dest_impl=*/impl.get(),
+      /*version_counter=*/version_counter,
+      /*allow_tensor_metadata_change=*/allow_tensor_metadata_change);
     impl->refresh_numel();
     return impl;
   }
+
+  /**
+   * Shallow-copies data from another TensorImpl into this TensorImpl.
+   *
+   * For why this function doesn't check this TensorImpl's `allow_tensor_metadata_change_`,
+   * see NOTE [ TensorImpl Shallow-Copying ].
+   */
+  void shallow_copy_from(const c10::intrusive_ptr<TensorImpl>& impl) override {
+    AT_ASSERT(typeid(*(impl.get())) == typeid(SparseTensorImpl));
+    auto sparse_impl = static_cast<const SparseTensorImpl*>(impl.get());
+    copy_tensor_data(
+      /*src_impl=*/sparse_impl,
+      /*dest_impl=*/this,
+      /*version_counter=*/version_counter(),
+      /*allow_tensor_metadata_change=*/allow_tensor_metadata_change());
+    refresh_numel();
+  }
 private:
     explicit SparseTensorImpl(at::TensorTypeId, const caffe2::TypeMeta&, at::Tensor indices, at::Tensor values);
+
+  /**
+   * Copy the storage pointer and the tensor metadata fields (e.g. sizes / strides / storage_offset)
+   * from one TensorImpl to another TensorImpl.
+   *
+   * For usage of `version_counter` and `allow_tensor_metadata_change`, see NOTE [ TensorImpl Shallow-Copying ].
+   */
+  static void copy_tensor_data(
+      const SparseTensorImpl* src_sparse_impl,
+      SparseTensorImpl* dest_sparse_impl,
+      const c10::VariableVersion& version_counter,
+      bool allow_tensor_metadata_change) {
+    TensorImpl::copy_tensor_data(src_sparse_impl, dest_sparse_impl, version_counter, allow_tensor_metadata_change);
+
+    // Sparse-specific fields
+    dest_sparse_impl->sparse_dim_ = src_sparse_impl->sparse_dim();
+    dest_sparse_impl->dense_dim_ = src_sparse_impl->dense_dim();
+    dest_sparse_impl->indices_ = src_sparse_impl->indices();
+    dest_sparse_impl->values_ = src_sparse_impl->values();
+    dest_sparse_impl->coalesced_ = src_sparse_impl->coalesced();
+  }
 };
 
 } // namespace at
@@ -42,11 +42,11 @@ Tensor & celu_(Tensor & self, Scalar alpha) {
 }
 
 Tensor rrelu(const Tensor & self, Scalar lower, Scalar upper, bool training, Generator* generator) {
-  return at::rrelu_with_noise(self, at::empty({0}, self.options()), lower, upper, training, generator);
+  return at::rrelu_with_noise(self, at::empty_like(self), lower, upper, training, generator);
 }
 
 Tensor & rrelu_(Tensor & self, Scalar lower, Scalar upper, bool training, Generator* generator) {
-  return at::rrelu_with_noise_(self, at::empty({0}, self.options()), lower, upper, training, generator);
+  return at::rrelu_with_noise_(self, at::empty_like(self), lower, upper, training, generator);
 }
 
 // computes `result = self <= threshold ? value : other`
 
@@ -9,7 +9,7 @@ namespace at { namespace native {
 // Methods
 
 void* data_ptr(const Tensor & self) {
-  return self.unsafeGetTensorImpl()->slow_data();
+  return self.unsafeGetTensorImpl()->data();
 }
 
 Tensor & set_(Tensor& self, Storage source) {
 
@@ -25,24 +25,64 @@ struct CAFFE2_API QTensorImpl : public c10::TensorImpl {
     return quantizer_;
   }
 
+  /**
+   * Return a TensorImpl that is a shallow-copy of this TensorImpl.
+   *
+   * For usage of `version_counter` and `allow_tensor_metadata_change`,
+   * see NOTE [ TensorImpl Shallow-Copying ].
+   */
   c10::intrusive_ptr<TensorImpl> shallow_copy_and_detach(
       const c10::VariableVersion& version_counter,
       bool allow_tensor_metadata_change) const override {
     auto impl = c10::make_intrusive<QTensorImpl>(
         Storage(storage()), type_id(), quantizer_);
-    impl->set_sizes_and_strides(sizes(), strides());
-    impl->storage_offset_ = storage_offset_;
-    impl->is_wrapped_number_ = is_wrapped_number_;
-    impl->reserved_ = reserved_;
+    copy_tensor_data(
+      /*src_impl=*/this,
+      /*dest_impl=*/impl.get(),
+      /*version_counter=*/version_counter,
+      /*allow_tensor_metadata_change=*/allow_tensor_metadata_change);
     impl->refresh_numel();
     impl->refresh_contiguous();
-    impl->set_version_counter(version_counter);
-    impl->set_allow_tensor_metadata_change(allow_tensor_metadata_change);
     return impl;
   }
 
+  /**
+   * Shallow-copies data from another TensorImpl into this TensorImpl.
+   *
+   * For why this function doesn't check this TensorImpl's `allow_tensor_metadata_change_`,
+   * see NOTE [ TensorImpl Shallow-Copying ].
+   */
+  void shallow_copy_from(const c10::intrusive_ptr<TensorImpl>& impl) override {
+    AT_ASSERT(typeid(*(impl.get())) == typeid(QTensorImpl));
+    auto q_impl = static_cast<const QTensorImpl*>(impl.get());
+    copy_tensor_data(
+      /*src_impl=*/q_impl,
+      /*dest_impl=*/this,
+      /*version_counter=*/version_counter(),
+      /*allow_tensor_metadata_change=*/allow_tensor_metadata_change());
+    refresh_numel();
+    refresh_contiguous();
+  }
+
  private:
   QuantizerPtr quantizer_;
+
+  /**
+   * Copy the storage pointer and the tensor metadata fields (e.g. sizes / strides / storage_offset)
+   * from one TensorImpl to another TensorImpl.
+   *
+   * For usage of `version_counter` and `allow_tensor_metadata_change`, see NOTE [ TensorImpl Shallow-Copying ].
+   */
+  static void copy_tensor_data(
+      const QTensorImpl* src_q_impl,
+      QTensorImpl* dest_q_impl,
+      const c10::VariableVersion& version_counter,
+      bool allow_tensor_metadata_change) {
+    TensorImpl::copy_tensor_data(src_q_impl, dest_q_impl, version_counter, allow_tensor_metadata_change);
+
+    // QTensorImpl-specific fields.
+    dest_q_impl->quantizer_ = src_q_impl->quantizer_;
+  }
 };
 
 } // namespace at
@@ -164,8 +164,7 @@ void THTensor_stealAndSetStoragePtr(THTensor* tensor, THStorage* storage) {
   // Caffe2 also has uninitialized dtype states, which we disallow here
   AT_ASSERT(tensor->storage().dtype() == storage->dtype());
 
-  // We used to allow this, but this breaks device caching,
-  // see Note [We regret making Variable hold a Tensor]
+  // We used to allow this, but this breaks device caching.
   // Let's put an actual error message for this one.
   TORCH_CHECK(tensor->storage().device() == storage->device(),
             "Attempted to set the storage of a tensor on device \"", tensor->storage().device(),
 
@@ -82,6 +82,7 @@ bool TensorImpl::compute_contiguous() const {
 }
 
 void TensorImpl::release_resources() {
+  autograd_meta_.reset();
   if (storage_) {
     storage_ = {};
   }
Original file line number	Diff line number	Diff line change
`@@ -112,9 +112,12 @@ bool Context::setFlushDenormal(bool on) {`
`112`	`112`	`return at::cpu::set_flush_denormal(on);`
`113`	`113`	`}`
`114`	`114`
	`115`	+// NOTE: We also check `at::NonVariableTypeMode`, and if it's enabled we always
	`116`	`+// return non-Variable type in this function.`
	`117`	`+// See NOTE [ Treating Variables as non-Variables in type dispatch ]`
`115`	`118`	`TypeExtendedInterface& getType(TensorOptions options) {`
`116`	`119`	`return globalContext().getType(`
`117`		`- options.backend(), typeMetaToScalarType(options.dtype()), options.is_variable());`
	`120`	`+ options.backend(), typeMetaToScalarType(options.dtype()), options.is_variable() && !at::NonVariableTypeMode::is_enabled());`
`118`	`121`	`}`
`119`	`122`
`120`	`123`	// NOTE: We also check `at::NonVariableTypeMode`, and if it's enabled we always
Original file line number	Diff line number	Diff line change
`@@ -42,11 +42,11 @@ Tensor & celu_(Tensor & self, Scalar alpha) {`
`42`	`42`	`}`
`43`	`43`
`44`	`44`	`Tensor rrelu(const Tensor & self, Scalar lower, Scalar upper, bool training, Generator* generator) {`
`45`		`- return at::rrelu_with_noise(self, at::empty({0}, self.options()), lower, upper, training, generator);`
	`45`	`+ return at::rrelu_with_noise(self, at::empty_like(self), lower, upper, training, generator);`
`46`	`46`	`}`
`47`	`47`
`48`	`48`	`Tensor & rrelu_(Tensor & self, Scalar lower, Scalar upper, bool training, Generator* generator) {`
`49`		`- return at::rrelu_with_noise_(self, at::empty({0}, self.options()), lower, upper, training, generator);`
	`49`	`+ return at::rrelu_with_noise_(self, at::empty_like(self), lower, upper, training, generator);`
`50`	`50`	`}`
`51`	`51`
`52`	`52`	// computes `result = self <= threshold ? value : other`
Original file line number	Diff line number	Diff line change
`@@ -9,7 +9,7 @@ namespace at { namespace native {`
`9`	`9`	`// Methods`
`10`	`10`
`11`	`11`	`void* data_ptr(const Tensor & self) {`
`12`		`- return self.unsafeGetTensorImpl()->slow_data();`
	`12`	`+ return self.unsafeGetTensorImpl()->data();`
`13`	`13`	`}`
`14`	`14`
`15`	`15`	`Tensor & set_(Tensor& self, Storage source) {`
Original file line number	Diff line number	Diff line change
`@@ -82,6 +82,7 @@ bool TensorImpl::compute_contiguous() const {`
`82`	`82`	`}`
`83`	`83`
`84`	`84`	`void TensorImpl::release_resources() {`
	`85`	`+ autograd_meta_.reset();`
`85`	`86`	`if (storage_) {`
`86`	`87`	`storage_ = {};`
`87`	`88`	`}`