Implement tensor.refine_names (#25842)

zou3519 · facebook-github-bot · commit e544f8859038 · 2019-09-12T22:53:40.000-07:00
Summary: Pull Request resolved: #25842 `tensor.refine_names(*names)` takes `tensor` and attempts to name its dimensions `names` out-of-place. If a dimension `i` already had a name, then it cannot be changed (so `tensor.names[i]` must equal `names[i]`); if the original dimension did not have a name, then the new name (`names[i]`) can be anything. `tensor.refine_names(*names)` also accepts a glob '*' that greedily selects names from `tensor`. Here are some examples: - `Tensor[None].refine_names('N') -> Tensor[N]` - `Tensor[N].refine_names('N') -> Tensor[N]` - `Tensor[N].refine_names('D') -> Error!` - `Tensor[N].refine_names(None) -> Error!` - `Tensor[None, None].refine_names('*', 'D') -> Tensor[None, D]` Test Plan: - new tests [namedtensor ci] Differential Revision: D17255548 Pulled By: zou3519 fbshipit-source-id: fdbdb3a12f24fbe37ce1e53ed09dc8a42589d928
diff --git a/aten/src/ATen/core/NamedTensor.cpp b/aten/src/ATen/core/NamedTensor.cpp
@@ -41,6 +41,10 @@ DimnameList default_names(size_t len) {
   return DimnameList(&all_unnamed.front(), len);
 }
 
+// Tensor-level overload: validates `names` for `tensor` by delegating to the
+// TensorImpl-based check in the impl namespace.
+void check_names_valid_for(const Tensor& tensor, DimnameList names) {
+  auto* tensor_impl = tensor.unsafeGetTensorImpl();
+  impl::check_names_valid_for(tensor_impl, names);
+}
+
 namespace impl {
 
 // Two Dimnames cannot be in the same Tensor if one of them can refer to the other.
@@ -91,7 +95,7 @@ static const NamedTensorMeta* get_named_tensor_meta(const TensorImpl* impl) {
   return static_cast<const NamedTensorMeta*>(impl->named_tensor_meta());
 }
 
-void check_valid_names(TensorImpl* impl, DimnameList names) {
+void check_names_valid_for(TensorImpl* impl, DimnameList names) {
   auto ndim = impl->dim();
   TORCH_CHECK(
       ndim <= kMaxNamedTensorDim,
@@ -109,7 +113,7 @@ void internal_set_names_inplace(TensorImpl* impl, optional<DimnameList> names) {
     impl->set_named_tensor_meta(nullptr);
     return;
   }
-  check_valid_names(impl, *names);
+  check_names_valid_for(impl, *names);
   auto* meta = get_named_tensor_meta(impl);
   if (meta == nullptr) {
     impl->set_named_tensor_meta(c10::guts::make_unique<NamedTensorMeta>(*names));
@@ -120,7 +124,7 @@ void internal_set_names_inplace(TensorImpl* impl, optional<DimnameList> names) {
 
 void internal_set_names_inplace(TensorImpl* impl, std::vector<Dimname>&& names, bool validate_names) {
   if (validate_names) {
-    check_valid_names(impl, names);
+    check_names_valid_for(impl, names);
   }
   auto* meta = get_named_tensor_meta(impl);
   if (meta == nullptr) {
diff --git a/aten/src/ATen/core/NamedTensor.h b/aten/src/ATen/core/NamedTensor.h
@@ -73,6 +73,7 @@ struct CAFFE2_API NoNamesGuard {
   bool prev_mode;
 };
 
+// Checks that `names` can be used to name the dimensions of `tensor`;
+// forwards to impl::check_names_valid_for on the tensor's underlying TensorImpl.
+CAFFE2_API void check_names_valid_for(const Tensor& tensor, DimnameList names);
 
 // Sets the names of `tensor` to be `names`.
 CAFFE2_API Tensor& internal_set_names_inplace(Tensor& tensor, optional<DimnameList> names);
@@ -89,6 +90,8 @@ namespace impl {
 CAFFE2_API void internal_set_names_inplace(TensorImpl* impl, optional<DimnameList> names);
 CAFFE2_API void internal_set_names_inplace(TensorImpl* impl, std::vector<Dimname>&& names, bool validate_names);
 
+// Checks that `names` can be used to name the dimensions of `impl`
+// (for example, that impl->dim() does not exceed kMaxNamedTensorDim).
+CAFFE2_API void check_names_valid_for(TensorImpl* impl, DimnameList names);
+
 // Returns true if the tensor's names exist and are not all 'None'.
 // Returns false if the tensor's names don't exist (were not allocated),
 // or if all names are 'None'.
diff --git a/aten/src/ATen/core/TensorBody.h b/aten/src/ATen/core/TensorBody.h
@@ -403,6 +403,9 @@ class CAFFE2_API Tensor {
   #ifdef BUILD_NAMEDTENSOR
   Tensor align_to(DimnameList names) const;
   #endif
+  #ifdef BUILD_NAMEDTENSOR
+  // Out-of-place: returns a tensor whose dims are named `names`.
+  // Implemented by refine_names in ATen/native/NamedTensor.cpp.
+  Tensor refine_names(DimnameList names) const;
+  #endif
   Tensor abs() const;
   Tensor & abs_() const;
   Tensor acos() const;
diff --git a/aten/src/ATen/core/TensorMethods.h b/aten/src/ATen/core/TensorMethods.h
@@ -103,6 +103,16 @@ inline Tensor Tensor::align_to(DimnameList names) const {
 #endif
 }
 #endif
+#ifdef BUILD_NAMEDTENSOR
+// Method form of aten::refine_names; only compiled when BUILD_NAMEDTENSOR is defined.
+inline Tensor Tensor::refine_names(DimnameList names) const {
+#ifdef USE_STATIC_DISPATCH
+    // Static dispatch: call the TypeDefault implementation directly.
+    return TypeDefault::refine_names(const_cast<Tensor&>(*this), names);
+#else
+    // Dynamic dispatch: the op table is looked up once (function-local static),
+    // then the kernel is selected using this tensor's type_set().
+    static auto table = globalATenDispatch().getOpTable("aten::refine_names(Tensor(a) self, DimnameList names) -> Tensor(a)");
+    return table->getOp<Tensor (const Tensor &, DimnameList)>(type_set())(const_cast<Tensor&>(*this), names);
+#endif
+}
+#endif
 inline Tensor Tensor::abs() const {
 #ifdef USE_STATIC_DISPATCH
     return TypeDefault::abs(const_cast<Tensor&>(*this));
diff --git a/aten/src/ATen/native/NamedTensor.cpp b/aten/src/ATen/native/NamedTensor.cpp
@@ -89,6 +89,38 @@ static std::vector<int64_t> aligned_size(
   return expanded_sizes;
 }
 
+// Returns an alias of `self` whose dimensions are named `names` (out-of-place;
+// `self` keeps its current names).
+//
+// For each dimension, the requested name must be compatible with the existing one:
+// - a wildcard (unnamed) dim of `self` may be given any name;
+// - a dim that already has a name must keep exactly that name.
+//
+// Raises an error if `names` has a different number of entries than
+// `self.names()`, if `names` fails check_names_valid_for, or if any dimension
+// violates the compatibility rules above.
+Tensor refine_names(const Tensor& self, DimnameList names) {
+  const auto self_names = self.names();
+  TORCH_CHECK(self_names.size() == names.size(),
+      "refine_names: cannot coerce Tensor", self_names, " to Tensor", names,
+      " because they have a different number of dims (",
+      self_names.size(), " and ", names.size(), " respectively).");
+  check_names_valid_for(self, names);
+
+  for (size_t idx = 0; idx < self_names.size(); idx++) {
+    const auto& self_name = self_names[idx];
+    const auto& out_name = names[idx];
+    if (self_name == out_name || self_name.is_wildcard()) {
+      continue;
+    }
+    // From here on the pair is incompatible. Give the more specific diagnostic
+    // when the caller tried to replace an existing name with a wildcard.
+    TORCH_CHECK(!out_name.is_wildcard(),
+        "refine_names: cannot coerce Tensor", self_names, " to Tensor", names,
+        " because ", self_name, " is more specific than ", out_name, " at index ",
+        idx);
+    TORCH_CHECK(false,
+        "refine_names: cannot coerce Tensor", self_names, " to Tensor", names,
+        " because ", self_name, " is different from ", out_name, " at index ",
+        idx);
+  }
+
+  // Name the alias rather than `self` so the operation stays out-of-place.
+  auto result = self.alias();
+  internal_set_names_inplace(result, names);
+  return result;
+}
+
 // [Alignment rules]
 // Aligns `tensor` to names with the following rules:
 // 1) Check that tensor.names is a subsequence (not necessarily contiguous) of `names`.
diff --git a/aten/src/ATen/native/native_functions.yaml b/aten/src/ATen/native/native_functions.yaml
@@ -50,6 +50,10 @@
 - func: align_tensors(Tensor[] tensors) -> Tensor[]
   named_guard: False
 
+# Out-of-place naming of `self`'s dimensions; exposed as a Tensor method only.
+- func: refine_names(Tensor(a) self, DimnameList names) -> Tensor(a)
+  variants: method
+  named_guard: False
+
 - func: _cudnn_ctc_loss(Tensor log_probs, Tensor targets, int[] input_lengths, int[] target_lengths, int blank, bool deterministic, bool zero_infinity) -> (Tensor, Tensor)
   dispatch:
     CUDA: _cudnn_ctc_loss
diff --git a/test/test_namedtensor.py b/test/test_namedtensor.py
@@ -176,6 +176,42 @@ def test_has_names(self):
         self.assertTrue(partially_named.has_names())
         self.assertTrue(fully_named.has_names())
 
+    def test_refine_names(self):
+        # Unnamed tensor -> Named tensor
+        self._test_name_inference(Tensor.refine_names,
+                                  [create('None:1,None:2,None:3'), 'N', 'C', 'H'],
+                                  ['N', 'C', 'H'])
+
+        # Named tensor -> Named tensor (same names are accepted unchanged)
+        self._test_name_inference(Tensor.refine_names,
+                                  [create('N:1,C:2,H:3'), 'N', 'C', 'H'],
+                                  ['N', 'C', 'H'])
+
+        # Partially named tensor -> Partially named tensor (only the last dim gains a name)
+        self._test_name_inference(Tensor.refine_names,
+                                  [create('None:1,C:2,None:3'), None, 'C', 'H'],
+                                  [None, 'C', 'H'])
+
+        # Too many names (3 names for a 2-dim tensor)
+        self._test_name_inference(Tensor.refine_names,
+                                  [create('None:2,None:3'), 'N', 'C', 'H'],
+                                  maybe_raises_regex="different number of dims")
+
+        # Cannot change Tensor[D] to Tensor[N]
+        self._test_name_inference(Tensor.refine_names,
+                                  [create('D:3'), 'N'],
+                                  maybe_raises_regex="is different from")
+
+        # Cannot change Tensor[D] to Tensor[None]
+        self._test_name_inference(Tensor.refine_names,
+                                  [create('D:3'), None],
+                                  maybe_raises_regex="'D' is more specific than None")
+
+        # globbing behavior exists: '*' stands in for the tensor's leading names
+        self._test_name_inference(Tensor.refine_names,
+                                  [create('None:1,None:1,None:2,None:3'), '*', 'C', 'H'],
+                                  [None, None, 'C', 'H'])
+
     def test_repr(self):
         named_tensor = torch.zeros(2, 3).names_('N', 'C')
         expected = "tensor([[0., 0., 0.],\n        [0., 0., 0.]], names=('N', 'C'))"
diff --git a/test/test_torch.py b/test/test_torch.py
@@ -243,6 +243,7 @@ def test_namespace(ns, *skips):
                        'names_',  # BUILD_NAMEDTENSOR only
                        'has_names',  # BUILD_NAMEDTENSOR only
                        'rename',  # BUILD_NAMEDTENSOR only
+                       'refine_names',  # BUILD_NAMEDTENSOR only
                        )
         test_namespace(torch.nn)
         test_namespace(torch.nn.functional, 'assert_int_or_pair', 'feature_alpha_dropout')
diff --git a/torch/namedtensor.py b/torch/namedtensor.py
@@ -39,23 +39,26 @@ def _expand_single_glob(numel_pre_glob, numel_post_glob, names):
     return names[numel_pre_glob:len(names) - numel_post_glob]
 
 
+def _resolve_glob(names, tensor_names, fn_name):
+    glob_indices = [i for i, x in enumerate(names) if x == '*']
+    if len(glob_indices) >= 2:
+        raise RuntimeError('{}: More than one \'*\' found in names ('
+                           '{}). This function supports up to one \'*\'.'
+                           .format(fn_name, names))
+    if len(glob_indices) == 0:
+        return names
+    glob_idx = glob_indices[0]
+    globbed_names = _expand_single_glob(glob_idx, len(names) - glob_idx - 1, tensor_names)
+    return names[:glob_idx] + globbed_names + names[glob_idx + 1:]
+
+
 def _update_names_with_list(tensor, names, inplace):
     # Special case for tensor.renamed(None)
     if len(names) == 1 and names[0] is None:
         return tensor._update_names(None, inplace)
 
-    glob_indices = [i for i, x in enumerate(names) if x == '*']
-    if len(glob_indices) >= 2:
-        raise RuntimeError('{}: More than one \'*\' found in names ('
-                           '{}). This function supports up to one \'*\'.'
-                           .format(_namer_api_name(inplace), names))
-    elif len(glob_indices) == 1:
-        glob_idx = glob_indices[0]
-        globbed_names = _expand_single_glob(glob_idx, len(names) - glob_idx - 1, tensor.names)
-        return tensor._update_names(
-            names[:glob_idx] + globbed_names + names[glob_idx + 1:], inplace)
-    else:
-        return tensor._update_names(names, inplace)
+    # Expand at most one '*' against tensor.names via _resolve_glob (which raises
+    # RuntimeError on more than one '*'), then apply the resulting names.
+    return tensor._update_names(
+        _resolve_glob(names, tensor.names, _namer_api_name(inplace)), inplace)
 
 
 def _update_names_with_mapping(tensor, rename_map, inplace):
diff --git a/torch/tensor.py b/torch/tensor.py
@@ -1,7 +1,7 @@
 import sys
 import torch
 import torch._C as _C
-from torch.namedtensor import _update_names, _check_serializing_named_tensor
+from torch.namedtensor import _update_names, _check_serializing_named_tensor, _resolve_glob
 from collections import OrderedDict
 import torch.utils.hooks as hooks
 import warnings
@@ -481,6 +481,10 @@ def __cuda_array_interface__(self):
 
         return dict(typestr=typestr, shape=shape, strides=strides, data=data, version=1)
 
+    def refine_names(self, *names):
+        names = _resolve_glob(names, self.names, 'refine_names')
+        return super(Tensor, self).refine_names(names)
+
     def names_(self, *names, **rename_map):
         # Note [names_ / renamed API]
         # The Python API for these is different from the C++ API. In Python:

Original file line number	Diff line number	Diff line change
`@@ -243,6 +243,7 @@ def test_namespace(ns, *skips):`
`243`	`243`	`'names_', # BUILD_NAMEDTENSOR only`
`244`	`244`	`'has_names', # BUILD_NAMEDTENSOR only`
`245`	`245`	`'rename', # BUILD_NAMEDTENSOR only`
	`246`	`+ 'refine_names', # BUILD_NAMEDTENSOR only`
`246`	`247`	`)`
`247`	`248`	`test_namespace(torch.nn)`
`248`	`249`	`test_namespace(torch.nn.functional, 'assert_int_or_pair', 'feature_alpha_dropout')`