Skip to content

Commit d6cbecb

Browse files
swolchok and facebook-github-bot
authored and committed
[PyTorch] Reapply D27404164: Devirtualize is_contiguous (pytorch#55333)
Summary: Pull Request resolved: pytorch#55333 Reapplying without using enum class in a bitfield. See new comments about gcc bug. ghstack-source-id: 125776904 Test Plan: Carefully review OSS test failure logs this time Reviewed By: kimishpatel, bhosmer Differential Revision: D27576623 fbshipit-source-id: 68fb00e5ff5215e56c8b9bc02717e1e7b2fedf9b
1 parent e359842 commit d6cbecb

9 files changed

+83
-32
lines changed

Diff for: aten/src/ATen/BatchedTensorImpl.cpp

+2-1
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,7 @@ BatchedTensorImpl::BatchedTensorImpl(Tensor value, BatchDims bdims)
1616
{
1717
TORCH_INTERNAL_ASSERT(value_.defined());
1818
set_storage_access_should_throw();
19+
set_has_contiguity_policy(HasContiguityPolicy::CustomBehavior);
1920
checkInvariants();
2021

2122
const auto public_dims = value_.dim() - bdims_.size();
@@ -74,7 +75,7 @@ void BatchedTensorImpl::checkInvariants() const {
7475
}
7576

7677
// The following are publically exposed as methods of Tensor
77-
bool BatchedTensorImpl::is_contiguous(at::MemoryFormat memory_format) const {
78+
bool BatchedTensorImpl::is_contiguous_custom(at::MemoryFormat memory_format) const {
7879
TORCH_CHECK(memory_format == MemoryFormat::Contiguous,
7980
"NYI: querying is_contiguous inside of vmap for memory_format ",
8081
"other than torch.contiguous_format");

Diff for: aten/src/ATen/BatchedTensorImpl.h

+1-1
Original file line numberDiff line numberDiff line change
@@ -73,7 +73,7 @@ struct TORCH_API BatchedTensorImpl : public c10::TensorImpl {
7373
int64_t actualDim(int64_t dim, bool wrap_dim = true) const;
7474

7575
// Override a bunch of methods inherited from TensorImpl to return error messages.
76-
bool is_contiguous(at::MemoryFormat memory_format=at::MemoryFormat::Contiguous) const override;
76+
bool is_contiguous_custom(at::MemoryFormat memory_format) const override;
7777
void set_size(int64_t dim, int64_t new_size) override;
7878
void set_stride(int64_t dim, int64_t new_stride) override;
7979
void set_storage_offset(int64_t storage_offset) override;

Diff for: aten/src/ATen/OpaqueTensorImpl.h

+1-6
Original file line numberDiff line numberDiff line change
@@ -29,6 +29,7 @@ struct TORCH_API OpaqueTensorImpl : public TensorImpl {
2929
: TensorImpl(key_set, data_type, device),
3030
opaque_handle_(std::move(opaque_handle)) {
3131
set_storage_access_should_throw();
32+
set_has_contiguity_policy(HasContiguityPolicy::ContiguityNotSupported);
3233
sizes_and_strides_.set_sizes(sizes);
3334
refresh_numel();
3435
is_non_overlapping_and_dense_ = is_non_overlapping_and_dense;
@@ -43,12 +44,6 @@ struct TORCH_API OpaqueTensorImpl : public TensorImpl {
4344
AT_ERROR("opaque tensors do not have strides");
4445
}
4546

46-
bool is_contiguous(
47-
c10::MemoryFormat memory_format =
48-
c10::MemoryFormat::Contiguous) const override {
49-
AT_ERROR("opaque tensors do not have is_contiguous");
50-
}
51-
5247
int64_t stride(int64_t d) const override {
5348
AT_ERROR("opaque tensors do not have strides");
5449
}

Diff for: aten/src/ATen/SparseTensorImpl.cpp

+1-3
Original file line numberDiff line numberDiff line change
@@ -51,6 +51,7 @@ SparseTensorImpl::SparseTensorImpl(at::DispatchKeySet key_set, const caffe2::Typ
5151

5252
is_non_overlapping_and_dense_ = false;
5353
set_storage_access_should_throw();
54+
set_has_contiguity_policy(HasContiguityPolicy::ContiguityNotSupported);
5455
}
5556

5657
void SparseTensorImpl::release_resources() {
@@ -62,9 +63,6 @@ void SparseTensorImpl::release_resources() {
6263
IntArrayRef SparseTensorImpl::strides() const {
6364
AT_ERROR("sparse tensors do not have strides");
6465
}
65-
bool SparseTensorImpl::is_contiguous(at::MemoryFormat memory_format) const {
66-
AT_ERROR("sparse tensors do not have is_contiguous");
67-
}
6866
int64_t SparseTensorImpl::stride(int64_t d) const {
6967
AT_ERROR("sparse tensors do not have strides");
7068
}

Diff for: aten/src/ATen/SparseTensorImpl.h

-1
Original file line numberDiff line numberDiff line change
@@ -43,7 +43,6 @@ struct TORCH_API SparseTensorImpl : public TensorImpl {
4343
Tensor values() const { return values_; }
4444

4545
IntArrayRef strides() const override;
46-
bool is_contiguous(at::MemoryFormat memory_format=at::MemoryFormat::Contiguous) const override;
4746
int64_t stride(int64_t d) const override;
4847
void set_size(int64_t dim, int64_t new_size) override;
4948
void set_stride(int64_t dim, int64_t new_stride) override;

Diff for: aten/src/ATen/native/metal/MetalTensorImpl.h

+4-4
Original file line numberDiff line numberDiff line change
@@ -22,15 +22,15 @@ struct TORCH_API MetalTensorImpl : public OpaqueTensorImpl<OpaqueHandle> {
2222
device,
2323
opaque_handle,
2424
sizes),
25-
strides_(strides.vec()) {}
25+
strides_(strides.vec()) {
26+
TensorImpl::set_has_contiguity_policy(TensorImpl::HasContiguityPolicy::CustomBehavior);
27+
}
2628

2729
IntArrayRef strides() const override {
2830
return strides_;
2931
}
3032

31-
bool is_contiguous(
32-
c10::MemoryFormat memory_format =
33-
c10::MemoryFormat::Contiguous) const override {
33+
bool is_contiguous_custom(c10::MemoryFormat memory_format) const override {
3434
return true;
3535
}
3636

Diff for: aten/src/ATen/native/vulkan/VulkanOpaqueTensorImpl.h

+4-4
Original file line numberDiff line numberDiff line change
@@ -23,15 +23,15 @@ struct VulkanOpaqueTensorImpl : public OpaqueTensorImpl<OpaqueHandle> {
2323
opaque_handle,
2424
sizes,
2525
false),
26-
strides_(strides.vec()) {}
26+
strides_(strides.vec()) {
27+
TensorImpl::set_has_contiguity_policy(TensorImpl::HasContiguityPolicy::CustomBehavior);
28+
}
2729

2830
IntArrayRef strides() const override {
2931
return strides_;
3032
}
3133

32-
bool is_contiguous(
33-
c10::MemoryFormat memory_format =
34-
c10::MemoryFormat::Contiguous) const override {
34+
bool is_contiguous_custom(c10::MemoryFormat memory_format) const override {
3535
return true;
3636
}
3737

Diff for: c10/core/TensorImpl.cpp

+16-10
Original file line numberDiff line numberDiff line change
@@ -276,17 +276,22 @@ void TensorImpl::throw_storage_access_error() const {
276276
TORCH_CHECK_NOT_IMPLEMENTED(false, "Cannot access storage of ", tensorimpl_type_name());
277277
}
278278

279-
bool TensorImpl::is_contiguous(at::MemoryFormat memory_format) const {
280-
#ifdef DEBUG
281-
AT_ASSERT(compute_contiguous() == is_contiguous_);
282-
#endif
283-
if (memory_format == at::MemoryFormat::ChannelsLast) {
284-
return is_channels_last_contiguous_;
285-
}
286-
else if (memory_format == at::MemoryFormat::ChannelsLast3d) {
287-
return is_channels_last_3d_contiguous_;
279+
bool TensorImpl::is_contiguous_nondefault_policy_impl(at::MemoryFormat memory_format) const {
280+
if (has_contiguity_ == static_cast<uint8_t>(HasContiguityPolicy::ContiguityNotSupported)) {
281+
TORCH_CHECK_NOT_IMPLEMENTED(
282+
false, "Tensors of type ", tensorimpl_type_name(),
283+
" do not have is_contiguous");
284+
} else {
285+
TORCH_INTERNAL_ASSERT_DEBUG_ONLY(has_contiguity_ == static_cast<uint8_t>(HasContiguityPolicy::CustomBehavior));
286+
return is_contiguous_custom(memory_format);
288287
}
289-
return is_contiguous_;
288+
}
289+
290+
bool TensorImpl::is_contiguous_custom(at::MemoryFormat memory_format) const {
291+
TORCH_INTERNAL_ASSERT(
292+
false,
293+
"TensorImpl::is_contiguous_custom should never be called; did you "
294+
"set_has_contiguity_policy and forget to override is_contiguous_custom?");
290295
}
291296

292297
static void deletePlacementDeleteContext(void* ptr) {
@@ -381,6 +386,7 @@ void TensorImpl::copy_tensor_metadata_except_version_counter(
381386
dest_impl->device_opt_ = src_impl->device_opt_;
382387
dest_impl->key_set_ = src_impl->key_set_;
383388
dest_impl->is_contiguous_ = src_impl->is_contiguous_;
389+
dest_impl->has_contiguity_ = src_impl->has_contiguity_;
384390
dest_impl->is_channels_last_contiguous_ = src_impl->is_channels_last_contiguous_;
385391
dest_impl->is_channels_last_3d_contiguous_ = src_impl->is_channels_last_3d_contiguous_;
386392
dest_impl->is_channels_last_ = src_impl->is_channels_last_;

Diff for: c10/core/TensorImpl.h

+54-2
Original file line numberDiff line numberDiff line change
@@ -483,9 +483,37 @@ struct C10_API TensorImpl : public c10::intrusive_ptr_target {
483483
* Tensors with non-trivial strides are not contiguous. See
484484
* compute_contiguous() for the exact definition of whether or not
485485
* a tensor is contiguous or not.
486+
*
487+
* NOTE: is_contiguous is only `TENSORIMPL_MAYBE_VIRTUAL` for
488+
* backward compatibility. See `set_has_contiguity_policy` and
489+
* `is_contiguous_custom` for the encouraged customization point.
486490
*/
487-
virtual bool is_contiguous(at::MemoryFormat memory_format=at::MemoryFormat::Contiguous) const;
491+
TENSORIMPL_MAYBE_VIRTUAL bool is_contiguous(at::MemoryFormat memory_format=at::MemoryFormat::Contiguous) const {
492+
if (C10_UNLIKELY(has_contiguity_ != static_cast<uint8_t>(HasContiguityPolicy::Default))) {
493+
return is_contiguous_nondefault_policy_impl(memory_format);
494+
}
495+
TORCH_INTERNAL_ASSERT_DEBUG_ONLY(compute_contiguous() == is_contiguous_);
496+
if (memory_format == at::MemoryFormat::ChannelsLast) {
497+
return is_channels_last_contiguous_;
498+
}
499+
else if (memory_format == at::MemoryFormat::ChannelsLast3d) {
500+
return is_channels_last_3d_contiguous_;
501+
}
502+
return is_contiguous_;
503+
}
488504

505+
private:
506+
bool is_contiguous_nondefault_policy_impl(at::MemoryFormat) const;
507+
508+
protected:
509+
/**
510+
* Customization point for is_contiguous; must also
511+
* set_has_contiguity_policy(HasContiguityPolicy::Custom) for this
512+
* to be called.
513+
*/
514+
virtual bool is_contiguous_custom(at::MemoryFormat memory_format) const;
515+
516+
public:
489517
bool is_sparse() const {
490518
// NB: This method is not virtual and avoid dispatches for performance reasons.
491519
return key_set_.has(DispatchKey::SparseCPU) ||
@@ -1725,6 +1753,24 @@ struct C10_API TensorImpl : public c10::intrusive_ptr_target {
17251753
}
17261754

17271755
protected:
1756+
// Policy for adjusting the behavior of is_contiguous(). Allows
1757+
// subclass customization while still being able to inline
1758+
// is_contiguous() in the common case.
1759+
enum class HasContiguityPolicy : uint8_t {
1760+
// Default behavior: check is_contiguous_ and similar bitflags.
1761+
Default,
1762+
// Throw a generic error message that this tensor type does not
1763+
// support is_contiguous.
1764+
ContiguityNotSupported,
1765+
// Call virtual is_contiguous_custom method to implement custom
1766+
// is_contiguous behavior.
1767+
CustomBehavior,
1768+
};
1769+
1770+
void set_has_contiguity_policy(HasContiguityPolicy p) {
1771+
has_contiguity_ = static_cast<uint8_t>(p);
1772+
}
1773+
17281774
Storage storage_;
17291775

17301776
private:
@@ -1801,13 +1847,19 @@ struct C10_API TensorImpl : public c10::intrusive_ptr_target {
18011847
c10::optional<c10::Device> device_opt_;
18021848

18031849
// Tensor is contiguous
1804-
bool is_contiguous_ = true;
1850+
bool is_contiguous_ : 1;
1851+
// gcc doesn't like enum class bitfields; see
1852+
// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=61414
1853+
/* HasContiguityPolicy */ uint8_t has_contiguity_ : 2;
18051854

18061855
// Tensor is a subclass that does not permit storage access.
18071856
bool storage_access_should_throw_ = false;
18081857

18091858
// default member initializers for bit-fields only available with -std=c++2a or -std=gnu++2a
18101859
inline void init_bitfields() {
1860+
is_contiguous_ = true;
1861+
has_contiguity_ = static_cast<uint8_t>(HasContiguityPolicy::Default);
1862+
18111863
is_channels_last_ = false;
18121864
is_channels_last_contiguous_ = false;
18131865
is_channels_last_3d_ = false;

0 commit comments

Comments
 (0)