Fix strict aliasing rule violation in bitwise_binary_op (#66194) (#69619)

author Eli Uriegas <1700823+seemethere@users.noreply.github.com>

Wed, 8 Dec 2021 23:01:18 +0000 (15:01 -0800)

committer GitHub <noreply@github.com>

Wed, 8 Dec 2021 23:01:18 +0000 (15:01 -0800)
author Eli Uriegas <1700823+seemethere@users.noreply.github.com>
Wed, 8 Dec 2021 23:01:18 +0000 (15:01 -0800)
committer GitHub <noreply@github.com>
Wed, 8 Dec 2021 23:01:18 +0000 (15:01 -0800)
diff --git a/aten/src/ATen/cpu/vec/vec_base.h b/aten/src/ATen/cpu/vec/vec_base.h

index da5f318..8761d90 100644 (file)
--- a/aten/src/ATen/cpu/vec/vec_base.h
+++ b/aten/src/ATen/cpu/vec/vec_base.h
@@ -146,6 +146,10 @@ public:
    inline operator T*() {
      return values;
    }
+  // Return the values as char* for type punning
+  auto as_bytes() const -> const char* {
+    return reinterpret_cast<const char*>(values);
+  }
    template <int64_t mask_>
    static Vectorized<T> blend(const Vectorized<T>& a, const Vectorized<T>& b) {
      int64_t mask = mask_;
@@ -735,15 +739,33 @@ inline Vectorized<T> operator^(const Vectorized<T>& a, const Vectorized<T>& b) {
  
  #else
  
+template <typename T>
+auto load(char const* data) -> T {
+  T ret;
+  std::memcpy(&ret, data, sizeof(ret));
+  return ret;
+}
+
  template<class T, typename Op>
  static inline Vectorized<T> bitwise_binary_op(const Vectorized<T> &a, const Vectorized<T> &b, Op op) {
    static constexpr uint32_t element_no = VECTOR_WIDTH / sizeof(intmax_t);
    __at_align__ intmax_t buffer[element_no];
-  const intmax_t *a_ptr = reinterpret_cast<const intmax_t*>((const T*) a);
-  const intmax_t *b_ptr = reinterpret_cast<const intmax_t*>((const T*) b);
-  for (uint32_t i = 0U; i < element_no; ++ i) {
-    buffer[i] = op(a_ptr[i], b_ptr[i]);
-  }
+  static_assert(VECTOR_WIDTH % sizeof(intmax_t) == 0, "VECTOR_WIDTH not a multiple of sizeof(intmax_t)");
+  static_assert(sizeof(buffer) == sizeof(Vectorized<T>), "sizeof(buffer) must match sizeof(Vectorized<T>)");
+  // We should be using memcpy in order to respect the strict aliasing rule
+  // see: https://github.com/pytorch/pytorch/issues/66119
+  // Using char* is defined in the C11 standard 6.5 Expression paragraph 7
+  // (http://www.open-std.org/jtc1/sc22/wg14/www/docs/n1570.pdf)
+  const auto* a_data = a.as_bytes();
+  const auto* b_data = b.as_bytes();
+  // load each intmax_t chunk and process; increase pointers by sizeof(intmax_t)
+  for (auto& out : buffer) {
+    out = op(load<intmax_t>(a_data), load<intmax_t>(b_data));
+    a_data += sizeof(intmax_t);
+    b_data += sizeof(intmax_t);
+  }
+  assert(a_data == a.as_bytes() + sizeof(a));
+  assert(b_data == b.as_bytes() + sizeof(b));
    return Vectorized<T>::loadu(buffer);
  }
author	Eli Uriegas <1700823+seemethere@users.noreply.github.com>
	Wed, 8 Dec 2021 23:01:18 +0000 (15:01 -0800)
committer	GitHub <noreply@github.com>
	Wed, 8 Dec 2021 23:01:18 +0000 (15:01 -0800)