[SYCL] Change internal host vec representation (#13596)

steffenlarsen · web-flow · commit 5df262fd4af4 · 2024-04-30T16:20:45.000-07:00
This commit changes the internal representation of sycl::vec&lt;sycl::half,
N&gt; to use sycl::half directly instead of the wrapper implementation used
inside them. This avoids strict alias violation in the operator[] for
the host implementation.

Signed-off-by: Larsen, Steffen &lt;steffen.larsen@intel.com&gt;
diff --git a/sycl/include/sycl/half_type.hpp b/sycl/include/sycl/half_type.hpp
@@ -228,42 +228,48 @@ class half;
 
 // Several aliases are defined below:
 // - StorageT: actual representation of half data type. It is used by scalar
-//   half values and by 'sycl::vec' class. On device side, it points to some
-//   native half data type, while on host some custom data type is used to
-//   emulate operations of 16-bit floating-point values
+//   half values. On device side, it points to some native half data type, while
+//   on host some custom data type is used to emulate operations of 16-bit
+//   floating-point values
 //
 // - BIsRepresentationT: data type which is used by built-in functions. It is
 //   distinguished from StorageT, because on host, we can still operate on the
 //   wrapper itself and there is no sense in direct usage of underlying data
 //   type (too many changes required for BIs implementation without any
 //   foreseeable profits)
 //
-// - VecNStorageT - representation of N-element vector of halfs. Follows the
-//   same logic as StorageT
+// - VecElemT: representation of each element in the vector. On device it is
+//   the same as StorageT to carry a native vector representation, while on
+//   host it stores the sycl::half implementation directly.
+//
+// - VecNStorageT: representation of N-element vector of halfs. Follows the
+//   same logic as VecElemT.
 #ifdef __SYCL_DEVICE_ONLY__
 using StorageT = _Float16;
 using BIsRepresentationT = _Float16;
+using VecElemT = _Float16;
 
-using Vec2StorageT = StorageT __attribute__((ext_vector_type(2)));
-using Vec3StorageT = StorageT __attribute__((ext_vector_type(3)));
-using Vec4StorageT = StorageT __attribute__((ext_vector_type(4)));
-using Vec8StorageT = StorageT __attribute__((ext_vector_type(8)));
-using Vec16StorageT = StorageT __attribute__((ext_vector_type(16)));
+using Vec2StorageT = VecElemT __attribute__((ext_vector_type(2)));
+using Vec3StorageT = VecElemT __attribute__((ext_vector_type(3)));
+using Vec4StorageT = VecElemT __attribute__((ext_vector_type(4)));
+using Vec8StorageT = VecElemT __attribute__((ext_vector_type(8)));
+using Vec16StorageT = VecElemT __attribute__((ext_vector_type(16)));
 #else // SYCL_DEVICE_ONLY
 using StorageT = detail::host_half_impl::half;
 // No need to extract underlying data type for built-in functions operating on
 // host
 using BIsRepresentationT = half;
+using VecElemT = half;
 
 // On the host side we cannot use OpenCL cl_half# types as an underlying type
 // for vec because they are actually defined as an integer type under the
 // hood. As a result half values will be converted to the integer and passed
 // as a kernel argument which is expected to be floating point number.
-using Vec2StorageT = std::array<StorageT, 2>;
-using Vec3StorageT = std::array<StorageT, 3>;
-using Vec4StorageT = std::array<StorageT, 4>;
-using Vec8StorageT = std::array<StorageT, 8>;
-using Vec16StorageT = std::array<StorageT, 16>;
+using Vec2StorageT = std::array<VecElemT, 2>;
+using Vec3StorageT = std::array<VecElemT, 3>;
+using Vec4StorageT = std::array<VecElemT, 4>;
+using Vec8StorageT = std::array<VecElemT, 8>;
+using Vec16StorageT = std::array<VecElemT, 16>;
 #endif // SYCL_DEVICE_ONLY
 
 #ifndef __SYCL_DEVICE_ONLY__
diff --git a/sycl/include/sycl/vector.hpp b/sycl/include/sycl/vector.hpp
@@ -300,9 +300,9 @@ struct VecStorage<
 
 // Single element half
 template <> struct VecStorage<half, 1, void> {
-  using DataType = sycl::detail::half_impl::StorageT;
+  using DataType = sycl::detail::half_impl::VecElemT;
 #ifdef __SYCL_DEVICE_ONLY__
-  using VectorDataType = sycl::detail::half_impl::StorageT;
+  using VectorDataType = sycl::detail::half_impl::VecElemT;
 #endif // __SYCL_DEVICE_ONLY__
 };
 
@@ -365,10 +365,12 @@ template <typename Type, int NumElements> class vec {
   // in the class, so vec<float, 16> should be equal to float16 in memory.
   using DataType = typename detail::VecStorage<DataT, NumElements>::DataType;
 
+#ifdef __SYCL_DEVICE_ONLY__
+  static constexpr bool IsHostHalf = false;
+#else
   static constexpr bool IsHostHalf =
-      std::is_same_v<DataT, sycl::detail::half_impl::half> &&
-      std::is_same_v<sycl::detail::half_impl::StorageT,
-                     sycl::detail::host_half_impl::half>;
+      std::is_same_v<DataT, sycl::detail::half_impl::half>;
+#endif
 
   static constexpr bool IsBfloat16 =
       std::is_same_v<DataT, sycl::ext::oneapi::bfloat16>;