Skip to content
This repository was archived by the owner on Aug 30, 2024. It is now read-only.

Commit 36f736c

Browse files
Sync ipex(modify prefetch) (#320)
* fix block_load elems(drop 10%) * u1 __SYCL_DEPRECATED("u1 is reserved/unsupported") = 1, // unsigned 1 bit s1 __SYCL_DEPRECATED("s1 is reserved/unsupported") = 2, // signed 1 bit * save * update prefetch gather and scatter 2024.2 * update atomic * fix comilpe on 2024.1 * conflict * sync_ipex(update prefetch) * clang format * sync ipex 69258612b * unused var
1 parent 5d86a6b commit 36f736c

File tree

21 files changed

+776
-509
lines changed

21 files changed

+776
-509
lines changed

include/common/core/common.hpp

Lines changed: 16 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -227,16 +227,22 @@ enum class atomic_op : uint8_t {
227227

228228
/// xetla dpas argument typ
229229
enum class argument_type : uint8_t {
230-
U1 = 0, // unsigned 1 bit
231-
S1 = 1, // signed 1 bit
232-
U2 = 2, // unsigned 2 bits
233-
S2 = 3, // signed 2 bits
234-
U4 = 4, // unsigned 4 bits
235-
S4 = 5, // signed 4 bits
236-
U8 = 6, // unsigned 8 bits
237-
S8 = 7, // signed 8 bits
238-
BF16 = 8, // bfloat 16
239-
FP16 = 9, // half float
230+
Invalid = 0,
231+
#if __INTEL_LLVM_COMPILER >= 20240200
232+
U1 __SYCL_DEPRECATED("u1 is reserved/unsupported") = 1, // unsigned 1 bit
233+
S1 __SYCL_DEPRECATED("s1 is reserved/unsupported") = 2, // signed 1 bit
234+
#else
235+
U1 = 1, // unsigned 1 bit
236+
S1 = 2, // signed 1 bit
237+
#endif
238+
U2 = 3, // unsigned 2 bits
239+
S2 = 4, // signed 2 bits
240+
U4 = 5, // unsigned 4 bits
241+
S4 = 6, // signed 4 bits
242+
U8 = 7, // unsigned 8 bits
243+
S8 = 8, // signed 8 bits
244+
BF16 = 9, // bfloat 16
245+
FP16 = 10, // half float
240246
TF32 = 12, // tensorfloat 32
241247
DF = 13, // double (64bits)
242248
NUM_ARG_TYPES = 14

include/common/core/math_mma.hpp

Lines changed: 16 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -33,7 +33,11 @@ namespace detail {
3333
///
3434
template <typename dtype>
3535
constexpr gpu::xetla::argument_type mma_argument_type() {
36+
#if __INTEL_LLVM_COMPILER < 20240200
3637
return gpu::xetla::argument_type::U1;
38+
#else
39+
return gpu::xetla::argument_type::U2;
40+
#endif
3741
}
3842

3943
template <>
@@ -72,7 +76,11 @@ constexpr gpu::xetla::argument_type mma_argument_type<fp16>() {
7276
template <gpu::xetla::argument_type arg_type>
7377
constexpr __ESIMD_NS::xmx::dpas_argument_type get_argument_type() {
7478
static_assert(
75-
arg_type == gpu::xetla::argument_type::U2 ||
79+
#if __INTEL_LLVM_COMPILER < 20240200
80+
arg_type == gpu::xetla::argument_type::U1 ||
81+
arg_type == gpu::xetla::argument_type::S1 ||
82+
#endif
83+
arg_type == gpu::xetla::argument_type::U2 ||
7684
arg_type == gpu::xetla::argument_type::S2 ||
7785
arg_type == gpu::xetla::argument_type::U4 ||
7886
arg_type == gpu::xetla::argument_type::S4 ||
@@ -82,7 +90,14 @@ constexpr __ESIMD_NS::xmx::dpas_argument_type get_argument_type() {
8290
arg_type == gpu::xetla::argument_type::BF16 ||
8391
arg_type == gpu::xetla::argument_type::TF32,
8492
"Unsupported argument type");
93+
8594
switch (arg_type) {
95+
#if __INTEL_LLVM_COMPILER < 20240200
96+
case gpu::xetla::argument_type::U1:
97+
return __ESIMD_NS::xmx::dpas_argument_type::u1;
98+
case gpu::xetla::argument_type::S1:
99+
return __ESIMD_NS::xmx::dpas_argument_type::s1;
100+
#endif
86101
case gpu::xetla::argument_type::U2:
87102
return __ESIMD_NS::xmx::dpas_argument_type::u2;
88103
case gpu::xetla::argument_type::S2:

0 commit comments

Comments
 (0)