This repository was archived by the owner on Aug 30, 2024. It is now read-only.
File tree (Expand file tree / Collapse file tree): 2 files changed, +6 -4 lines changed
include/experimental/group/gemm/impl
tests/integration/gemv/int4
Expand file tree / Collapse file tree: 2 files changed, +6 -4 lines changed
Original file line number | Diff line number | Diff line change
@@ -286,7 +286,9 @@ class gemm_t<
286286 mem_desc_scale_t ,
287287 scale_tile_desc_t ,
288288 subgroup::msg_type_v<scale_tile_desc_t , mem_desc_scale_t >,
289- arch_tag>;
289+ (tile_size_x_b > 1 && arch_tag == gpu_arch::XeHpc) // TODO(Yi): PVC 2d WA
290+ ? gpu_arch::XeHpg
291+ : arch_tag>;
290292
291293 // compress int4 along N dimensions
292294 using zero_pt_tile_desc_t = subgroup::tile_desc_t <
Original file line number Diff line number Diff line change 1616
1717#include < utils/utils.hpp>
1818#include " xetla.hpp"
19- // #define UT_DEBUG
19+ #define UT_DEBUG
2020using namespace gpu ::xetla;
2121using namespace gpu ::xetla::group;
2222// The number of times the kernel is executed
@@ -35,9 +35,9 @@ class test_col_major_1 {
3535 static constexpr size_t mat_n = 4096 ;
3636 static constexpr size_t mat_k = 4096 ;
3737 static constexpr size_t wg_m = 64 ;
38- static constexpr size_t wg_n = 32 ;
38+ static constexpr size_t wg_n = 64 ;
3939 static constexpr size_t sg_m = 16 ;
40- static constexpr size_t sg_n = 8 ;
40+ static constexpr size_t sg_n = 16 ;
4141 static constexpr size_t sg_k = 32 ;
4242 static constexpr size_t dequant_s = 128 ;
4343 static constexpr quant_mode quant_mode = quant_mode::I4_SYM;
You can’t perform that action at this time.
0 commit comments