@@ -86,7 +86,7 @@ struct fused_config_t {
8686 {start_x_b, start_y_b}); \
8787 gemm_args.init(mem_desc_a, mem_desc_b, inner_loop_count_##id); \
8888 op (g, matAcc_##acc_id, gemm_args); \
89- SW_BARRIER ();
89+ sw_barrier ();
9090
9191#define MATC_STORE (ptr_c ) \
9292 mem_desc_c.init( \
@@ -229,7 +229,7 @@ struct gru_layer {
229229 int start_n = (j)*wg_tile_n;
230230 CONFIG_SETTING (batch_size, -1 , hidden_size);
231231 matAcc_0.init (0 );
232- SW_BARRIER ();
232+ sw_barrier ();
233233
234234 // calculate reset gate: r_t = \sigmoid(X_t x W_ir + h_{t - 1} x W_hr)
235235 // acc0 = X_t x W_ir
@@ -278,19 +278,19 @@ struct gru_layer {
278278 matAcc_0.reg = matAcc_0.reg * (1 - matAcc_1.reg ) +
279279 matAcc_1.reg *
280280 xetla_cvt<Act_T, T, matAcc_t::tile_elems>(mat_hidden.reg );
281- SW_BARRIER ();
281+ sw_barrier ();
282282
283283 if (seq_id == seq_len - 1 ) {
284284 MATC_STORE (args->layer_output );
285- SW_BARRIER ();
285+ sw_barrier ();
286286 __esimd_barrier ();
287287 }
288288 MATC_STORE (args->cell_out_ptr + seq_id * io_size);
289- SW_BARRIER ();
289+ sw_barrier ();
290290 __esimd_barrier ();
291291
292292 MATC_STORE (args->one_cell_ptr + (seq_id % 2 ) * io_size);
293- SW_BARRIER ();
293+ sw_barrier ();
294294 __esimd_barrier ();
295295 }
296296 args->hx_ptr = args->one_cell_ptr + (seq_id % 2 ) * io_size;
@@ -386,7 +386,7 @@ struct kernel_xcoder_gru_fusion {
386386 args.W_hz_ptr = (W_hz_ptr);
387387 args.W_in_ptr = (W_in_ptr);
388388 args.W_hn_ptr = (W_hn_ptr);
389- SW_BARRIER ();
389+ sw_barrier ();
390390 fused_op::call (item, &args);
391391 ping = (ping + 1 ) % 2 ;
392392 pong = (pong + 1 ) % 2 ;
@@ -411,7 +411,7 @@ struct kernel_xcoder_gru_fusion {
411411 ? hidden_out_ptr
412412 : (ping_pong_buffer + ping * one_layer_size);
413413 args.layer_ptr = ((ping_pong_buffer + pong * one_layer_size));
414- SW_BARRIER ();
414+ sw_barrier ();
415415 fused_op::call (item, &args);
416416 ping = (ping + 1 ) % 2 ;
417417 pong = (pong + 1 ) % 2 ;
0 commit comments