Skip to content

Commit

Permalink
cpu : aarch64 : reorder : zp correction for 4d shapes (#2224)
Browse files Browse the repository at this point in the history
  • Loading branch information
Shreyas-fuj authored and mgouicem committed Dec 4, 2024
1 parent 12bafbe commit 836ea10
Show file tree
Hide file tree
Showing 2 changed files with 10 additions and 1 deletion.
2 changes: 1 addition & 1 deletion src/cpu/aarch64/jit_uni_reorder.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -781,7 +781,7 @@ struct jit_uni_reorder_kernel_f32_t : public kernel_t, public jit_generator {
// transposition on the fly
const bool fast_return = prb_.src_scale_type != scale_type_t::MANY
&& prb_.dst_scale_type != scale_type_t::MANY
- && prb_.beta == 0.f;
+ && prb_.beta == 0.f && !prb_.req_src_zp && !prb_.req_dst_zp;
if (fast_return) {
if (prb_.src_scale_type == scale_type_t::COMMON)
for (int ur = 0; ur < reg_unroll; ur += load_step)
Expand Down
9 changes: 9 additions & 0 deletions tests/benchdnn/inputs/reorder/test_reorder_ci
Original file line number Diff line number Diff line change
Expand Up @@ -12,6 +12,15 @@
--oflag=
2x16x3x4 1x17x5x3 30x1

+ --reset
+
+ # 4d reorders
+ --sdt=s8,u8
+ --ddt=f32
+ --attr-zero-points=src:common:-1
+ --stag=adbc
+ 1x12x128x33
+
--reset
# compensation reorders without groups
--sdt=f32,s8,bf16
Expand Down

0 comments on commit 836ea10

Please sign in to comment.