Skip to content

Commit

Permalink
cpu: aarch64: Re-enable ACL indirect conv for BF16
Browse files (browse the repository at this point in the history)
  • Loading branch information
fadara01 authored and Radu2k committed Dec 2, 2024
1 parent 373bc5b commit 0de7263
Showing 1 changed file with 3 additions and 1 deletion.
4 changes: 3 additions & 1 deletion src/cpu/aarch64/acl_indirect_gemm_convolution.cpp
Original file line number | Diff line number | Diff line change
Expand Up @@ -96,11 +96,13 @@ status_t acl_indirect_gemm_convolution_fwd_t::pd_t::init(engine_t *engine) {

  const bool is_fp16_ok = expect_data_types(f16, f16, f16, f16, undef)
  && attr()->has_default_values(smask_t::post_ops, f16);
+ const bool is_bf16_ok = expect_data_types(bf16, bf16, bf16, bf16, undef)
+ && attr_.post_ops_.len() == 0;
  const bool is_fp32_ok = expect_data_types(f32, f32, f32, f32, undef)
  && attr()->has_default_values(
  smask_t::post_ops | smask_t::fpmath_mode, f32);
  bool ok = is_fwd() && set_default_alg_kind(alg_kind::convolution_direct)
- && utils::one_of(true, is_fp16_ok, is_fp32_ok)
+ && utils::one_of(true, is_fp16_ok, is_bf16_ok, is_fp32_ok)
  && !has_zero_dim_memory();
  if (!ok) return status::unimplemented;

Expand Down

0 comments on commit 0de7263

Please sign in to comment.