Skip to content

Commit

Permalink
Fix SDPA fusion failure in the f16 case
Browse files Browse the repository at this point in the history
  • Loading branch information
xczhai committed Sep 24, 2024
1 parent 1e9768b commit 2643652
Showing 1 changed file with 3 additions and 1 deletion.
Original file line number | Diff line number | Diff line change
Expand Up @@ -389,16 +389,18 @@ void Transformations::PreLpt(const std::vector<ov::element::Type>& defaultPrecis
precisions_map fp_convert_precision_map = {{ov::element::f32, ov::element::f16}};
#if defined(OPENVINO_ARCH_ARM) || defined(OPENVINO_ARCH_ARM64)
type_to_fuse_map fuse_map = {{ov::opset1::FakeQuantize::get_type_info_static(), fuse_type_to_fq}};
constexpr bool cvt_input_output_precision = true;
#else
type_to_fuse_map fuse_map = {};
constexpr bool cvt_input_output_precision = false;
#endif
const bool keep_precision_sensitive_in_fp32 = true;
CPU_REGISTER_PASS_COMMON(manager,
ov::pass::ConvertPrecision,
fp_convert_precision_map,
fuse_map,
keep_precision_sensitive_in_fp32,
false);
cvt_input_output_precision);
}
CPU_REGISTER_PASS_COMMON(manager, ov::pass::KeepConstAndDecompression);
CPU_SET_CALLBACK_COMMON(manager,
Expand Down

0 comments on commit 2643652

Please sign in to comment.