From 36578f01a829cf676820ffe6251e65e65d734374 Mon Sep 17 00:00:00 2001
From: Xiuchuan Zhai
Date: Wed, 30 Oct 2024 23:17:54 -0400
Subject: [PATCH] remove extra or redundant Convert in FP16

- remove Convert for ReadValue node
---
 .../src/transformations/transformation_pipeline.cpp | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/src/plugins/intel_cpu/src/transformations/transformation_pipeline.cpp b/src/plugins/intel_cpu/src/transformations/transformation_pipeline.cpp
index 9dd1da2d471e5a..caa29cb8566ae0 100644
--- a/src/plugins/intel_cpu/src/transformations/transformation_pipeline.cpp
+++ b/src/plugins/intel_cpu/src/transformations/transformation_pipeline.cpp
@@ -408,12 +408,15 @@ void Transformations::PreLpt(const std::vector<ov::element::Type>& defaultPrecis
         type_to_fuse_map fuse_map = {{ov::op::PagedAttentionExtension::get_type_info_static(), fuse_type_to_pa}};
 #endif
         const bool keep_precision_sensitive_in_fp32 = true;
+        const bool need_convert_input_output_precision = false;
+        const bool save_original_precision_attribute = true;
         CPU_REGISTER_PASS_COMMON(manager,
                                  ov::pass::ConvertPrecision,
                                  fp_convert_precision_map,
                                  fuse_map,
                                  keep_precision_sensitive_in_fp32,
-                                 false);
+                                 need_convert_input_output_precision,
+                                 save_original_precision_attribute);
     }
     CPU_REGISTER_PASS_COMMON(manager, ov::pass::KeepConstAndDecompression);
     CPU_SET_CALLBACK_COMMON(manager,