diff --git a/src/graph/backend/dnnl/kernels/sdp_primitive.cpp b/src/graph/backend/dnnl/kernels/sdp_primitive.cpp index fc4fb533ca8..f98d9bbedc9 100644 --- a/src/graph/backend/dnnl/kernels/sdp_primitive.cpp +++ b/src/graph/backend/dnnl/kernels/sdp_primitive.cpp @@ -74,6 +74,10 @@ status_t sdp_primitive_kernel_t::compile_impl( BACKEND_DNNL_ADD_PASS(pipeline, convert_to_runtime_src_zero_points); BACKEND_DNNL_ADD_PASS(pipeline, fuse_src_zero_points); BACKEND_DNNL_ADD_PASS(pipeline, insert_runtime_u8_to_s8_for_matmul); + BACKEND_DNNL_ADD_PASS(pipeline, convert_to_runtime_dst_scales); + BACKEND_DNNL_ADD_PASS(pipeline, fuse_dst_scales); + BACKEND_DNNL_ADD_PASS(pipeline, convert_to_runtime_dst_zero_points); + BACKEND_DNNL_ADD_PASS(pipeline, fuse_dst_zero_points); } BACKEND_DNNL_ADD_PASS(pipeline, binary_canonicalization); BACKEND_DNNL_ADD_PASS(pipeline, insert_permute_for_matmul); @@ -83,6 +87,7 @@ status_t sdp_primitive_kernel_t::compile_impl( pipeline.reset_visualize_arg(true, false); BACKEND_DNNL_ADD_PASS(pipeline, infer_shape); + BACKEND_DNNL_ADD_PASS(pipeline, fuse_src_transpose_to_matmul); BACKEND_DNNL_ADD_PASS(pipeline, fuse_dst_transpose_to_matmul); BACKEND_DNNL_ADD_PASS(pipeline, layout_propagation);