diff --git a/src/plugins/intel_gpu/src/runtime/execution_config.cpp b/src/plugins/intel_gpu/src/runtime/execution_config.cpp index f3b9058f7ebdc8..c418636ab6db78 100644 --- a/src/plugins/intel_gpu/src/runtime/execution_config.cpp +++ b/src/plugins/intel_gpu/src/runtime/execution_config.cpp @@ -256,6 +256,11 @@ void ExecutionConfig::apply_user_properties(const cldnn::device_info& info) { set_property(ov::intel_gpu::queue_type(QueueTypes::in_order)); } + // Enable KV-cache compression by default for non-systolic platforms + if (!info.supports_immad) { + set_property(ov::hint::kv_cache_precision(ov::element::i8)); + } + user_properties.clear(); }