diff --git a/src/plugins/intel_cpu/src/config.h b/src/plugins/intel_cpu/src/config.h index 75bfde2303a34f..44b78df043cee6 100644 --- a/src/plugins/intel_cpu/src/config.h +++ b/src/plugins/intel_cpu/src/config.h @@ -67,8 +67,8 @@ struct Config { // TODO: Executor cache may leads to incorrect behavior on oneDNN ACL primitives size_t rtCacheCapacity = 0ul; #endif - size_t keyCacheGroupSize = 0ul; - size_t valueCacheGroupSize = 0ul; + size_t keyCacheGroupSize = 32ul; + size_t valueCacheGroupSize = 32ul; ov::threading::IStreamsExecutor::Config streamExecutorConfig; int streams = 1; bool streamsChanged = false; diff --git a/src/plugins/intel_cpu/tests/functional/custom/subgraph_tests/src/classes/concat_sdp.cpp b/src/plugins/intel_cpu/tests/functional/custom/subgraph_tests/src/classes/concat_sdp.cpp index 83fc0a635546fc..ab893ac060f55b 100644 --- a/src/plugins/intel_cpu/tests/functional/custom/subgraph_tests/src/classes/concat_sdp.cpp +++ b/src/plugins/intel_cpu/tests/functional/custom/subgraph_tests/src/classes/concat_sdp.cpp @@ -76,6 +76,8 @@ void ConcatSDPTest::SetUp() { auto v_ps = inputDynamicShapes[0]; if (m_isDiffKVHeadSize) { v_ps[3] += m_diffKVHeadSize; + // v_ps[3] must be divisible by value_cache_group_size + configuration[ov::value_cache_group_size.name()] = "16"; } inputParams.push_back(std::make_shared(inType, v_ps)); inputParams[0]->set_friendly_name("q");