From dd848c2d683b0f593141920ea147729a9bc72879 Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Tue, 29 Oct 2024 18:35:52 +0800 Subject: [PATCH 01/30] add property enable_cpu_reservation --- .../include/openvino/runtime/properties.hpp | 18 ++ .../tests/unit/executor_config_test.cpp | 165 +++++++++++++++++- src/plugins/intel_cpu/src/compiled_model.cpp | 4 + src/plugins/intel_cpu/src/config.cpp | 10 ++ src/plugins/intel_cpu/src/config.h | 1 + .../intel_cpu/src/cpu_streams_calculation.cpp | 2 +- src/plugins/intel_cpu/src/plugin.cpp | 4 + src/plugins/intel_gpu/src/graph/program.cpp | 2 + .../intel_gpu/src/plugin/compiled_model.cpp | 3 + src/plugins/intel_gpu/src/plugin/plugin.cpp | 1 + .../src/runtime/execution_config.cpp | 7 + 11 files changed, 213 insertions(+), 4 deletions(-) diff --git a/src/inference/include/openvino/runtime/properties.hpp b/src/inference/include/openvino/runtime/properties.hpp index 627314748bbe9c..c714c77d6b062b 100644 --- a/src/inference/include/openvino/runtime/properties.hpp +++ b/src/inference/include/openvino/runtime/properties.hpp @@ -479,6 +479,24 @@ static constexpr Property> model_distribution_ */ static constexpr Property enable_cpu_pinning{"ENABLE_CPU_PINNING"}; +/** + * @brief This property allows CPU reservation during inference. + * @ingroup ov_runtime_cpp_prop_api + * + * Cpu Reservation means reserve cpus which will not be used by other plugin. Developer can use this property to + * enable or disable CPU reservation during inference on Windows and Linux. MacOS + * does not support CPU reservation, and this property is always disabled. + * This property defaults to false. If it explicitly set to true, cpu_pinning defaults to true. + * + * The following code is example to use this property. + * + * @code + * ie.set_property(ov::hint::enable_cpu_reservation(true)); + * ie.set_property(ov::hint::enable_cpu_reservation(false)); + * @endcode + */ +static constexpr Property enable_cpu_reservation{"ENABLE_CPU_RESERVATION"}; + /** * @brief This property define if using hyper threading during inference. * @ingroup ov_runtime_cpp_prop_api diff --git a/src/inference/tests/unit/executor_config_test.cpp b/src/inference/tests/unit/executor_config_test.cpp index 8e67d0d5039c50..09866836aab1bb 100644 --- a/src/inference/tests/unit/executor_config_test.cpp +++ b/src/inference/tests/unit/executor_config_test.cpp @@ -5,6 +5,7 @@ #include #include "common_test_utils/test_common.hpp" +#include "openvino/runtime/threading/cpu_streams_info.hpp" #include "openvino/runtime/threading/istreams_executor.hpp" #include "os/cpu_map_info.hpp" @@ -22,6 +23,7 @@ struct ExecutorConfigTestCase { int _num_streams; int _threads_per_stream; ov::hint::SchedulingCoreType _core_type; + bool _cpu_reservation; bool _cpu_pinning; std::vector> _streams_info_table_in; std::vector> _streams_info_table; @@ -45,13 +47,46 @@ class ExecutorConfigTest : public ov::test::TestsCommon, test_data._num_streams, test_data._threads_per_stream, test_data._core_type, - false, + test_data._cpu_reservation, test_data._cpu_pinning, test_data._streams_info_table_in}; - - ASSERT_EQ(test_data._cpu_pinning, config.get_cpu_pinning()); + ASSERT_EQ(test_data._cpu_reservation, config.get_cpu_reservation()); + if (test_data._cpu_reservation && !test_data._cpu_pinning) { + ASSERT_EQ(true, config.get_cpu_pinning()); + } else { + ASSERT_EQ(test_data._cpu_pinning, config.get_cpu_pinning()); + } ASSERT_EQ(test_data._streams_info_table, config.get_streams_info_table()); ASSERT_EQ(test_data._stream_processors, config.get_stream_processor_ids()); + if (test_data._cpu_reservation) { + std::vector> proc_type_table = test_data._proc_type_table; + for (size_t i = 0; i < test_data._streams_info_table.size(); i++) { + if (test_data._streams_info_table[i][PROC_TYPE] >= MAIN_CORE_PROC && + test_data._streams_info_table[i][PROC_TYPE] <= HYPER_THREADING_PROC) { + int nstreams = test_data._streams_info_table[i][NUMBER_OF_STREAMS] > 0 + ? test_data._streams_info_table[i][NUMBER_OF_STREAMS] + : 1; + int nthreads = nstreams * test_data._streams_info_table[i][THREADS_PER_STREAM]; + if (proc_type_table.size() > 1) { + for (size_t j = 0; j < proc_type_table.size(); j++) { + if (proc_type_table[j][PROC_NUMA_NODE_ID] == + test_data._streams_info_table[i][STREAM_NUMA_NODE_ID] && + proc_type_table[j][PROC_SOCKET_ID] == + test_data._streams_info_table[i][STREAM_SOCKET_ID]) { + proc_type_table[j][test_data._streams_info_table[i][PROC_TYPE]] -= nthreads; + proc_type_table[j][ALL_PROC] -= nthreads; + proc_type_table[0][test_data._streams_info_table[i][PROC_TYPE]] -= nthreads; + proc_type_table[0][ALL_PROC] -= nthreads; + } + } + } else { + proc_type_table[0][test_data._streams_info_table[i][PROC_TYPE]] -= nthreads; + proc_type_table[0][ALL_PROC] -= nthreads; + } + } + } + ASSERT_EQ(proc_type_table, cpu._proc_type_table); + } } }; @@ -79,6 +114,7 @@ ExecutorConfigTestCase _1sockets_streams_4_threads_1 = { 4, // param[in]: the number of streams 1, // param[in]: the number of threads per stream ov::hint::SchedulingCoreType::ANY_CORE, // param[in]: specified cpu core type + false, // param[in]: specified cpu reservation false, // param[in]: specified cpu pinning {}, // param[in]: streams info table // param[out]: streams_info_table, {NUMBER_OF_STREAMS, PROC_TYPE, THREADS_PER_STREAM, STREAM_NUMA_NODE_ID, @@ -112,6 +148,7 @@ ExecutorConfigTestCase _1sockets_streams_4_threads_0 = { 0, ov::hint::SchedulingCoreType::ANY_CORE, false, + false, {}, {}, {}, @@ -139,6 +176,7 @@ ExecutorConfigTestCase _1sockets_streams_1_threads_12 = { 12, ov::hint::SchedulingCoreType::ANY_CORE, false, + false, {}, { {1, ALL_PROC, 12, 0, 0}, @@ -170,6 +208,7 @@ ExecutorConfigTestCase _1sockets_streams_1_threads_10 = { 10, ov::hint::SchedulingCoreType::ANY_CORE, false, + false, {}, { {1, ALL_PROC, 10, 0, 0}, @@ -201,6 +240,7 @@ ExecutorConfigTestCase _1sockets_streams_12_threads_1 = { 1, ov::hint::SchedulingCoreType::ANY_CORE, false, + false, {}, { {6, MAIN_CORE_PROC, 1, 0, 0}, @@ -231,6 +271,7 @@ ExecutorConfigTestCase _1sockets_streams_13_threads_1 = { 1, ov::hint::SchedulingCoreType::ANY_CORE, false, + false, {}, { {6, MAIN_CORE_PROC, 1, 0, 0}, @@ -261,6 +302,7 @@ ExecutorConfigTestCase _1sockets_streams_6_threads_1_core_e = { 1, ov::hint::SchedulingCoreType::ECORE_ONLY, false, + false, {}, { {6, MAIN_CORE_PROC, 1, 0, 0}, @@ -291,6 +333,7 @@ ExecutorConfigTestCase _1sockets_streams_5_threads_1_binding = { 1, ov::hint::SchedulingCoreType::ANY_CORE, true, + true, {}, { {5, MAIN_CORE_PROC, 1, 0, 0}, @@ -346,6 +389,7 @@ ExecutorConfigTestCase _2sockets_streams_36_threads_1 = { 1, ov::hint::SchedulingCoreType::ANY_CORE, false, + false, {}, { {18, MAIN_CORE_PROC, 1, 0, 0}, @@ -402,6 +446,7 @@ ExecutorConfigTestCase _2sockets_streams_4_threads_5 = { 5, ov::hint::SchedulingCoreType::ANY_CORE, false, + false, {}, { {3, MAIN_CORE_PROC, 5, 0, 0}, @@ -458,6 +503,7 @@ ExecutorConfigTestCase _2sockets_streams_1_threads_36 = { 36, ov::hint::SchedulingCoreType::ANY_CORE, false, + false, {}, { {1, ALL_PROC, 36, -1, -1}, @@ -515,6 +561,7 @@ ExecutorConfigTestCase _2sockets_streams_1_threads_30 = { 30, ov::hint::SchedulingCoreType::ANY_CORE, false, + false, {}, { {1, ALL_PROC, 30, -1, -1}, @@ -524,6 +571,65 @@ ExecutorConfigTestCase _2sockets_streams_1_threads_30 = { {}, }; +ExecutorConfigTestCase _2sockets_streams_1_threads_30_binding = { + { + {72, 36, 0, 36, -1, -1}, + {36, 18, 0, 18, 0, 0}, + {36, 18, 0, 18, 1, 1}, + }, + { + {0, 0, 0, 0, HYPER_THREADING_PROC, 0, -1}, {1, 0, 0, 1, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 2, HYPER_THREADING_PROC, 2, -1}, {3, 0, 0, 3, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 4, HYPER_THREADING_PROC, 4, -1}, {5, 0, 0, 5, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 6, HYPER_THREADING_PROC, 6, -1}, {7, 0, 0, 7, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 8, HYPER_THREADING_PROC, 8, -1}, {9, 0, 0, 9, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 10, HYPER_THREADING_PROC, 10, -1}, {11, 0, 0, 11, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 12, HYPER_THREADING_PROC, 12, -1}, {13, 0, 0, 13, HYPER_THREADING_PROC, 13, -1}, + {14, 0, 0, 14, HYPER_THREADING_PROC, 14, -1}, {15, 0, 0, 15, HYPER_THREADING_PROC, 15, -1}, + {16, 0, 0, 16, HYPER_THREADING_PROC, 16, -1}, {17, 0, 0, 17, HYPER_THREADING_PROC, 17, -1}, + {18, 1, 1, 18, HYPER_THREADING_PROC, 18, -1}, {19, 1, 1, 19, HYPER_THREADING_PROC, 19, -1}, + {20, 1, 1, 20, HYPER_THREADING_PROC, 20, -1}, {21, 1, 1, 21, HYPER_THREADING_PROC, 21, -1}, + {22, 1, 1, 22, HYPER_THREADING_PROC, 22, -1}, {23, 1, 1, 23, HYPER_THREADING_PROC, 23, -1}, + {24, 1, 1, 24, HYPER_THREADING_PROC, 24, -1}, {25, 1, 1, 25, HYPER_THREADING_PROC, 25, -1}, + {26, 1, 1, 26, HYPER_THREADING_PROC, 26, -1}, {27, 1, 1, 27, HYPER_THREADING_PROC, 27, -1}, + {28, 1, 1, 28, HYPER_THREADING_PROC, 28, -1}, {29, 1, 1, 29, HYPER_THREADING_PROC, 29, -1}, + {30, 1, 1, 30, HYPER_THREADING_PROC, 30, -1}, {31, 1, 1, 31, HYPER_THREADING_PROC, 31, -1}, + {32, 1, 1, 32, HYPER_THREADING_PROC, 32, -1}, {33, 1, 1, 33, HYPER_THREADING_PROC, 33, -1}, + {34, 1, 1, 34, HYPER_THREADING_PROC, 34, -1}, {35, 1, 1, 35, HYPER_THREADING_PROC, 35, -1}, + {36, 0, 0, 36, MAIN_CORE_PROC, 36, -1}, {37, 0, 0, 37, MAIN_CORE_PROC, 37, -1}, + {38, 0, 0, 38, MAIN_CORE_PROC, 38, -1}, {39, 0, 0, 39, MAIN_CORE_PROC, 39, -1}, + {40, 0, 0, 40, MAIN_CORE_PROC, 40, -1}, {41, 0, 0, 41, MAIN_CORE_PROC, 41, -1}, + {42, 0, 0, 42, MAIN_CORE_PROC, 42, -1}, {43, 0, 0, 43, MAIN_CORE_PROC, 43, -1}, + {44, 0, 0, 44, MAIN_CORE_PROC, 44, -1}, {45, 0, 0, 45, MAIN_CORE_PROC, 45, -1}, + {46, 0, 0, 46, MAIN_CORE_PROC, 46, -1}, {47, 0, 0, 47, MAIN_CORE_PROC, 47, -1}, + {48, 0, 0, 48, MAIN_CORE_PROC, 48, -1}, {49, 0, 0, 49, MAIN_CORE_PROC, 49, -1}, + {50, 0, 0, 50, MAIN_CORE_PROC, 50, -1}, {51, 0, 0, 51, MAIN_CORE_PROC, 51, -1}, + {52, 0, 0, 52, MAIN_CORE_PROC, 52, -1}, {53, 0, 0, 53, MAIN_CORE_PROC, 53, -1}, + {54, 1, 1, 54, MAIN_CORE_PROC, 54, -1}, {55, 1, 1, 55, MAIN_CORE_PROC, 55, -1}, + {56, 1, 1, 56, MAIN_CORE_PROC, 56, -1}, {57, 1, 1, 57, MAIN_CORE_PROC, 57, -1}, + {58, 1, 1, 58, MAIN_CORE_PROC, 58, -1}, {59, 1, 1, 59, MAIN_CORE_PROC, 59, -1}, + {60, 1, 1, 60, MAIN_CORE_PROC, 60, -1}, {61, 1, 1, 61, MAIN_CORE_PROC, 61, -1}, + {62, 1, 1, 62, MAIN_CORE_PROC, 62, -1}, {63, 1, 1, 63, MAIN_CORE_PROC, 63, -1}, + {64, 1, 1, 64, MAIN_CORE_PROC, 64, -1}, {65, 1, 1, 65, MAIN_CORE_PROC, 65, -1}, + {66, 1, 1, 66, MAIN_CORE_PROC, 66, -1}, {67, 1, 1, 67, MAIN_CORE_PROC, 67, -1}, + {68, 1, 1, 68, MAIN_CORE_PROC, 68, -1}, {69, 1, 1, 69, MAIN_CORE_PROC, 69, -1}, + {70, 1, 1, 70, MAIN_CORE_PROC, 70, -1}, {71, 1, 1, 71, MAIN_CORE_PROC, 71, -1}, + }, + 1, + 30, + ov::hint::SchedulingCoreType::ANY_CORE, + true, + false, + {}, + { + {1, ALL_PROC, 30, -1, -1}, + {0, MAIN_CORE_PROC, 18, 0, 0}, + {0, MAIN_CORE_PROC, 12, 1, 1}, + }, + {{36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, + 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65}}, +}; + ExecutorConfigTestCase _pecore_streams_5_threads_2 = { { {24, 8, 8, 8, 0, 0}, @@ -546,6 +652,7 @@ ExecutorConfigTestCase _pecore_streams_5_threads_2 = { 2, ov::hint::SchedulingCoreType::ANY_CORE, false, + false, {}, { {4, MAIN_CORE_PROC, 2, 0, 0}, @@ -576,6 +683,7 @@ ExecutorConfigTestCase _pecore_streams_5_threads_5 = { 5, ov::hint::SchedulingCoreType::ANY_CORE, false, + false, {}, { {2, MAIN_CORE_PROC, 4, 0, 0}, @@ -607,6 +715,7 @@ ExecutorConfigTestCase _pecore_streams_4_threads_5 = { 5, ov::hint::SchedulingCoreType::ANY_CORE, false, + false, {}, { {1, MAIN_CORE_PROC, 5, 0, 0}, @@ -638,6 +747,7 @@ ExecutorConfigTestCase _pecore_streams_4_threads_1 = { 1, ov::hint::SchedulingCoreType::ANY_CORE, false, + false, {}, { {4, MAIN_CORE_PROC, 1, 0, 0}, @@ -667,6 +777,7 @@ ExecutorConfigTestCase _pecore_streams_5_threads_10 = { 10, ov::hint::SchedulingCoreType::ANY_CORE, false, + false, {}, { {2, MAIN_CORE_PROC, 4, 0, 0}, @@ -698,6 +809,7 @@ ExecutorConfigTestCase _pecore_streams_26_threads_1 = { 1, ov::hint::SchedulingCoreType::ANY_CORE, false, + false, {}, { {8, MAIN_CORE_PROC, 1, 0, 0}, @@ -729,6 +841,7 @@ ExecutorConfigTestCase _pecore_streams_26_threads_1_p = { 1, ov::hint::SchedulingCoreType::PCORE_ONLY, false, + false, {}, { {8, MAIN_CORE_PROC, 1, 0, 0}, @@ -759,6 +872,7 @@ ExecutorConfigTestCase _pecore_streams_26_threads_1_e = { 1, ov::hint::SchedulingCoreType::ECORE_ONLY, false, + false, {}, { {8, EFFICIENT_CORE_PROC, 1, 0, 0}, @@ -788,6 +902,7 @@ ExecutorConfigTestCase _pecore_streams_1_threads_0 = { 0, ov::hint::SchedulingCoreType::ANY_CORE, false, + false, {}, {}, {}, @@ -815,6 +930,7 @@ ExecutorConfigTestCase _pecore_streams_1_threads_1_p = { 1, ov::hint::SchedulingCoreType::PCORE_ONLY, false, + false, {}, { {1, MAIN_CORE_PROC, 1, 0, 0}, @@ -844,6 +960,7 @@ ExecutorConfigTestCase _pecore_streams_1_threads_1_e = { 1, ov::hint::SchedulingCoreType::ECORE_ONLY, false, + false, {}, { {1, EFFICIENT_CORE_PROC, 1, 0, 0}, @@ -873,6 +990,7 @@ ExecutorConfigTestCase _pecore_streams_1_threads_16_p = { 16, ov::hint::SchedulingCoreType::PCORE_ONLY, false, + false, {}, { {1, ALL_PROC, 16, 0, 0}, @@ -904,6 +1022,7 @@ ExecutorConfigTestCase _pecore_streams_1_threads_18_p = { 18, ov::hint::SchedulingCoreType::PCORE_ONLY, false, + false, {}, { {1, ALL_PROC, 16, 0, 0}, @@ -935,6 +1054,7 @@ ExecutorConfigTestCase _pecore_streams_1_threads_10_p = { 10, ov::hint::SchedulingCoreType::PCORE_ONLY, false, + false, {}, { {1, ALL_PROC, 10, 0, 0}, @@ -966,6 +1086,7 @@ ExecutorConfigTestCase _pecore_streams_10_threads_1_e = { 1, ov::hint::SchedulingCoreType::ECORE_ONLY, false, + false, {}, { {8, EFFICIENT_CORE_PROC, 1, 0, 0}, @@ -995,6 +1116,39 @@ ExecutorConfigTestCase _pecore_streams_10_threads_1_binding = { 2, ov::hint::SchedulingCoreType::ANY_CORE, true, + true, + {}, + { + {4, MAIN_CORE_PROC, 2, 0, 0}, + {4, EFFICIENT_CORE_PROC, 2, 0, 0}, + {2, HYPER_THREADING_PROC, 2, 0, 0}, + }, + {{0, 2}, {4, 6}, {8, 10}, {12, 14}, {16, 17}, {18, 19}, {20, 21}, {22, 23}, {1, 3}, {5, 7}}, +}; + +ExecutorConfigTestCase _pecore_streams_10_threads_2_reservation = { + { + {24, 8, 8, 8, 0, 0}, + }, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, {1, 0, 0, 0, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 1, MAIN_CORE_PROC, 2, -1}, {3, 0, 0, 1, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 2, MAIN_CORE_PROC, 4, -1}, {5, 0, 0, 2, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 3, MAIN_CORE_PROC, 6, -1}, {7, 0, 0, 3, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 4, MAIN_CORE_PROC, 8, -1}, {9, 0, 0, 4, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 5, MAIN_CORE_PROC, 10, -1}, {11, 0, 0, 5, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 6, MAIN_CORE_PROC, 12, -1}, {13, 0, 0, 6, HYPER_THREADING_PROC, 13, -1}, + {14, 0, 0, 7, MAIN_CORE_PROC, 14, -1}, {15, 0, 0, 7, HYPER_THREADING_PROC, 15, -1}, + {16, 0, 0, 8, EFFICIENT_CORE_PROC, 16, -1}, {17, 0, 0, 9, EFFICIENT_CORE_PROC, 17, -1}, + {18, 0, 0, 10, EFFICIENT_CORE_PROC, 18, -1}, {19, 0, 0, 11, EFFICIENT_CORE_PROC, 19, -1}, + {20, 0, 0, 12, EFFICIENT_CORE_PROC, 20, -1}, {21, 0, 0, 13, EFFICIENT_CORE_PROC, 21, -1}, + {22, 0, 0, 14, EFFICIENT_CORE_PROC, 22, -1}, {23, 0, 0, 15, EFFICIENT_CORE_PROC, 23, -1}, + }, + 10, + 2, + ov::hint::SchedulingCoreType::ANY_CORE, + true, + false, {}, { {4, MAIN_CORE_PROC, 2, 0, 0}, @@ -1026,6 +1180,7 @@ ExecutorConfigTestCase _pecore_streams_info_table_1 = { 8, ov::hint::SchedulingCoreType::PCORE_ONLY, false, + false, { {2, MAIN_CORE_PROC, 2, 0, 0}, {2, EFFICIENT_CORE_PROC, 2, 0, 0}, @@ -1059,6 +1214,7 @@ ExecutorConfigTestCase _pecore_streams_info_table_2 = { 8, ov::hint::SchedulingCoreType::PCORE_ONLY, false, + false, { {5, MAIN_CORE_PROC, 2, 0, 0}, {2, EFFICIENT_CORE_PROC, 2, 0, 0}, @@ -1091,6 +1247,7 @@ ExecutorConfigTestCase _pecore_streams_info_table_3 = { 8, ov::hint::SchedulingCoreType::PCORE_ONLY, true, + true, { {2, MAIN_CORE_PROC, 2, 0, 0}, {2, EFFICIENT_CORE_PROC, 2, 0, 0}, @@ -1120,6 +1277,7 @@ INSTANTIATE_TEST_SUITE_P(smoke_ExecutorConfig, _2sockets_streams_4_threads_5, _2sockets_streams_1_threads_36, _2sockets_streams_1_threads_30, + _2sockets_streams_1_threads_30_binding, _pecore_streams_5_threads_2, _pecore_streams_5_threads_5, _pecore_streams_4_threads_5, @@ -1136,6 +1294,7 @@ INSTANTIATE_TEST_SUITE_P(smoke_ExecutorConfig, _pecore_streams_1_threads_10_p, _pecore_streams_10_threads_1_e, _pecore_streams_10_threads_1_binding, + _pecore_streams_10_threads_2_reservation, _pecore_streams_info_table_1, _pecore_streams_info_table_2, _pecore_streams_info_table_3)); diff --git a/src/plugins/intel_cpu/src/compiled_model.cpp b/src/plugins/intel_cpu/src/compiled_model.cpp index bbee5d937be5d5..1d2d76c3b4b8bd 100644 --- a/src/plugins/intel_cpu/src/compiled_model.cpp +++ b/src/plugins/intel_cpu/src/compiled_model.cpp @@ -247,6 +247,7 @@ ov::Any CompiledModel::get_property(const std::string& name) const { RO_property(ov::hint::execution_mode.name()), RO_property(ov::hint::num_requests.name()), RO_property(ov::hint::enable_cpu_pinning.name()), + RO_property(ov::hint::enable_cpu_reservation.name()), RO_property(ov::hint::scheduling_core_type.name()), RO_property(ov::hint::model_distribution_policy.name()), RO_property(ov::hint::enable_hyper_threading.name()), @@ -307,6 +308,9 @@ ov::Any CompiledModel::get_property(const std::string& name) const { } else if (name == ov::hint::enable_cpu_pinning.name()) { const bool use_pin = config.enableCpuPinning; return decltype(ov::hint::enable_cpu_pinning)::value_type(use_pin); + } else if (name == ov::hint::enable_cpu_reservation.name()) { + const bool use_reserve = config.enableCpuReservation; + return decltype(ov::hint::enable_cpu_reservation)::value_type(use_reserve); } else if (name == ov::hint::scheduling_core_type) { const auto stream_mode = config.schedulingCoreType; return stream_mode; diff --git a/src/plugins/intel_cpu/src/config.cpp b/src/plugins/intel_cpu/src/config.cpp index 421dca07747932..6d50abf348f283 100644 --- a/src/plugins/intel_cpu/src/config.cpp +++ b/src/plugins/intel_cpu/src/config.cpp @@ -178,6 +178,16 @@ void Config::readProperties(const ov::AnyMap& prop, const ModelType modelType) { ov::hint::enable_cpu_pinning.name(), ". Expected only true/false."); } + } else if (key == ov::hint::enable_cpu_reservation.name()) { + try { + enableCpuReservation = val.as(); + } catch (ov::Exception&) { + OPENVINO_THROW("Wrong value ", + val.as(), + "for property key ", + ov::hint::enable_cpu_reservation.name(), + ". Expected only true/false."); + } } else if (key == ov::hint::scheduling_core_type.name()) { try { schedulingCoreType = val.as(); diff --git a/src/plugins/intel_cpu/src/config.h b/src/plugins/intel_cpu/src/config.h index 79cdf3a5e827ec..3592f6da6f43dc 100644 --- a/src/plugins/intel_cpu/src/config.h +++ b/src/plugins/intel_cpu/src/config.h @@ -75,6 +75,7 @@ struct Config { uint32_t hintNumRequests = 0; bool enableCpuPinning = true; bool changedCpuPinning = false; + bool enableCpuReservation = false; ov::hint::SchedulingCoreType schedulingCoreType = ov::hint::SchedulingCoreType::ANY_CORE; std::set modelDistributionPolicy = {}; int streamsRankLevel = 1; diff --git a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp index 7f5f968b10c3fe..8125e8983b8c5f 100644 --- a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp +++ b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp @@ -691,7 +691,7 @@ std::vector> generate_stream_info(const int streams, config.streams, config.threadsPerStream, ov::hint::SchedulingCoreType::ANY_CORE, - false, + config.enableCpuReservation, cpu_pinning, streams_info_table}; diff --git a/src/plugins/intel_cpu/src/plugin.cpp b/src/plugins/intel_cpu/src/plugin.cpp index 5c88772eeedabc..79c607a0a74eb2 100644 --- a/src/plugins/intel_cpu/src/plugin.cpp +++ b/src/plugins/intel_cpu/src/plugin.cpp @@ -346,6 +346,9 @@ ov::Any Plugin::get_property(const std::string& name, const ov::AnyMap& options) } else if (name == ov::hint::enable_cpu_pinning) { const bool pin_value = engConfig.enableCpuPinning; return decltype(ov::hint::enable_cpu_pinning)::value_type(pin_value); + } else if (name == ov::hint::enable_cpu_reservation) { + const bool reserve_value = engConfig.enableCpuReservation; + return decltype(ov::hint::enable_cpu_reservation)::value_type(reserve_value); } else if (name == ov::hint::scheduling_core_type) { const auto core_type = engConfig.schedulingCoreType; return core_type; @@ -422,6 +425,7 @@ ov::Any Plugin::get_ro_property(const std::string& name, const ov::AnyMap& optio RW_property(ov::hint::execution_mode.name()), RW_property(ov::hint::num_requests.name()), RW_property(ov::hint::enable_cpu_pinning.name()), + RW_property(ov::hint::enable_cpu_reservation.name()), RW_property(ov::hint::scheduling_core_type.name()), RW_property(ov::hint::model_distribution_policy.name()), RW_property(ov::hint::enable_hyper_threading.name()), diff --git a/src/plugins/intel_gpu/src/graph/program.cpp b/src/plugins/intel_gpu/src/graph/program.cpp index 1e2e84043dc82b..16d23b1ebfb099 100644 --- a/src/plugins/intel_gpu/src/graph/program.cpp +++ b/src/plugins/intel_gpu/src/graph/program.cpp @@ -113,11 +113,13 @@ static ov::threading::IStreamsExecutor::Config make_task_executor_config(const E default: OPENVINO_ASSERT(false, "[GPU] Can't create task executor: invalid host task priority value: ", priority); } bool enable_cpu_pinning = config.get_property(ov::hint::enable_cpu_pinning); + bool enable_cpu_reservation = config.get_property(ov::hint::enable_cpu_reservation); ov::threading::IStreamsExecutor::Config task_executor_config(tags, streams, 1, core_type, + enable_cpu_reservation, enable_cpu_pinning); return task_executor_config; diff --git a/src/plugins/intel_gpu/src/plugin/compiled_model.cpp b/src/plugins/intel_gpu/src/plugin/compiled_model.cpp index 15ff4447b4bafe..573bb8a2f83648 100644 --- a/src/plugins/intel_gpu/src/plugin/compiled_model.cpp +++ b/src/plugins/intel_gpu/src/plugin/compiled_model.cpp @@ -25,11 +25,13 @@ std::shared_ptr create_task_executor(const std::sh // the CPU behavior return plugin->get_executor_manager()->get_executor("GPU"); } else if (config.get_property(ov::hint::enable_cpu_pinning)) { + bool enable_cpu_reservation = config.get_property(ov::hint::enable_cpu_reservation); return std::make_shared( ov::threading::IStreamsExecutor::Config{"Intel GPU plugin executor", config.get_property(ov::num_streams), 1, ov::hint::SchedulingCoreType::PCORE_ONLY, + enable_cpu_reservation, true}); } else { return std::make_shared( @@ -242,6 +244,7 @@ ov::Any CompiledModel::get_property(const std::string& name) const { // Configs ov::PropertyName{ov::enable_profiling.name(), PropertyMutability::RO}, ov::PropertyName{ov::hint::enable_cpu_pinning.name(), PropertyMutability::RO}, + ov::PropertyName{ov::hint::enable_cpu_reservation.name(), PropertyMutability::RO}, ov::PropertyName{ov::hint::model_priority.name(), PropertyMutability::RO}, ov::PropertyName{ov::intel_gpu::hint::host_task_priority.name(), PropertyMutability::RO}, ov::PropertyName{ov::intel_gpu::hint::queue_priority.name(), PropertyMutability::RO}, diff --git a/src/plugins/intel_gpu/src/plugin/plugin.cpp b/src/plugins/intel_gpu/src/plugin/plugin.cpp index 2d29601ef0b69d..4ba8ba3a70d646 100644 --- a/src/plugins/intel_gpu/src/plugin/plugin.cpp +++ b/src/plugins/intel_gpu/src/plugin/plugin.cpp @@ -564,6 +564,7 @@ std::vector Plugin::get_supported_properties() const { ov::PropertyName{ov::hint::num_requests.name(), PropertyMutability::RW}, ov::PropertyName{ov::hint::inference_precision.name(), PropertyMutability::RW}, ov::PropertyName{ov::hint::enable_cpu_pinning.name(), PropertyMutability::RW}, + ov::PropertyName{ov::hint::enable_cpu_reservation.name(), PropertyMutability::RW}, ov::PropertyName{ov::device::id.name(), PropertyMutability::RW}, ov::PropertyName{ov::hint::dynamic_quantization_group_size.name(), PropertyMutability::RW} }; diff --git a/src/plugins/intel_gpu/src/runtime/execution_config.cpp b/src/plugins/intel_gpu/src/runtime/execution_config.cpp index 7661444cc4fd7b..70e74d46378b42 100644 --- a/src/plugins/intel_gpu/src/runtime/execution_config.cpp +++ b/src/plugins/intel_gpu/src/runtime/execution_config.cpp @@ -46,6 +46,7 @@ void ExecutionConfig::set_default() { std::make_tuple(ov::hint::execution_mode, ov::hint::ExecutionMode::PERFORMANCE), std::make_tuple(ov::hint::num_requests, 0), std::make_tuple(ov::hint::enable_cpu_pinning, false), + std::make_tuple(ov::hint::enable_cpu_reservation, false), std::make_tuple(ov::intel_gpu::hint::host_task_priority, ov::hint::Priority::MEDIUM), std::make_tuple(ov::intel_gpu::hint::queue_throttle, ov::intel_gpu::hint::ThrottleLevel::MEDIUM), @@ -235,6 +236,12 @@ void ExecutionConfig::apply_user_properties(const cldnn::device_info& info) { if (info.supports_immad) { set_property(ov::intel_gpu::queue_type(QueueTypes::in_order)); } + if (!is_set_by_user(ov::hint::enable_cpu_reservation)) { + bool enable_cpu_pinning = get_property(ov::hint::enable_cpu_pinning); + if (enable_cpu_pinning) { + set_property(ov::hint::enable_cpu_reservation(true)); + } + } user_properties.clear(); } From 23a6e4283551da4db5c7b02d378fb237163cf54c Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Tue, 29 Oct 2024 23:43:08 +0800 Subject: [PATCH 02/30] update enable_cpu_pinning when enable_cpu_reservation=true && enable_cpu_pinning=false in GPU plugin --- src/plugins/intel_gpu/src/runtime/execution_config.cpp | 3 +++ .../behavior/ov_plugin/properties_tests.cpp | 1 + 2 files changed, 4 insertions(+) diff --git a/src/plugins/intel_gpu/src/runtime/execution_config.cpp b/src/plugins/intel_gpu/src/runtime/execution_config.cpp index 70e74d46378b42..8b13c23c5e4ef4 100644 --- a/src/plugins/intel_gpu/src/runtime/execution_config.cpp +++ b/src/plugins/intel_gpu/src/runtime/execution_config.cpp @@ -242,6 +242,9 @@ void ExecutionConfig::apply_user_properties(const cldnn::device_info& info) { set_property(ov::hint::enable_cpu_reservation(true)); } } + if (get_property(ov::hint::enable_cpu_reservation) && !get_property(ov::hint::enable_cpu_pinning)) { + set_property(ov::hint::enable_cpu_pinning(true)); + } user_properties.clear(); } diff --git a/src/plugins/intel_gpu/tests/functional/shared_tests_instances/behavior/ov_plugin/properties_tests.cpp b/src/plugins/intel_gpu/tests/functional/shared_tests_instances/behavior/ov_plugin/properties_tests.cpp index e502636c36e8df..f89af230327e40 100644 --- a/src/plugins/intel_gpu/tests/functional/shared_tests_instances/behavior/ov_plugin/properties_tests.cpp +++ b/src/plugins/intel_gpu/tests/functional/shared_tests_instances/behavior/ov_plugin/properties_tests.cpp @@ -33,6 +33,7 @@ const std::vector gpu_compileModel_properties = { {ov::hint::performance_mode(ov::hint::PerformanceMode::LATENCY), ov::hint::num_requests(10), ov::hint::enable_cpu_pinning(true), + ov::hint::enable_cpu_reservation(false), ov::enable_profiling(true)}}; INSTANTIATE_TEST_SUITE_P(smoke_gpuCompileModelBehaviorTests, From ce804eef9b1e2228b9d9cd3031b3527006a13010 Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Wed, 30 Oct 2024 17:12:35 +0800 Subject: [PATCH 03/30] update test case --- .../tests/unit/executor_config_test.cpp | 122 ++++++++++++++++++ 1 file changed, 122 insertions(+) diff --git a/src/inference/tests/unit/executor_config_test.cpp b/src/inference/tests/unit/executor_config_test.cpp index 09866836aab1bb..a3ca2624294ff7 100644 --- a/src/inference/tests/unit/executor_config_test.cpp +++ b/src/inference/tests/unit/executor_config_test.cpp @@ -312,6 +312,66 @@ ExecutorConfigTestCase _1sockets_streams_6_threads_1_core_e = { }; ExecutorConfigTestCase _1sockets_streams_5_threads_1_binding = { + { + {12, 6, 0, 6, 0, 0}, + }, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, + {1, 0, 0, 0, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 1, MAIN_CORE_PROC, 2, -1}, + {3, 0, 0, 1, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 2, MAIN_CORE_PROC, 4, -1}, + {5, 0, 0, 2, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 3, MAIN_CORE_PROC, 6, -1}, + {7, 0, 0, 3, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 4, MAIN_CORE_PROC, 8, -1}, + {9, 0, 0, 4, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 5, MAIN_CORE_PROC, 10, -1}, + {11, 0, 0, 5, HYPER_THREADING_PROC, 11, -1}, + }, + 5, + 1, + ov::hint::SchedulingCoreType::ANY_CORE, + false, + true, + {}, + { + {5, MAIN_CORE_PROC, 1, 0, 0}, + }, + {{0}, {2}, {4}, {6}, {8}}, +}; + +ExecutorConfigTestCase _1sockets_streams_5_threads_1_reservation = { + { + {12, 6, 0, 6, 0, 0}, + }, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, + {1, 0, 0, 0, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 1, MAIN_CORE_PROC, 2, -1}, + {3, 0, 0, 1, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 2, MAIN_CORE_PROC, 4, -1}, + {5, 0, 0, 2, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 3, MAIN_CORE_PROC, 6, -1}, + {7, 0, 0, 3, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 4, MAIN_CORE_PROC, 8, -1}, + {9, 0, 0, 4, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 5, MAIN_CORE_PROC, 10, -1}, + {11, 0, 0, 5, HYPER_THREADING_PROC, 11, -1}, + }, + 5, + 1, + ov::hint::SchedulingCoreType::ANY_CORE, + true, + false, + {}, + { + {5, MAIN_CORE_PROC, 1, 0, 0}, + }, + {{0}, {2}, {4}, {6}, {8}}, +}; + +ExecutorConfigTestCase _1sockets_streams_5_threads_1_binding_reservation = { { {12, 6, 0, 6, 0, 0}, }, @@ -572,6 +632,65 @@ ExecutorConfigTestCase _2sockets_streams_1_threads_30 = { }; ExecutorConfigTestCase _2sockets_streams_1_threads_30_binding = { + { + {72, 36, 0, 36, -1, -1}, + {36, 18, 0, 18, 0, 0}, + {36, 18, 0, 18, 1, 1}, + }, + { + {0, 0, 0, 0, HYPER_THREADING_PROC, 0, -1}, {1, 0, 0, 1, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 2, HYPER_THREADING_PROC, 2, -1}, {3, 0, 0, 3, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 4, HYPER_THREADING_PROC, 4, -1}, {5, 0, 0, 5, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 6, HYPER_THREADING_PROC, 6, -1}, {7, 0, 0, 7, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 8, HYPER_THREADING_PROC, 8, -1}, {9, 0, 0, 9, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 10, HYPER_THREADING_PROC, 10, -1}, {11, 0, 0, 11, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 12, HYPER_THREADING_PROC, 12, -1}, {13, 0, 0, 13, HYPER_THREADING_PROC, 13, -1}, + {14, 0, 0, 14, HYPER_THREADING_PROC, 14, -1}, {15, 0, 0, 15, HYPER_THREADING_PROC, 15, -1}, + {16, 0, 0, 16, HYPER_THREADING_PROC, 16, -1}, {17, 0, 0, 17, HYPER_THREADING_PROC, 17, -1}, + {18, 1, 1, 18, HYPER_THREADING_PROC, 18, -1}, {19, 1, 1, 19, HYPER_THREADING_PROC, 19, -1}, + {20, 1, 1, 20, HYPER_THREADING_PROC, 20, -1}, {21, 1, 1, 21, HYPER_THREADING_PROC, 21, -1}, + {22, 1, 1, 22, HYPER_THREADING_PROC, 22, -1}, {23, 1, 1, 23, HYPER_THREADING_PROC, 23, -1}, + {24, 1, 1, 24, HYPER_THREADING_PROC, 24, -1}, {25, 1, 1, 25, HYPER_THREADING_PROC, 25, -1}, + {26, 1, 1, 26, HYPER_THREADING_PROC, 26, -1}, {27, 1, 1, 27, HYPER_THREADING_PROC, 27, -1}, + {28, 1, 1, 28, HYPER_THREADING_PROC, 28, -1}, {29, 1, 1, 29, HYPER_THREADING_PROC, 29, -1}, + {30, 1, 1, 30, HYPER_THREADING_PROC, 30, -1}, {31, 1, 1, 31, HYPER_THREADING_PROC, 31, -1}, + {32, 1, 1, 32, HYPER_THREADING_PROC, 32, -1}, {33, 1, 1, 33, HYPER_THREADING_PROC, 33, -1}, + {34, 1, 1, 34, HYPER_THREADING_PROC, 34, -1}, {35, 1, 1, 35, HYPER_THREADING_PROC, 35, -1}, + {36, 0, 0, 36, MAIN_CORE_PROC, 36, -1}, {37, 0, 0, 37, MAIN_CORE_PROC, 37, -1}, + {38, 0, 0, 38, MAIN_CORE_PROC, 38, -1}, {39, 0, 0, 39, MAIN_CORE_PROC, 39, -1}, + {40, 0, 0, 40, MAIN_CORE_PROC, 40, -1}, {41, 0, 0, 41, MAIN_CORE_PROC, 41, -1}, + {42, 0, 0, 42, MAIN_CORE_PROC, 42, -1}, {43, 0, 0, 43, MAIN_CORE_PROC, 43, -1}, + {44, 0, 0, 44, MAIN_CORE_PROC, 44, -1}, {45, 0, 0, 45, MAIN_CORE_PROC, 45, -1}, + {46, 0, 0, 46, MAIN_CORE_PROC, 46, -1}, {47, 0, 0, 47, MAIN_CORE_PROC, 47, -1}, + {48, 0, 0, 48, MAIN_CORE_PROC, 48, -1}, {49, 0, 0, 49, MAIN_CORE_PROC, 49, -1}, + {50, 0, 0, 50, MAIN_CORE_PROC, 50, -1}, {51, 0, 0, 51, MAIN_CORE_PROC, 51, -1}, + {52, 0, 0, 52, MAIN_CORE_PROC, 52, -1}, {53, 0, 0, 53, MAIN_CORE_PROC, 53, -1}, + {54, 1, 1, 54, MAIN_CORE_PROC, 54, -1}, {55, 1, 1, 55, MAIN_CORE_PROC, 55, -1}, + {56, 1, 1, 56, MAIN_CORE_PROC, 56, -1}, {57, 1, 1, 57, MAIN_CORE_PROC, 57, -1}, + {58, 1, 1, 58, MAIN_CORE_PROC, 58, -1}, {59, 1, 1, 59, MAIN_CORE_PROC, 59, -1}, + {60, 1, 1, 60, MAIN_CORE_PROC, 60, -1}, {61, 1, 1, 61, MAIN_CORE_PROC, 61, -1}, + {62, 1, 1, 62, MAIN_CORE_PROC, 62, -1}, {63, 1, 1, 63, MAIN_CORE_PROC, 63, -1}, + {64, 1, 1, 64, MAIN_CORE_PROC, 64, -1}, {65, 1, 1, 65, MAIN_CORE_PROC, 65, -1}, + {66, 1, 1, 66, MAIN_CORE_PROC, 66, -1}, {67, 1, 1, 67, MAIN_CORE_PROC, 67, -1}, + {68, 1, 1, 68, MAIN_CORE_PROC, 68, -1}, {69, 1, 1, 69, MAIN_CORE_PROC, 69, -1}, + {70, 1, 1, 70, MAIN_CORE_PROC, 70, -1}, {71, 1, 1, 71, MAIN_CORE_PROC, 71, -1}, + }, + 1, + 30, + ov::hint::SchedulingCoreType::ANY_CORE, + false, + true, + {}, + { + {1, ALL_PROC, 30, -1, -1}, + {0, MAIN_CORE_PROC, 18, 0, 0}, + {0, MAIN_CORE_PROC, 12, 1, 1}, + }, + {{36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, + 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65}}, +}; + +ExecutorConfigTestCase _2sockets_streams_1_threads_30_reservation = { { {72, 36, 0, 36, -1, -1}, {36, 18, 0, 18, 0, 0}, @@ -1273,11 +1392,14 @@ INSTANTIATE_TEST_SUITE_P(smoke_ExecutorConfig, _1sockets_streams_13_threads_1, _1sockets_streams_6_threads_1_core_e, _1sockets_streams_5_threads_1_binding, + _1sockets_streams_5_threads_1_reservation, + _1sockets_streams_5_threads_1_binding_reservation, _2sockets_streams_36_threads_1, _2sockets_streams_4_threads_5, _2sockets_streams_1_threads_36, _2sockets_streams_1_threads_30, _2sockets_streams_1_threads_30_binding, + _2sockets_streams_1_threads_30_reservation, _pecore_streams_5_threads_2, _pecore_streams_5_threads_5, _pecore_streams_4_threads_5, From bf63bf9fb18ac5b43b4e4281f2e9aa567ce429b7 Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Tue, 12 Nov 2024 23:53:51 +0800 Subject: [PATCH 04/30] support cpu_reservation=true,cpu_pinning=false --- src/inference/src/dev/threading/istreams_executor.cpp | 6 +----- src/inference/tests/unit/executor_config_test.cpp | 6 +----- src/plugins/intel_gpu/src/runtime/execution_config.cpp | 6 +----- 3 files changed, 3 insertions(+), 15 deletions(-) diff --git a/src/inference/src/dev/threading/istreams_executor.cpp b/src/inference/src/dev/threading/istreams_executor.cpp index 53a0c32806c6aa..4712ae3af193c4 100644 --- a/src/inference/src/dev/threading/istreams_executor.cpp +++ b/src/inference/src/dev/threading/istreams_executor.cpp @@ -163,10 +163,6 @@ void IStreamsExecutor::Config::update_executor_config() { return; } - if (_cpu_reservation && !_cpu_pinning) { - _cpu_pinning = true; - } - if (!_streams_info_table.empty()) { streams_info_available = true; std::vector threads_proc_type(HYPER_THREADING_PROC + 1, 0); @@ -265,7 +261,7 @@ void IStreamsExecutor::Config::update_executor_config() { } } - if (_cpu_pinning) { + if (_cpu_pinning || _cpu_reservation) { reserve_available_cpus(_streams_info_table, _stream_processor_ids, _cpu_reservation ? CPU_USED : NOT_USED); } diff --git a/src/inference/tests/unit/executor_config_test.cpp b/src/inference/tests/unit/executor_config_test.cpp index a3ca2624294ff7..ea117d8fa0c72a 100644 --- a/src/inference/tests/unit/executor_config_test.cpp +++ b/src/inference/tests/unit/executor_config_test.cpp @@ -51,11 +51,7 @@ class ExecutorConfigTest : public ov::test::TestsCommon, test_data._cpu_pinning, test_data._streams_info_table_in}; ASSERT_EQ(test_data._cpu_reservation, config.get_cpu_reservation()); - if (test_data._cpu_reservation && !test_data._cpu_pinning) { - ASSERT_EQ(true, config.get_cpu_pinning()); - } else { - ASSERT_EQ(test_data._cpu_pinning, config.get_cpu_pinning()); - } + ASSERT_EQ(test_data._cpu_pinning, config.get_cpu_pinning()); ASSERT_EQ(test_data._streams_info_table, config.get_streams_info_table()); ASSERT_EQ(test_data._stream_processors, config.get_stream_processor_ids()); if (test_data._cpu_reservation) { diff --git a/src/plugins/intel_gpu/src/runtime/execution_config.cpp b/src/plugins/intel_gpu/src/runtime/execution_config.cpp index 8b13c23c5e4ef4..3307fa25f4ae1e 100644 --- a/src/plugins/intel_gpu/src/runtime/execution_config.cpp +++ b/src/plugins/intel_gpu/src/runtime/execution_config.cpp @@ -237,14 +237,10 @@ void ExecutionConfig::apply_user_properties(const cldnn::device_info& info) { set_property(ov::intel_gpu::queue_type(QueueTypes::in_order)); } if (!is_set_by_user(ov::hint::enable_cpu_reservation)) { - bool enable_cpu_pinning = get_property(ov::hint::enable_cpu_pinning); - if (enable_cpu_pinning) { + if (get_property(ov::hint::enable_cpu_pinning)) { set_property(ov::hint::enable_cpu_reservation(true)); } } - if (get_property(ov::hint::enable_cpu_reservation) && !get_property(ov::hint::enable_cpu_pinning)) { - set_property(ov::hint::enable_cpu_pinning(true)); - } user_properties.clear(); } From dd43e4ac3d4b99dfc97fad075734e8493d804a7e Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Tue, 12 Nov 2024 23:56:09 +0800 Subject: [PATCH 05/30] change comments --- src/inference/include/openvino/runtime/properties.hpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/inference/include/openvino/runtime/properties.hpp b/src/inference/include/openvino/runtime/properties.hpp index c714c77d6b062b..943013d219b314 100644 --- a/src/inference/include/openvino/runtime/properties.hpp +++ b/src/inference/include/openvino/runtime/properties.hpp @@ -486,7 +486,7 @@ static constexpr Property enable_cpu_pinning{"ENABLE_CPU_PINNING"}; * Cpu Reservation means reserve cpus which will not be used by other plugin. Developer can use this property to * enable or disable CPU reservation during inference on Windows and Linux. MacOS * does not support CPU reservation, and this property is always disabled. - * This property defaults to false. If it explicitly set to true, cpu_pinning defaults to true. + * This property defaults to false. * * The following code is example to use this property. * From 13a146e8bbde4c17cfb595751acd884b7e7e070f Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Wed, 13 Nov 2024 23:48:03 +0800 Subject: [PATCH 06/30] add enable_cpu_reservation to CpuExecNetworkSupportedPropertiesAreAvailable and PluginAllSupportedPropertiesAreAvailable --- .../custom/behavior/ov_executable_network/properties.cpp | 1 + .../tests/functional/custom/behavior/ov_plugin/properties.cpp | 1 + 2 files changed, 2 insertions(+) diff --git a/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_executable_network/properties.cpp b/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_executable_network/properties.cpp index 365e7c56dcef82..17add01f1490a7 100644 --- a/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_executable_network/properties.cpp +++ b/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_executable_network/properties.cpp @@ -32,6 +32,7 @@ TEST_F(OVClassConfigTestCPU, smoke_CpuExecNetworkSupportedPropertiesAreAvailable RO_property(ov::hint::execution_mode.name()), RO_property(ov::hint::num_requests.name()), RO_property(ov::hint::enable_cpu_pinning.name()), + RO_property(ov::hint::enable_cpu_reservation.name()), RO_property(ov::hint::scheduling_core_type.name()), RO_property(ov::hint::model_distribution_policy.name()), RO_property(ov::hint::enable_hyper_threading.name()), diff --git a/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_plugin/properties.cpp b/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_plugin/properties.cpp index 904d2b81dc05b6..853461e37012dd 100644 --- a/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_plugin/properties.cpp +++ b/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_plugin/properties.cpp @@ -47,6 +47,7 @@ TEST_F(OVClassConfigTestCPU, smoke_PluginAllSupportedPropertiesAreAvailable) { RW_property(ov::hint::execution_mode.name()), RW_property(ov::hint::num_requests.name()), RW_property(ov::hint::enable_cpu_pinning.name()), + RW_property(ov::hint::enable_cpu_reservation.name()), RW_property(ov::hint::scheduling_core_type.name()), RW_property(ov::hint::model_distribution_policy.name()), RW_property(ov::hint::enable_hyper_threading.name()), From 79099f0b84360803fd36272da86a34e4a9c41946 Mon Sep 17 00:00:00 2001 From: "Shen, Wanglei" Date: Wed, 4 Dec 2024 01:29:53 +0800 Subject: [PATCH 07/30] initial implementation --- .../intel_cpu/src/cpu_streams_calculation.cpp | 13 +++++++------ .../unit/streams_info/streams_info_table_test.cpp | 10 +++++----- 2 files changed, 12 insertions(+), 11 deletions(-) diff --git a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp index 0ed64d49ea68dd..9068244a12f840 100644 --- a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp +++ b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp @@ -175,11 +175,7 @@ std::vector> get_streams_info_table(const int input_streams, std::unordered_set socket_id_list(proc_type_table.size()); for (size_t i = 1; i < proc_type_table.size(); i++) { if (!socket_id_list.count(proc_type_table[i][PROC_SOCKET_ID])) { - if (proc_type_table[i][PROC_SOCKET_ID] == input_current_socket_id) { - proc_socket_table.insert(proc_socket_table.begin(), proc_type_table[i]); - } else { - proc_socket_table.push_back(proc_type_table[i]); - } + proc_socket_table.push_back(proc_type_table[i]); socket_id_list.insert(proc_type_table[i][PROC_SOCKET_ID]); } else { for (auto& row : proc_socket_table) { @@ -201,7 +197,12 @@ std::vector> get_streams_info_table(const int input_streams, ((input_streams_changed == true) && (input_streams == 1))) { n_streams = 1; stream_info[NUMBER_OF_STREAMS] = n_streams; - current_socket_id = input_current_socket_id == -1 ? get_current_socket_id() : input_current_socket_id; + for (size_t n = 0; n < proc_socket_table.size(); n++) { + if (proc_socket_table[n][ALL_PROC] > 0) { + current_socket_id = proc_socket_table[n][PROC_SOCKET_ID]; + break; + } + } if (input_threads > 0) { if (hint_model_distribution_policy.size() == 0) { for (auto& row : proc_socket_table) { diff --git a/src/plugins/intel_cpu/tests/unit/streams_info/streams_info_table_test.cpp b/src/plugins/intel_cpu/tests/unit/streams_info/streams_info_table_test.cpp index 908c8802981ab8..6f7a64c6bea24c 100644 --- a/src/plugins/intel_cpu/tests/unit/streams_info/streams_info_table_test.cpp +++ b/src/plugins/intel_cpu/tests/unit/streams_info/streams_info_table_test.cpp @@ -2575,10 +2575,10 @@ StreamsCalculationTestCase _2sockets_mock_latency_35 = { "LATENCY", {}, {{200, 100, 0, 100, -1, -1}, + {20, 10, 0, 10, 3, 3}, {80, 40, 0, 40, 0, 0}, {60, 30, 0, 30, 1, 1}, - {40, 20, 0, 20, 2, 2}, - {20, 10, 0, 10, 3, 3}}, + {40, 20, 0, 20, 2, 2}}, {{1, ALL_PROC, 20, 3, 3}, {0, MAIN_CORE_PROC, 10, 3, 3}, {0, HYPER_THREADING_PROC, 10, 3, 3}}, }; StreamsCalculationTestCase _2sockets_mock_latency_36 = { @@ -2591,10 +2591,10 @@ StreamsCalculationTestCase _2sockets_mock_latency_36 = { "LATENCY", {}, {{200, 100, 0, 100, -1, -1}, + {20, 10, 0, 10, 3, 3}, {80, 40, 0, 40, 0, 0}, {60, 30, 0, 30, 1, 1}, - {40, 20, 0, 20, 2, 2}, - {20, 10, 0, 10, 3, 3}}, + {40, 20, 0, 20, 2, 2}}, {{1, ALL_PROC, 20, 3, 3}, {0, MAIN_CORE_PROC, 10, 3, 3}, {0, HYPER_THREADING_PROC, 10, 3, 3}}, }; StreamsCalculationTestCase _2sockets_mock_latency_37 = { @@ -2606,7 +2606,7 @@ StreamsCalculationTestCase _2sockets_mock_latency_37 = { 1, "LATENCY", {ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL}, - {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 0, 0}, {24, 24, 0, 0, 1, 1}}, + {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 1, 1}, {24, 24, 0, 0, 0, 0}}, {{1, MAIN_CORE_PROC, 48, -1, -1}, {-1, MAIN_CORE_PROC, 24, 1, 1}, {-1, MAIN_CORE_PROC, 24, 0, 0}}, }; StreamsCalculationTestCase _2sockets_mock_latency_38 = { From b6ba3a6ec11e728cd6ddf7344ff51fcd76eab39a Mon Sep 17 00:00:00 2001 From: "Shen, Wanglei" Date: Wed, 4 Dec 2024 20:49:19 +0800 Subject: [PATCH 08/30] update current_socket_id --- .../intel_cpu/src/cpu_streams_calculation.cpp | 18 +++++++++++++----- 1 file changed, 13 insertions(+), 5 deletions(-) diff --git a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp index 9068244a12f840..2a03e69dafb646 100644 --- a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp +++ b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp @@ -169,13 +169,19 @@ std::vector> get_streams_info_table(const int input_streams, } }; + current_socket_id = input_current_socket_id == -1 ? get_current_socket_id() : input_current_socket_id; + if (proc_type_table.size() == 1) { proc_socket_table.push_back(proc_type_table[0]); } else { std::unordered_set socket_id_list(proc_type_table.size()); for (size_t i = 1; i < proc_type_table.size(); i++) { if (!socket_id_list.count(proc_type_table[i][PROC_SOCKET_ID])) { - proc_socket_table.push_back(proc_type_table[i]); + if (proc_type_table[i][PROC_SOCKET_ID] == current_socket_id) { + proc_socket_table.insert(proc_socket_table.begin(), proc_type_table[i]); + } else { + proc_socket_table.push_back(proc_type_table[i]); + } socket_id_list.insert(proc_type_table[i][PROC_SOCKET_ID]); } else { for (auto& row : proc_socket_table) { @@ -197,10 +203,12 @@ std::vector> get_streams_info_table(const int input_streams, ((input_streams_changed == true) && (input_streams == 1))) { n_streams = 1; stream_info[NUMBER_OF_STREAMS] = n_streams; - for (size_t n = 0; n < proc_socket_table.size(); n++) { - if (proc_socket_table[n][ALL_PROC] > 0) { - current_socket_id = proc_socket_table[n][PROC_SOCKET_ID]; - break; + if (proc_socket_table[0][ALL_PROC] == 0) { + for (size_t n = 0; n < proc_socket_table.size(); n++) { + if (proc_socket_table[n][ALL_PROC] > 0) { + current_socket_id = proc_socket_table[n][PROC_SOCKET_ID]; + break; + } } } if (input_threads > 0) { From 7c53ce36be6ce33a73a2c487d6fddcc11b3f950d Mon Sep 17 00:00:00 2001 From: "Shen, Wanglei" Date: Thu, 5 Dec 2024 07:01:53 +0800 Subject: [PATCH 09/30] Revert "update current_socket_id" This reverts commit b6ba3a6ec11e728cd6ddf7344ff51fcd76eab39a. --- .../intel_cpu/src/cpu_streams_calculation.cpp | 18 +++++------------- 1 file changed, 5 insertions(+), 13 deletions(-) diff --git a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp index 2a03e69dafb646..9068244a12f840 100644 --- a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp +++ b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp @@ -169,19 +169,13 @@ std::vector> get_streams_info_table(const int input_streams, } }; - current_socket_id = input_current_socket_id == -1 ? get_current_socket_id() : input_current_socket_id; - if (proc_type_table.size() == 1) { proc_socket_table.push_back(proc_type_table[0]); } else { std::unordered_set socket_id_list(proc_type_table.size()); for (size_t i = 1; i < proc_type_table.size(); i++) { if (!socket_id_list.count(proc_type_table[i][PROC_SOCKET_ID])) { - if (proc_type_table[i][PROC_SOCKET_ID] == current_socket_id) { - proc_socket_table.insert(proc_socket_table.begin(), proc_type_table[i]); - } else { - proc_socket_table.push_back(proc_type_table[i]); - } + proc_socket_table.push_back(proc_type_table[i]); socket_id_list.insert(proc_type_table[i][PROC_SOCKET_ID]); } else { for (auto& row : proc_socket_table) { @@ -203,12 +197,10 @@ std::vector> get_streams_info_table(const int input_streams, ((input_streams_changed == true) && (input_streams == 1))) { n_streams = 1; stream_info[NUMBER_OF_STREAMS] = n_streams; - if (proc_socket_table[0][ALL_PROC] == 0) { - for (size_t n = 0; n < proc_socket_table.size(); n++) { - if (proc_socket_table[n][ALL_PROC] > 0) { - current_socket_id = proc_socket_table[n][PROC_SOCKET_ID]; - break; - } + for (size_t n = 0; n < proc_socket_table.size(); n++) { + if (proc_socket_table[n][ALL_PROC] > 0) { + current_socket_id = proc_socket_table[n][PROC_SOCKET_ID]; + break; } } if (input_threads > 0) { From 9e7ed1cdd34e36af21b964781cf8d6b531595e45 Mon Sep 17 00:00:00 2001 From: "Shen, Wanglei" Date: Wed, 18 Dec 2024 20:09:46 +0800 Subject: [PATCH 10/30] initial implementation --- .../dev_api/openvino/runtime/system_conf.hpp | 7 +++ src/inference/src/system_conf.cpp | 43 +++++++++++++++++++ .../intel_cpu/src/cpu_streams_calculation.cpp | 18 ++++++++ .../intel_cpu/src/cpu_streams_calculation.hpp | 8 ++++ 4 files changed, 76 insertions(+) diff --git a/src/inference/dev_api/openvino/runtime/system_conf.hpp b/src/inference/dev_api/openvino/runtime/system_conf.hpp index bebc2014ab8028..fbb0fafb376fbf 100644 --- a/src/inference/dev_api/openvino/runtime/system_conf.hpp +++ b/src/inference/dev_api/openvino/runtime/system_conf.hpp @@ -219,6 +219,13 @@ OPENVINO_RUNTIME_API std::vector> get_proc_type_table(); */ OPENVINO_RUNTIME_API int get_current_socket_id(); +/** + * @brief Returns the numa node ID in cpu mapping table of the currently running thread. + * @ingroup ov_dev_api_system_conf + * @return numa node ID in cpu mapping + */ +OPENVINO_RUNTIME_API int get_current_numa_node_id(); + /** * @brief Returns a table of original number of processor types without filtering other plugins occupying CPU * resources. The difference from get_proc_type_table: This is used to get the configuration of current machine. For diff --git a/src/inference/src/system_conf.cpp b/src/inference/src/system_conf.cpp index 3227b1a3034903..8d1804e980b2c6 100644 --- a/src/inference/src/system_conf.cpp +++ b/src/inference/src/system_conf.cpp @@ -261,6 +261,10 @@ int get_current_socket_id() { return 0; } +int get_current_numa_node_id() { + return 0; +} + std::vector> get_proc_type_table() { return {{-1}}; } @@ -322,6 +326,10 @@ int get_current_socket_id() { return 0; } +int get_current_numa_node_id() { + return 0; +} + std::vector> get_proc_type_table() { CPU& cpu = cpu_info(); std::lock_guard lock{cpu._cpu_mutex}; @@ -411,8 +419,43 @@ int get_current_socket_id() { return 0; } + +int get_current_numa_node_id() { + CPU& cpu = cpu_info(); + int cur_processor_id = sched_getcpu(); + + for (auto& row : cpu._cpu_mapping_table) { + if (cur_processor_id == row[CPU_MAP_PROCESSOR_ID]) { + return row[CPU_MAP_NUMA_NODE_ID]; + } + } + + return 0; +} # else int get_current_socket_id() { + CPU& cpu = cpu_info(); + int cur_processor_id = GetCurrentProcessorNumber(); + + for (auto& row : cpu._cpu_mapping_table) { + if (cur_processor_id == row[CPU_MAP_PROCESSOR_ID]) { + return row[CPU_MAP_SOCKET_ID]; + } + } + + return 0; +} + +int get_current_numa_node_id() { + CPU& cpu = cpu_info(); + int cur_processor_id = GetCurrentProcessorNumber();; + + for (auto& row : cpu._cpu_mapping_table) { + if (cur_processor_id == row[CPU_MAP_PROCESSOR_ID]) { + return row[CPU_MAP_NUMA_NODE_ID]; + } + } + return 0; } # endif diff --git a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp index 3af6a52d5f3342..c0cddf96da725d 100644 --- a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp +++ b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp @@ -27,6 +27,19 @@ using namespace ov::threading; namespace ov { namespace intel_cpu { +void sort_table_by_numa_node_id(const int current_numa_node, std::vector>& proc_type_table) { + if (proc_type_table.size() > 1) { + for (size_t i = 1; i < proc_type_table.size(); i++) { + if (current_numa_node == proc_type_table[i][PROC_NUMA_NODE_ID]) { + std::rotate(proc_type_table.begin() + 1, proc_type_table.begin() + i, proc_type_table.end()); + break; + } + } + } + + return; +}; + std::vector> get_streams_info_table( const int input_streams, const bool input_streams_changed, @@ -683,6 +696,11 @@ std::vector> generate_stream_info(const int streams, model_prefer_threads = get_model_prefer_threads(streams, proc_type_table, model, config); } + if (proc_type_table.size() > 1) { + const auto cur_numa_node_id = get_current_numa_node_id(); + sort_table_by_numa_node_id(cur_numa_node_id, proc_type_table); + } + auto streams_info_table = get_streams_info_table(config.streams, config.streamsChanged, config.threads, diff --git a/src/plugins/intel_cpu/src/cpu_streams_calculation.hpp b/src/plugins/intel_cpu/src/cpu_streams_calculation.hpp index 0a0b4a1449b7cb..e472b838b1272c 100644 --- a/src/plugins/intel_cpu/src/cpu_streams_calculation.hpp +++ b/src/plugins/intel_cpu/src/cpu_streams_calculation.hpp @@ -109,5 +109,13 @@ std::vector> generate_stream_info(const int streams, */ void get_num_streams(const int streams, const std::shared_ptr& model, Config& config); +/** + * @brief Sort proc_type_table by numa node id on which application is running. The numa node will move to first + * row. + * @param[in] current_numa_node numa node ID on which application is running. + * @param[in] proc_type_table summary table of number of processors per type + */ +void sort_table_by_numa_node_id(const int current_numa_node, std::vector>& proc_type_table); + } // namespace intel_cpu } // namespace ov From 5cdfc10224e1d9790bb5a6ad2884c3c637965afb Mon Sep 17 00:00:00 2001 From: "Shen, Wanglei" Date: Thu, 19 Dec 2024 01:31:54 +0800 Subject: [PATCH 11/30] refactor streams calculation --- src/inference/src/os/cpu_map_info.hpp | 32 --- src/inference/src/os/lin/lin_system_conf.cpp | 5 - src/inference/src/os/win/win_system_conf.cpp | 5 - .../unit/cpu_map_parser/update_proc_table.cpp | 173 --------------- .../intel_cpu/src/cpu_streams_calculation.cpp | 14 +- .../intel_cpu/src/cpu_streams_calculation.hpp | 7 +- .../unit/streams_info/streams_e2e_test.cpp | 4 +- .../streams_info/streams_info_table_test.cpp | 208 +----------------- .../streams_info/update_proc_table_test.cpp | 72 ++++++ 9 files changed, 85 insertions(+), 435 deletions(-) delete mode 100644 src/inference/tests/unit/cpu_map_parser/update_proc_table.cpp create mode 100644 src/plugins/intel_cpu/tests/unit/streams_info/update_proc_table_test.cpp diff --git a/src/inference/src/os/cpu_map_info.hpp b/src/inference/src/os/cpu_map_info.hpp index 2cc6cef768d68d..1182ea4c974e01 100644 --- a/src/inference/src/os/cpu_map_info.hpp +++ b/src/inference/src/os/cpu_map_info.hpp @@ -54,38 +54,6 @@ class CPU { std::mutex _cpu_mutex; int _socket_idx = 0; -private: - /** - * @brief Sort proc_type_table by CPU ID on which application is running. The numa node containing this CPU ID - * will move to first row. - * @param[in] _processor_id CPU ID on which application is running. - * @param[in] _proc_type_table summary table of number of processors per type - * @param[in] _cpu_mapping_table CPU mapping table for each processor - * @return - */ - void sort_table_by_cpu_id(const int _processor_id, - std::vector>& _proc_type_table, - const std::vector>& _cpu_mapping_table) { - int current_numa_node = 0; - int current_socket = 0; - - for (auto& row : _cpu_mapping_table) { - if (_processor_id == row[CPU_MAP_PROCESSOR_ID]) { - current_numa_node = row[CPU_MAP_NUMA_NODE_ID]; - current_socket = row[CPU_MAP_SOCKET_ID]; - break; - } - } - for (size_t i = 1; i < _proc_type_table.size(); i++) { - if ((current_numa_node == _proc_type_table[i][PROC_NUMA_NODE_ID]) && - (current_socket == _proc_type_table[i][PROC_SOCKET_ID])) { - std::rotate(_proc_type_table.begin() + 1, _proc_type_table.begin() + i, _proc_type_table.end()); - break; - } - } - }; - - friend class LinuxSortProcTableTests; }; CPU& cpu_info(); diff --git a/src/inference/src/os/lin/lin_system_conf.cpp b/src/inference/src/os/lin/lin_system_conf.cpp index f8bd16173b8fce..e30bcbbe8bc55e 100644 --- a/src/inference/src/os/lin/lin_system_conf.cpp +++ b/src/inference/src/os/lin/lin_system_conf.cpp @@ -282,11 +282,6 @@ CPU::CPU() { OPENVINO_THROW("CPU affinity check failed. No CPU is eligible to run inference."); }; - if (_proc_type_table.size() > 1) { - int cur_processor_id = sched_getcpu(); - sort_table_by_cpu_id(cur_processor_id, _proc_type_table, _cpu_mapping_table); - } - _org_proc_type_table = _proc_type_table; cpu_debug(); diff --git a/src/inference/src/os/win/win_system_conf.cpp b/src/inference/src/os/win/win_system_conf.cpp index 97831207df73d5..504ab0e8e9d925 100644 --- a/src/inference/src/os/win/win_system_conf.cpp +++ b/src/inference/src/os/win/win_system_conf.cpp @@ -52,11 +52,6 @@ CPU::CPU() { } } - if (_proc_type_table.size() > 1) { - int cur_processor_id = GetCurrentProcessorNumber(); - sort_table_by_cpu_id(cur_processor_id, _proc_type_table, _cpu_mapping_table); - } - cpu_debug(); } diff --git a/src/inference/tests/unit/cpu_map_parser/update_proc_table.cpp b/src/inference/tests/unit/cpu_map_parser/update_proc_table.cpp deleted file mode 100644 index fe255b85f47a33..00000000000000 --- a/src/inference/tests/unit/cpu_map_parser/update_proc_table.cpp +++ /dev/null @@ -1,173 +0,0 @@ -// Copyright (C) 2018-2024 Intel Corporation -// SPDX-License-Identifier: Apache-2.0 -// - -#include - -#include "common_test_utils/test_common.hpp" -#include "openvino/runtime/system_conf.hpp" -#include "os/cpu_map_info.hpp" - -using namespace testing; - -namespace ov { - -#ifdef __linux__ - -struct LinuxSortProcTableTestCase { - int current_processor_id; - std::vector> _proc_type_table_input; - std::vector> _cpu_mapping_table; - std::vector> _proc_type_table_output; -}; - -class LinuxSortProcTableTests : public ov::test::TestsCommon, - public testing::WithParamInterface> { -public: - void SetUp() override { - const auto& test_data = std::get<0>(GetParam()); - - CPU& cpu = cpu_info(); - std::vector> test_proc_type_table = test_data._proc_type_table_input; - - cpu.sort_table_by_cpu_id(test_data.current_processor_id, test_proc_type_table, test_data._cpu_mapping_table); - - ASSERT_EQ(test_proc_type_table, test_data._proc_type_table_output); - } -}; - -LinuxSortProcTableTestCase proc_table_2sockets_24cores_hyperthreading_1 = { - 2, - {{48, 24, 0, 24, -1, -1}, {12, 6, 0, 6, 0, 0}, {12, 6, 0, 6, 1, 0}, {12, 6, 0, 6, 2, 1}, {12, 6, 0, 6, 3, 1}}, - { - {0, 0, 0, 0, HYPER_THREADING_PROC, 0, -1}, {1, 2, 1, 12, HYPER_THREADING_PROC, 12, -1}, - {2, 0, 0, 1, HYPER_THREADING_PROC, 1, -1}, {3, 2, 1, 13, HYPER_THREADING_PROC, 13, -1}, - {4, 0, 0, 2, HYPER_THREADING_PROC, 2, -1}, {5, 2, 1, 14, HYPER_THREADING_PROC, 14, -1}, - {6, 0, 0, 3, HYPER_THREADING_PROC, 3, -1}, {7, 2, 1, 15, HYPER_THREADING_PROC, 15, -1}, - {8, 0, 0, 4, HYPER_THREADING_PROC, 4, -1}, {9, 2, 1, 16, HYPER_THREADING_PROC, 16, -1}, - {10, 0, 0, 5, HYPER_THREADING_PROC, 5, -1}, {11, 2, 1, 17, HYPER_THREADING_PROC, 17, -1}, - {12, 1, 0, 6, HYPER_THREADING_PROC, 6, -1}, {13, 3, 1, 18, HYPER_THREADING_PROC, 18, -1}, - {14, 1, 0, 7, HYPER_THREADING_PROC, 7, -1}, {15, 3, 1, 19, HYPER_THREADING_PROC, 19, -1}, - {16, 1, 0, 8, HYPER_THREADING_PROC, 8, -1}, {17, 3, 1, 20, HYPER_THREADING_PROC, 20, -1}, - {18, 1, 0, 9, HYPER_THREADING_PROC, 9, -1}, {19, 3, 1, 21, HYPER_THREADING_PROC, 21, -1}, - {20, 1, 0, 10, HYPER_THREADING_PROC, 10, -1}, {21, 3, 1, 22, HYPER_THREADING_PROC, 22, -1}, - {22, 1, 0, 11, HYPER_THREADING_PROC, 11, -1}, {23, 3, 1, 23, HYPER_THREADING_PROC, 23, -1}, - {24, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, {25, 2, 1, 12, MAIN_CORE_PROC, 12, -1}, - {26, 0, 0, 1, MAIN_CORE_PROC, 1, -1}, {27, 2, 1, 13, MAIN_CORE_PROC, 13, -1}, - {28, 0, 0, 2, MAIN_CORE_PROC, 2, -1}, {29, 2, 1, 14, MAIN_CORE_PROC, 14, -1}, - {30, 0, 0, 3, MAIN_CORE_PROC, 3, -1}, {31, 2, 1, 15, MAIN_CORE_PROC, 15, -1}, - {32, 0, 0, 4, MAIN_CORE_PROC, 4, -1}, {33, 2, 1, 16, MAIN_CORE_PROC, 16, -1}, - {34, 0, 0, 5, MAIN_CORE_PROC, 5, -1}, {35, 2, 1, 17, MAIN_CORE_PROC, 17, -1}, - {36, 1, 0, 6, MAIN_CORE_PROC, 6, -1}, {37, 3, 1, 18, MAIN_CORE_PROC, 18, -1}, - {38, 1, 0, 7, MAIN_CORE_PROC, 7, -1}, {39, 3, 1, 19, MAIN_CORE_PROC, 19, -1}, - {40, 1, 0, 8, MAIN_CORE_PROC, 8, -1}, {41, 3, 1, 20, MAIN_CORE_PROC, 20, -1}, - {42, 1, 0, 9, MAIN_CORE_PROC, 9, -1}, {43, 3, 1, 21, MAIN_CORE_PROC, 21, -1}, - {44, 1, 0, 10, MAIN_CORE_PROC, 10, -1}, {45, 3, 1, 22, MAIN_CORE_PROC, 22, -1}, - {46, 1, 0, 11, MAIN_CORE_PROC, 11, -1}, {47, 3, 1, 23, MAIN_CORE_PROC, 23, -1}, - }, - {{48, 24, 0, 24, -1, -1}, {12, 6, 0, 6, 0, 0}, {12, 6, 0, 6, 1, 0}, {12, 6, 0, 6, 2, 1}, {12, 6, 0, 6, 3, 1}}, -}; -LinuxSortProcTableTestCase proc_table_2sockets_24cores_hyperthreading_2 = { - 16, - {{48, 24, 0, 24, -1, -1}, {12, 6, 0, 6, 0, 0}, {12, 6, 0, 6, 1, 0}, {12, 6, 0, 6, 2, 1}, {12, 6, 0, 6, 3, 1}}, - { - {0, 0, 0, 0, HYPER_THREADING_PROC, 0, -1}, {1, 2, 1, 12, HYPER_THREADING_PROC, 12, -1}, - {2, 0, 0, 1, HYPER_THREADING_PROC, 1, -1}, {3, 2, 1, 13, HYPER_THREADING_PROC, 13, -1}, - {4, 0, 0, 2, HYPER_THREADING_PROC, 2, -1}, {5, 2, 1, 14, HYPER_THREADING_PROC, 14, -1}, - {6, 0, 0, 3, HYPER_THREADING_PROC, 3, -1}, {7, 2, 1, 15, HYPER_THREADING_PROC, 15, -1}, - {8, 0, 0, 4, HYPER_THREADING_PROC, 4, -1}, {9, 2, 1, 16, HYPER_THREADING_PROC, 16, -1}, - {10, 0, 0, 5, HYPER_THREADING_PROC, 5, -1}, {11, 2, 1, 17, HYPER_THREADING_PROC, 17, -1}, - {12, 1, 0, 6, HYPER_THREADING_PROC, 6, -1}, {13, 3, 1, 18, HYPER_THREADING_PROC, 18, -1}, - {14, 1, 0, 7, HYPER_THREADING_PROC, 7, -1}, {15, 3, 1, 19, HYPER_THREADING_PROC, 19, -1}, - {16, 1, 0, 8, HYPER_THREADING_PROC, 8, -1}, {17, 3, 1, 20, HYPER_THREADING_PROC, 20, -1}, - {18, 1, 0, 9, HYPER_THREADING_PROC, 9, -1}, {19, 3, 1, 21, HYPER_THREADING_PROC, 21, -1}, - {20, 1, 0, 10, HYPER_THREADING_PROC, 10, -1}, {21, 3, 1, 22, HYPER_THREADING_PROC, 22, -1}, - {22, 1, 0, 11, HYPER_THREADING_PROC, 11, -1}, {23, 3, 1, 23, HYPER_THREADING_PROC, 23, -1}, - {24, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, {25, 2, 1, 12, MAIN_CORE_PROC, 12, -1}, - {26, 0, 0, 1, MAIN_CORE_PROC, 1, -1}, {27, 2, 1, 13, MAIN_CORE_PROC, 13, -1}, - {28, 0, 0, 2, MAIN_CORE_PROC, 2, -1}, {29, 2, 1, 14, MAIN_CORE_PROC, 14, -1}, - {30, 0, 0, 3, MAIN_CORE_PROC, 3, -1}, {31, 2, 1, 15, MAIN_CORE_PROC, 15, -1}, - {32, 0, 0, 4, MAIN_CORE_PROC, 4, -1}, {33, 2, 1, 16, MAIN_CORE_PROC, 16, -1}, - {34, 0, 0, 5, MAIN_CORE_PROC, 5, -1}, {35, 2, 1, 17, MAIN_CORE_PROC, 17, -1}, - {36, 1, 0, 6, MAIN_CORE_PROC, 6, -1}, {37, 3, 1, 18, MAIN_CORE_PROC, 18, -1}, - {38, 1, 0, 7, MAIN_CORE_PROC, 7, -1}, {39, 3, 1, 19, MAIN_CORE_PROC, 19, -1}, - {40, 1, 0, 8, MAIN_CORE_PROC, 8, -1}, {41, 3, 1, 20, MAIN_CORE_PROC, 20, -1}, - {42, 1, 0, 9, MAIN_CORE_PROC, 9, -1}, {43, 3, 1, 21, MAIN_CORE_PROC, 21, -1}, - {44, 1, 0, 10, MAIN_CORE_PROC, 10, -1}, {45, 3, 1, 22, MAIN_CORE_PROC, 22, -1}, - {46, 1, 0, 11, MAIN_CORE_PROC, 11, -1}, {47, 3, 1, 23, MAIN_CORE_PROC, 23, -1}, - }, - {{48, 24, 0, 24, -1, -1}, {12, 6, 0, 6, 1, 0}, {12, 6, 0, 6, 2, 1}, {12, 6, 0, 6, 3, 1}, {12, 6, 0, 6, 0, 0}}, -}; -LinuxSortProcTableTestCase proc_table_2sockets_24cores_hyperthreading_3 = { - 7, - {{48, 24, 0, 24, -1, -1}, {12, 6, 0, 6, 0, 0}, {12, 6, 0, 6, 1, 0}, {12, 6, 0, 6, 2, 1}, {12, 6, 0, 6, 3, 1}}, - { - {0, 0, 0, 0, HYPER_THREADING_PROC, 0, -1}, {1, 2, 1, 12, HYPER_THREADING_PROC, 12, -1}, - {2, 0, 0, 1, HYPER_THREADING_PROC, 1, -1}, {3, 2, 1, 13, HYPER_THREADING_PROC, 13, -1}, - {4, 0, 0, 2, HYPER_THREADING_PROC, 2, -1}, {5, 2, 1, 14, HYPER_THREADING_PROC, 14, -1}, - {6, 0, 0, 3, HYPER_THREADING_PROC, 3, -1}, {7, 2, 1, 15, HYPER_THREADING_PROC, 15, -1}, - {8, 0, 0, 4, HYPER_THREADING_PROC, 4, -1}, {9, 2, 1, 16, HYPER_THREADING_PROC, 16, -1}, - {10, 0, 0, 5, HYPER_THREADING_PROC, 5, -1}, {11, 2, 1, 17, HYPER_THREADING_PROC, 17, -1}, - {12, 1, 0, 6, HYPER_THREADING_PROC, 6, -1}, {13, 3, 1, 18, HYPER_THREADING_PROC, 18, -1}, - {14, 1, 0, 7, HYPER_THREADING_PROC, 7, -1}, {15, 3, 1, 19, HYPER_THREADING_PROC, 19, -1}, - {16, 1, 0, 8, HYPER_THREADING_PROC, 8, -1}, {17, 3, 1, 20, HYPER_THREADING_PROC, 20, -1}, - {18, 1, 0, 9, HYPER_THREADING_PROC, 9, -1}, {19, 3, 1, 21, HYPER_THREADING_PROC, 21, -1}, - {20, 1, 0, 10, HYPER_THREADING_PROC, 10, -1}, {21, 3, 1, 22, HYPER_THREADING_PROC, 22, -1}, - {22, 1, 0, 11, HYPER_THREADING_PROC, 11, -1}, {23, 3, 1, 23, HYPER_THREADING_PROC, 23, -1}, - {24, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, {25, 2, 1, 12, MAIN_CORE_PROC, 12, -1}, - {26, 0, 0, 1, MAIN_CORE_PROC, 1, -1}, {27, 2, 1, 13, MAIN_CORE_PROC, 13, -1}, - {28, 0, 0, 2, MAIN_CORE_PROC, 2, -1}, {29, 2, 1, 14, MAIN_CORE_PROC, 14, -1}, - {30, 0, 0, 3, MAIN_CORE_PROC, 3, -1}, {31, 2, 1, 15, MAIN_CORE_PROC, 15, -1}, - {32, 0, 0, 4, MAIN_CORE_PROC, 4, -1}, {33, 2, 1, 16, MAIN_CORE_PROC, 16, -1}, - {34, 0, 0, 5, MAIN_CORE_PROC, 5, -1}, {35, 2, 1, 17, MAIN_CORE_PROC, 17, -1}, - {36, 1, 0, 6, MAIN_CORE_PROC, 6, -1}, {37, 3, 1, 18, MAIN_CORE_PROC, 18, -1}, - {38, 1, 0, 7, MAIN_CORE_PROC, 7, -1}, {39, 3, 1, 19, MAIN_CORE_PROC, 19, -1}, - {40, 1, 0, 8, MAIN_CORE_PROC, 8, -1}, {41, 3, 1, 20, MAIN_CORE_PROC, 20, -1}, - {42, 1, 0, 9, MAIN_CORE_PROC, 9, -1}, {43, 3, 1, 21, MAIN_CORE_PROC, 21, -1}, - {44, 1, 0, 10, MAIN_CORE_PROC, 10, -1}, {45, 3, 1, 22, MAIN_CORE_PROC, 22, -1}, - {46, 1, 0, 11, MAIN_CORE_PROC, 11, -1}, {47, 3, 1, 23, MAIN_CORE_PROC, 23, -1}, - }, - {{48, 24, 0, 24, -1, -1}, {12, 6, 0, 6, 2, 1}, {12, 6, 0, 6, 3, 1}, {12, 6, 0, 6, 0, 0}, {12, 6, 0, 6, 1, 0}}, -}; -LinuxSortProcTableTestCase proc_table_2sockets_24cores_hyperthreading_4 = { - 21, - {{48, 24, 0, 24, -1, -1}, {12, 6, 0, 6, 0, 0}, {12, 6, 0, 6, 1, 0}, {12, 6, 0, 6, 2, 1}, {12, 6, 0, 6, 3, 1}}, - { - {0, 0, 0, 0, HYPER_THREADING_PROC, 0, -1}, {1, 2, 1, 12, HYPER_THREADING_PROC, 12, -1}, - {2, 0, 0, 1, HYPER_THREADING_PROC, 1, -1}, {3, 2, 1, 13, HYPER_THREADING_PROC, 13, -1}, - {4, 0, 0, 2, HYPER_THREADING_PROC, 2, -1}, {5, 2, 1, 14, HYPER_THREADING_PROC, 14, -1}, - {6, 0, 0, 3, HYPER_THREADING_PROC, 3, -1}, {7, 2, 1, 15, HYPER_THREADING_PROC, 15, -1}, - {8, 0, 0, 4, HYPER_THREADING_PROC, 4, -1}, {9, 2, 1, 16, HYPER_THREADING_PROC, 16, -1}, - {10, 0, 0, 5, HYPER_THREADING_PROC, 5, -1}, {11, 2, 1, 17, HYPER_THREADING_PROC, 17, -1}, - {12, 1, 0, 6, HYPER_THREADING_PROC, 6, -1}, {13, 3, 1, 18, HYPER_THREADING_PROC, 18, -1}, - {14, 1, 0, 7, HYPER_THREADING_PROC, 7, -1}, {15, 3, 1, 19, HYPER_THREADING_PROC, 19, -1}, - {16, 1, 0, 8, HYPER_THREADING_PROC, 8, -1}, {17, 3, 1, 20, HYPER_THREADING_PROC, 20, -1}, - {18, 1, 0, 9, HYPER_THREADING_PROC, 9, -1}, {19, 3, 1, 21, HYPER_THREADING_PROC, 21, -1}, - {20, 1, 0, 10, HYPER_THREADING_PROC, 10, -1}, {21, 3, 1, 22, HYPER_THREADING_PROC, 22, -1}, - {22, 1, 0, 11, HYPER_THREADING_PROC, 11, -1}, {23, 3, 1, 23, HYPER_THREADING_PROC, 23, -1}, - {24, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, {25, 2, 1, 12, MAIN_CORE_PROC, 12, -1}, - {26, 0, 0, 1, MAIN_CORE_PROC, 1, -1}, {27, 2, 1, 13, MAIN_CORE_PROC, 13, -1}, - {28, 0, 0, 2, MAIN_CORE_PROC, 2, -1}, {29, 2, 1, 14, MAIN_CORE_PROC, 14, -1}, - {30, 0, 0, 3, MAIN_CORE_PROC, 3, -1}, {31, 2, 1, 15, MAIN_CORE_PROC, 15, -1}, - {32, 0, 0, 4, MAIN_CORE_PROC, 4, -1}, {33, 2, 1, 16, MAIN_CORE_PROC, 16, -1}, - {34, 0, 0, 5, MAIN_CORE_PROC, 5, -1}, {35, 2, 1, 17, MAIN_CORE_PROC, 17, -1}, - {36, 1, 0, 6, MAIN_CORE_PROC, 6, -1}, {37, 3, 1, 18, MAIN_CORE_PROC, 18, -1}, - {38, 1, 0, 7, MAIN_CORE_PROC, 7, -1}, {39, 3, 1, 19, MAIN_CORE_PROC, 19, -1}, - {40, 1, 0, 8, MAIN_CORE_PROC, 8, -1}, {41, 3, 1, 20, MAIN_CORE_PROC, 20, -1}, - {42, 1, 0, 9, MAIN_CORE_PROC, 9, -1}, {43, 3, 1, 21, MAIN_CORE_PROC, 21, -1}, - {44, 1, 0, 10, MAIN_CORE_PROC, 10, -1}, {45, 3, 1, 22, MAIN_CORE_PROC, 22, -1}, - {46, 1, 0, 11, MAIN_CORE_PROC, 11, -1}, {47, 3, 1, 23, MAIN_CORE_PROC, 23, -1}, - }, - {{48, 24, 0, 24, -1, -1}, {12, 6, 0, 6, 3, 1}, {12, 6, 0, 6, 0, 0}, {12, 6, 0, 6, 1, 0}, {12, 6, 0, 6, 2, 1}}, -}; - -TEST_P(LinuxSortProcTableTests, LinuxProcTable) {} - -INSTANTIATE_TEST_SUITE_P(CPUMap, - LinuxSortProcTableTests, - testing::Values(proc_table_2sockets_24cores_hyperthreading_1, - proc_table_2sockets_24cores_hyperthreading_2, - proc_table_2sockets_24cores_hyperthreading_3, - proc_table_2sockets_24cores_hyperthreading_4)); -#endif -} // namespace ov diff --git a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp index c0cddf96da725d..23d166efb44e52 100644 --- a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp +++ b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp @@ -46,7 +46,6 @@ std::vector> get_streams_info_table( const int input_threads, const int input_infer_requests, const int model_prefer_threads, - const int input_current_socket_id, const std::string input_perf_hint, const std::set hint_model_distribution_policy, const std::vector>& proc_type_table) { @@ -189,11 +188,7 @@ std::vector> get_streams_info_table( std::unordered_set socket_id_list(proc_type_table.size()); for (size_t i = 1; i < proc_type_table.size(); i++) { if (!socket_id_list.count(proc_type_table[i][PROC_SOCKET_ID])) { - if (proc_type_table[i][PROC_SOCKET_ID] == input_current_socket_id) { - proc_socket_table.insert(proc_socket_table.begin(), proc_type_table[i]); - } else { - proc_socket_table.push_back(proc_type_table[i]); - } + proc_socket_table.push_back(proc_type_table[i]); socket_id_list.insert(proc_type_table[i][PROC_SOCKET_ID]); } else { for (auto& row : proc_socket_table) { @@ -215,7 +210,7 @@ std::vector> get_streams_info_table( ((input_streams_changed == true) && (input_streams == 1))) { n_streams = 1; stream_info[NUMBER_OF_STREAMS] = n_streams; - current_socket_id = input_current_socket_id == -1 ? get_current_socket_id() : input_current_socket_id; + current_socket_id = proc_type_table.size() == 1 ? proc_type_table[0][PROC_SOCKET_ID] : proc_type_table[1][PROC_SOCKET_ID] ; if (input_threads > 0) { if (hint_model_distribution_policy.size() == 0) { n_threads_per_stream = std::min(input_threads, proc_type_table[0][ALL_PROC]); @@ -680,7 +675,7 @@ int get_model_prefer_threads(const int num_streams, } std::vector> generate_stream_info(const int streams, - const int input_current_socket_id, + const int input_numa_node_id, const std::shared_ptr& model, Config& config, std::vector>& proc_type_table, @@ -697,7 +692,7 @@ std::vector> generate_stream_info(const int streams, } if (proc_type_table.size() > 1) { - const auto cur_numa_node_id = get_current_numa_node_id(); + const auto cur_numa_node_id = input_numa_node_id < 0 ? get_current_numa_node_id() : input_numa_node_id; sort_table_by_numa_node_id(cur_numa_node_id, proc_type_table); } @@ -706,7 +701,6 @@ std::vector> generate_stream_info(const int streams, config.threads, config.hintNumRequests, model_prefer_threads, - input_current_socket_id, ov::util::to_string(config.hintPerfMode), config.modelDistributionPolicy, proc_type_table); diff --git a/src/plugins/intel_cpu/src/cpu_streams_calculation.hpp b/src/plugins/intel_cpu/src/cpu_streams_calculation.hpp index e472b838b1272c..347e52164c6641 100644 --- a/src/plugins/intel_cpu/src/cpu_streams_calculation.hpp +++ b/src/plugins/intel_cpu/src/cpu_streams_calculation.hpp @@ -35,8 +35,6 @@ namespace intel_cpu { * function. * - input "0" indicates that the function generates the optimal number of threads per stream based on * processors type information. - * @param[in] input_current_socket_id is the socket ID in cpu mapping table of the currently running thread - * - input "-1" indicates that the function get_streams_info_table will query this id internally. * @param[in] input_perf_hint is performance hint set by user via ov::hint::performance_mode or the default value. * @param[in] hint_llm_distribution_policy is the distribution policy for Large language models * @param[in] proc_type_table is currently available candidate processors. @@ -50,7 +48,6 @@ std::vector> get_streams_info_table( const int input_threads, const int input_infer_requests, const int model_prefer_threads, - const int input_current_socket_id, const std::string input_perf_hint, const std::set hint_llm_distribution_policy, const std::vector>& proc_type_table); @@ -85,7 +82,7 @@ int get_model_prefer_threads(const int num_streams, /** * @brief Generate streams information according to processors type table * @param[in] streams number of streams - * @param[in] input_current_socket_id is the socket ID in cpu mapping table of the currently running thread + * @param[in] input_numa_node_id is the numa node ID in cpu mapping table of the currently running thread * - input "-1" indicates that the function get_streams_info_table will query this id internally. * @param[in] model graph handle * @param[in] config intel cpu configuration @@ -95,7 +92,7 @@ int get_model_prefer_threads(const int num_streams, * ov::hint::enable_hyper_threading */ std::vector> generate_stream_info(const int streams, - const int input_current_socket_id, + const int input_numa_node_id, const std::shared_ptr& model, Config& config, std::vector>& proc_type_table, diff --git a/src/plugins/intel_cpu/tests/unit/streams_info/streams_e2e_test.cpp b/src/plugins/intel_cpu/tests/unit/streams_info/streams_e2e_test.cpp index 7fd491e934f336..9242fd7fd46bc9 100644 --- a/src/plugins/intel_cpu/tests/unit/streams_info/streams_e2e_test.cpp +++ b/src/plugins/intel_cpu/tests/unit/streams_info/streams_e2e_test.cpp @@ -21,7 +21,7 @@ struct StreamGenerateionTestCase { int input_thread; int input_request; int input_model_prefer; - int input_socket_id; + int input_numa_node_id; ov::hint::SchedulingCoreType input_type; bool input_ht_value; bool input_ht_changed; @@ -65,7 +65,7 @@ class StreamGenerationTests : public ov::test::TestsCommon, cpu._proc_type_table = test_data.input_proc_type_table; auto proc_type_table = ov::intel_cpu::generate_stream_info(test_data.input_stream, - test_data.input_socket_id, + test_data.input_numa_node_id, nullptr, config, test_data.input_proc_type_table, diff --git a/src/plugins/intel_cpu/tests/unit/streams_info/streams_info_table_test.cpp b/src/plugins/intel_cpu/tests/unit/streams_info/streams_info_table_test.cpp index 7dc643c181df7e..7034cc3854c611 100644 --- a/src/plugins/intel_cpu/tests/unit/streams_info/streams_info_table_test.cpp +++ b/src/plugins/intel_cpu/tests/unit/streams_info/streams_info_table_test.cpp @@ -20,7 +20,6 @@ struct StreamsCalculationTestCase { int input_threads; int input_infer_requests; int model_prefer_threads; - int input_socket_id; std::string input_perf_hint; std::set hint_llm_distribution_policy; std::vector> proc_type_table; @@ -39,7 +38,6 @@ class StreamsCalculationTests : public ov::test::TestsCommon, test_data.input_threads, test_data.input_infer_requests, test_data.model_prefer_threads, - test_data.input_socket_id, test_data.input_perf_hint, test_data.hint_llm_distribution_policy, test_data.proc_type_table); @@ -55,7 +53,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_auto_1 = { 0, // param[in]: the number of threads in this simulation 0, // param[in]: the number of infer requests in this simulation 0, // param[in]: the model preferred number of threads in this simulation - 0, // param[in]: the current socket id of the running thread in this simulation "LATENCY", // param[in]: the performance hint in this simulation {ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL}, // param[in]: the hint of max threads per stream in this // simulation @@ -74,7 +71,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_auto_2 = { 0, 0, 0, - 0, "LATENCY", {ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL}, {{104, 104, 0, 0, -1, -1}, {52, 52, 0, 0, 0, 0}, {52, 52, 0, 0, 1, 1}}, @@ -86,7 +82,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_auto_3 = { 0, 0, 0, - 0, "LATENCY", {ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL}, {{208, 104, 0, 104, -1, -1}, @@ -108,7 +103,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_auto_4 = { 0, 0, 0, - 0, "LATENCY", {ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL}, {{104, 104, 0, 0, -1, -1}, {26, 26, 0, 0, 0, 0}, {26, 26, 0, 0, 1, 0}, {26, 26, 0, 0, 2, 1}, {26, 26, 0, 0, 3, 1}}, @@ -126,7 +120,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_platform_1 = { 0, 0, 0, - 0, "LATENCY", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -138,7 +131,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_platform_2 = { 0, 0, 0, - 0, "LATENCY", {}, {{104, 104, 0, 0, -1, -1}, {52, 52, 0, 0, 0, 0}, {52, 52, 0, 0, 1, 1}}, @@ -150,7 +142,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_platform_3 = { 0, 0, 0, - 0, "LATENCY", {}, {{208, 104, 0, 104, -1, -1}, @@ -170,7 +161,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_platform_4 = { 0, 0, 0, - 0, "LATENCY", {}, {{104, 104, 0, 0, -1, -1}, {26, 26, 0, 0, 0, 0}, {26, 26, 0, 0, 1, 0}, {26, 26, 0, 0, 2, 1}, {26, 26, 0, 0, 3, 1}}, @@ -182,7 +172,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_socket_1 = { 0, 0, 0, - 0, "LATENCY", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -194,7 +183,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_socket_2 = { 0, 0, 0, - 0, "LATENCY", {}, {{104, 104, 0, 0, -1, -1}, {52, 52, 0, 0, 0, 0}, {52, 52, 0, 0, 1, 1}}, @@ -206,7 +194,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_socket_3 = { 0, 0, 0, - 0, "LATENCY", {}, {{208, 104, 0, 104, -1, -1}, @@ -226,7 +213,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_socket_4 = { 0, 0, 0, - 0, "LATENCY", {}, {{104, 104, 0, 0, -1, -1}, {26, 26, 0, 0, 0, 0}, {26, 26, 0, 0, 1, 0}, {26, 26, 0, 0, 2, 1}, {26, 26, 0, 0, 3, 1}}, @@ -238,7 +224,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_socket_5 = { 0, 0, 0, - 0, "LATENCY", {}, {{60, 60, 0, 0, -1, -1}, {10, 10, 0, 0, 0, 0}, {10, 10, 0, 0, 1, 0}, {20, 20, 0, 0, 2, 1}, {20, 20, 0, 0, 3, 1}}, @@ -250,7 +235,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_socket_6 = { 0, 0, 0, - 0, "LATENCY", {}, {{60, 60, 0, 0, -1, -1}, {10, 10, 0, 0, 0, 0}, {20, 20, 0, 0, 1, 1}, {10, 10, 0, 0, 2, 0}, {20, 20, 0, 0, 3, 1}}, @@ -262,7 +246,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_socket_7 = { 0, 0, 0, - 0, "LATENCY", {}, {{104, 104, 0, 0, -1, -1}, {26, 26, 0, 0, 0, 0}, {26, 26, 0, 0, 1, 0}, {26, 26, 0, 0, 2, 1}, {26, 26, 0, 0, 3, 1}}, @@ -274,7 +257,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_socket_8 = { 208, 0, 0, - 0, "LATENCY", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -290,7 +272,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_socket_9 = { 104, 0, 0, - 0, "LATENCY", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -302,7 +283,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_socket_10 = { 52, 0, 0, - 0, "LATENCY", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -315,7 +295,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_1 = { 20, 0, 0, - 0, "LATENCY", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -327,7 +306,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_2 = { 20, 5, 0, - 0, "LATENCY", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -339,7 +317,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_4 = { 20, 0, 0, - 0, "LATENCY", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -351,7 +328,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_5 = { 20, 5, 0, - 0, "LATENCY", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -363,7 +339,6 @@ StreamsCalculationTestCase _2sockets_104cores_latency_6 = { 208, 0, 0, - 0, "LATENCY", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -379,7 +354,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_1 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -394,7 +368,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_2 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -411,7 +384,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_3 = { 20, 0, 0, - 0, "THROUGHPUT", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -423,7 +395,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_4 = { 20, 0, 0, - 0, "THROUGHPUT", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -435,7 +406,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_5 = { 0, 0, 1, - 0, "THROUGHPUT", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -450,7 +420,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_6 = { 0, 0, 2, - 0, "THROUGHPUT", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -465,7 +434,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_7 = { 0, 0, 8, - 0, "THROUGHPUT", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -486,7 +454,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_7_1 = { 0, 0, 8, - 0, "THROUGHPUT", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -507,7 +474,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_7_2 = { 0, 0, 4, - 0, "THROUGHPUT", {}, {{208, 104, 0, 104, -1, -1}, @@ -529,7 +495,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_8 = { 40, 0, 8, - 0, "THROUGHPUT", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -542,7 +507,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_9 = { 20, 2, 0, - 0, "THROUGHPUT", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -555,7 +519,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_10 = { 0, 2, 0, - 0, "THROUGHPUT", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -573,7 +536,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_11 = { 0, 5, 0, - 0, "THROUGHPUT", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -591,7 +553,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_12 = { 0, 2, 2, - 0, "THROUGHPUT", {}, {{208, 104, 0, 104, -1, -1}, {104, 52, 0, 52, 0, 0}, {104, 52, 0, 52, 1, 1}}, @@ -609,7 +570,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_13 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{104, 104, 0, 0, -1, -1}, {52, 52, 0, 0, 0, 0}, {52, 52, 0, 0, 1, 1}}, @@ -622,7 +582,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_14 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{104, 104, 0, 0, -1, -1}, {52, 52, 0, 0, 0, 0}, {52, 52, 0, 0, 1, 1}}, @@ -635,7 +594,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_15 = { 0, 0, 1, - 0, "THROUGHPUT", {}, {{104, 104, 0, 0, -1, -1}, {52, 52, 0, 0, 0, 0}, {52, 52, 0, 0, 1, 1}}, @@ -648,7 +606,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_16 = { 0, 0, 2, - 0, "THROUGHPUT", {}, {{104, 104, 0, 0, -1, -1}, {52, 52, 0, 0, 0, 0}, {52, 52, 0, 0, 1, 1}}, @@ -661,7 +618,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_17 = { 0, 0, 8, - 0, "THROUGHPUT", {}, {{104, 104, 0, 0, -1, -1}, {52, 52, 0, 0, 0, 0}, {52, 52, 0, 0, 1, 1}}, @@ -678,7 +634,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_18 = { 0, 2, 0, - 0, "THROUGHPUT", {}, {{104, 104, 0, 0, -1, -1}, {52, 52, 0, 0, 0, 0}, {52, 52, 0, 0, 1, 1}}, @@ -691,7 +646,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_19 = { 0, 5, 0, - 0, "THROUGHPUT", {}, {{104, 104, 0, 0, -1, -1}, {52, 52, 0, 0, 0, 0}, {52, 52, 0, 0, 1, 1}}, @@ -704,7 +658,6 @@ StreamsCalculationTestCase _2sockets_104cores_tput_20 = { 0, 2, 2, - 0, "THROUGHPUT", {}, {{104, 104, 0, 0, -1, -1}, {52, 52, 0, 0, 0, 0}, {52, 52, 0, 0, 1, 1}}, @@ -717,7 +670,6 @@ StreamsCalculationTestCase _2sockets_48cores_latency_1 = { 0, 0, 0, - 0, "LATENCY", {}, {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 0, 0}, {24, 24, 0, 0, 1, 1}}, @@ -729,7 +681,6 @@ StreamsCalculationTestCase _2sockets_48cores_latency_2 = { 0, 0, 0, - 0, "LATENCY", {}, {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 0, 0}, {24, 24, 0, 0, 1, 1}}, @@ -741,7 +692,6 @@ StreamsCalculationTestCase _2sockets_48cores_latency_3 = { 96, 0, 0, - 0, "LATENCY", {}, {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 0, 0}, {24, 24, 0, 0, 1, 1}}, @@ -753,7 +703,6 @@ StreamsCalculationTestCase _2sockets_48cores_tput_1 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 0, 0}, {24, 24, 0, 0, 1, 1}}, @@ -766,7 +715,6 @@ StreamsCalculationTestCase _2sockets_48cores_tput_2 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 0, 0}, {24, 24, 0, 0, 1, 1}}, @@ -779,7 +727,6 @@ StreamsCalculationTestCase _2sockets_48cores_tput_3 = { 100, 0, 0, - 0, "THROUGHPUT", {}, {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 0, 0}, {24, 24, 0, 0, 1, 1}}, @@ -792,7 +739,6 @@ StreamsCalculationTestCase _2sockets_48cores_tput_4 = { 20, 0, 1, - 0, "THROUGHPUT", {}, {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 0, 0}, {24, 24, 0, 0, 1, 1}}, @@ -805,7 +751,6 @@ StreamsCalculationTestCase _2sockets_20cores_tput_1 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{20, 20, 0, 0, -1, -1}, {10, 10, 0, 0, 0, 0}, {10, 10, 0, 0, 1, 1}}, @@ -818,7 +763,6 @@ StreamsCalculationTestCase _1sockets_14cores_latency_1 = { 0, 0, 0, - 0, "LATENCY", {}, {{14, 6, 8, 0, 0, 0}}, @@ -831,7 +775,6 @@ StreamsCalculationTestCase _1sockets_14cores_latency_2 = { 10, 0, 0, - 0, "LATENCY", {}, {{20, 6, 8, 6, 0, 0}}, @@ -844,7 +787,6 @@ StreamsCalculationTestCase _1sockets_14cores_latency_3 = { 0, 0, 6, - 0, "LATENCY", {}, {{20, 6, 8, 6, 0, 0}}, @@ -857,7 +799,6 @@ StreamsCalculationTestCase _1sockets_14cores_latency_4 = { 0, 0, 14, - 0, "LATENCY", {}, {{20, 6, 8, 6, 0, 0}}, @@ -873,7 +814,6 @@ StreamsCalculationTestCase _1sockets_14cores_latency_5 = { 0, 2, 14, - 0, "LATENCY", {}, {{20, 6, 8, 6, 0, 0}}, @@ -889,7 +829,6 @@ StreamsCalculationTestCase _1sockets_14cores_latency_6 = { 0, 0, 0, - 0, "LATENCY", {}, {{20, 6, 8, 6, 0, 0}}, @@ -905,7 +844,6 @@ StreamsCalculationTestCase _1sockets_14cores_latency_7 = { 0, 0, 6, - 0, "LATENCY", {}, {{14, 6, 8, 0, 0, 0}}, @@ -918,7 +856,6 @@ StreamsCalculationTestCase _1sockets_14cores_latency_8 = { 0, 0, 14, - 0, "LATENCY", {}, {{14, 6, 8, 0, 0, 0}}, @@ -931,7 +868,6 @@ StreamsCalculationTestCase _1sockets_14cores_latency_9 = { 0, 2, 14, - 0, "LATENCY", {}, {{14, 6, 8, 0, 0, 0}}, @@ -944,7 +880,6 @@ StreamsCalculationTestCase _1sockets_14cores_latency_10 = { 0, 0, 0, - 0, "LATENCY", {}, {{14, 6, 8, 0, 0, 0}}, @@ -957,7 +892,6 @@ StreamsCalculationTestCase _1sockets_14cores_latency_11 = { 10, 0, 0, - 0, "LATENCY", {}, {{20, 6, 8, 6, 0, 0}}, @@ -970,7 +904,6 @@ StreamsCalculationTestCase _1sockets_14cores_latency_12 = { 0, 0, 6, - 0, "LATENCY", {}, {{20, 6, 8, 6, 0, 0}}, @@ -983,7 +916,6 @@ StreamsCalculationTestCase _1sockets_14cores_latency_13 = { 0, 0, 14, - 0, "LATENCY", {}, {{20, 6, 8, 6, 0, 0}}, @@ -999,7 +931,6 @@ StreamsCalculationTestCase _1sockets_14cores_latency_14 = { 0, 2, 14, - 0, "LATENCY", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1015,7 +946,6 @@ StreamsCalculationTestCase _1sockets_14cores_latency_15 = { 0, 0, 0, - 0, "LATENCY", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1031,7 +961,6 @@ StreamsCalculationTestCase _1sockets_14cores_latency_16 = { 0, 0, 6, - 0, "LATENCY", {}, {{14, 6, 8, 0, 0, 0}}, @@ -1044,7 +973,6 @@ StreamsCalculationTestCase _1sockets_14cores_latency_17 = { 0, 0, 14, - 0, "LATENCY", {}, {{14, 6, 8, 0, 0, 0}}, @@ -1057,7 +985,6 @@ StreamsCalculationTestCase _1sockets_14cores_latency_18 = { 0, 2, 14, - 0, "LATENCY", {}, {{14, 6, 8, 0, 0, 0}}, @@ -1070,7 +997,6 @@ StreamsCalculationTestCase _1sockets_14cores_tput_1 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1083,7 +1009,6 @@ StreamsCalculationTestCase _1sockets_14cores_tput_2 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1096,7 +1021,6 @@ StreamsCalculationTestCase _1sockets_14cores_tput_3 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1109,7 +1033,6 @@ StreamsCalculationTestCase _1sockets_14cores_tput_4 = { 12, 0, 0, - 0, "THROUGHPUT", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1122,7 +1045,6 @@ StreamsCalculationTestCase _1sockets_14cores_tput_5 = { 0, 0, 1, - 0, "THROUGHPUT", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1135,7 +1057,6 @@ StreamsCalculationTestCase _1sockets_14cores_tput_6 = { 0, 0, 2, - 0, "THROUGHPUT", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1148,7 +1069,6 @@ StreamsCalculationTestCase _1sockets_14cores_tput_7 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1161,7 +1081,6 @@ StreamsCalculationTestCase _1sockets_14cores_tput_8 = { 100, 0, 0, - 0, "THROUGHPUT", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1174,7 +1093,6 @@ StreamsCalculationTestCase _1sockets_14cores_tput_9 = { 0, 8, 0, - 0, "THROUGHPUT", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1187,7 +1105,6 @@ StreamsCalculationTestCase _1sockets_14cores_tput_10 = { 0, 4, 0, - 0, "THROUGHPUT", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1200,7 +1117,6 @@ StreamsCalculationTestCase _1sockets_14cores_tput_11 = { 0, 2, 0, - 0, "THROUGHPUT", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1213,7 +1129,6 @@ StreamsCalculationTestCase _1sockets_14cores_tput_12 = { 0, 2, 2, - 0, "THROUGHPUT", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1226,7 +1141,6 @@ StreamsCalculationTestCase _1sockets_14cores_tput_13 = { 1, 0, 1, - 0, "THROUGHPUT", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1239,7 +1153,6 @@ StreamsCalculationTestCase _1sockets_14cores_tput_14 = { 9, 0, 1, - 0, "THROUGHPUT", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1252,7 +1165,6 @@ StreamsCalculationTestCase _1sockets_14cores_tput_15 = { 12, 0, 1, - 0, "THROUGHPUT", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1265,7 +1177,6 @@ StreamsCalculationTestCase _1sockets_14cores_tput_16 = { 15, 0, 1, - 0, "THROUGHPUT", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1278,7 +1189,6 @@ StreamsCalculationTestCase _1sockets_14cores_tput_17 = { 14, 0, 6, - 0, "LATENCY", {}, {{20, 6, 8, 6, 0, 0}}, @@ -1291,7 +1201,6 @@ StreamsCalculationTestCase _1sockets_10cores_latency_1 = { 0, 0, 0, - 0, "LATENCY", {}, {{12, 2, 8, 2, 0, 0}}, @@ -1307,7 +1216,6 @@ StreamsCalculationTestCase _1sockets_10cores_latency_2 = { 8, 0, 0, - 0, "LATENCY", {}, {{12, 2, 8, 2, 0, 0}}, @@ -1320,7 +1228,6 @@ StreamsCalculationTestCase _1sockets_10cores_latency_3 = { 0, 0, 2, - 0, "LATENCY", {}, {{12, 2, 8, 2, 0, 0}}, @@ -1333,7 +1240,6 @@ StreamsCalculationTestCase _1sockets_10cores_latency_4 = { 0, 0, 10, - 0, "LATENCY", {}, {{12, 2, 8, 2, 0, 0}}, @@ -1349,7 +1255,6 @@ StreamsCalculationTestCase _1sockets_10cores_latency_5 = { 0, 0, 0, - 0, "LATENCY", {}, {{10, 2, 8, 0, 0, 0}}, @@ -1362,7 +1267,6 @@ StreamsCalculationTestCase _1sockets_10cores_latency_6 = { 0, 0, 2, - 0, "LATENCY", {}, {{10, 2, 8, 0, 0, 0}}, @@ -1375,7 +1279,6 @@ StreamsCalculationTestCase _1sockets_10cores_latency_7 = { 0, 0, 10, - 0, "LATENCY", {}, {{10, 2, 8, 0, 0, 0}}, @@ -1388,7 +1291,6 @@ StreamsCalculationTestCase _1sockets_10cores_tput_1 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{12, 2, 8, 2, 0, 0}}, @@ -1401,7 +1303,6 @@ StreamsCalculationTestCase _1sockets_10cores_tput_2 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{12, 2, 8, 2, 0, 0}}, @@ -1414,7 +1315,6 @@ StreamsCalculationTestCase _1sockets_10cores_tput_3 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{12, 2, 8, 2, 0, 0}}, @@ -1427,7 +1327,6 @@ StreamsCalculationTestCase _1sockets_10cores_tput_4 = { 6, 0, 0, - 0, "THROUGHPUT", {}, {{12, 2, 8, 2, 0, 0}}, @@ -1440,7 +1339,6 @@ StreamsCalculationTestCase _1sockets_10cores_tput_5 = { 0, 0, 1, - 0, "THROUGHPUT", {}, {{12, 2, 8, 2, 0, 0}}, @@ -1453,7 +1351,6 @@ StreamsCalculationTestCase _1sockets_10cores_tput_6 = { 0, 0, 2, - 0, "THROUGHPUT", {}, {{12, 2, 8, 2, 0, 0}}, @@ -1466,7 +1363,6 @@ StreamsCalculationTestCase _1sockets_8cores_latency_1 = { 0, 0, 0, - 0, "LATENCY", {}, {{12, 4, 4, 4, 0, 0}}, @@ -1482,7 +1378,6 @@ StreamsCalculationTestCase _1sockets_8cores_latency_2 = { 100, 0, 0, - 0, "LATENCY", {}, {{12, 4, 4, 4, 0, 0}}, @@ -1498,7 +1393,6 @@ StreamsCalculationTestCase _1sockets_8cores_latency_3 = { 0, 0, 4, - 0, "LATENCY", {}, {{12, 4, 4, 4, 0, 0}}, @@ -1511,7 +1405,6 @@ StreamsCalculationTestCase _1sockets_8cores_latency_4 = { 0, 0, 8, - 0, "LATENCY", {}, {{12, 4, 4, 4, 0, 0}}, @@ -1527,7 +1420,6 @@ StreamsCalculationTestCase _1sockets_8cores_latency_5 = { 0, 0, 0, - 0, "LATENCY", {}, {{8, 4, 4, 0, 0, 0}}, @@ -1540,7 +1432,6 @@ StreamsCalculationTestCase _1sockets_8cores_latency_6 = { 0, 0, 4, - 0, "LATENCY", {}, {{8, 4, 4, 0, 0, 0}}, @@ -1553,7 +1444,6 @@ StreamsCalculationTestCase _1sockets_8cores_latency_7 = { 0, 0, 8, - 0, "LATENCY", {}, {{8, 4, 4, 0, 0, 0}}, @@ -1566,7 +1456,6 @@ StreamsCalculationTestCase _1sockets_8cores_tput_1 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{12, 4, 4, 4, 0, 0}}, @@ -1579,7 +1468,6 @@ StreamsCalculationTestCase _1sockets_8cores_tput_2 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{12, 4, 4, 4, 0, 0}}, @@ -1592,7 +1480,6 @@ StreamsCalculationTestCase _1sockets_8cores_tput_3 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{12, 4, 4, 4, 0, 0}}, @@ -1605,7 +1492,6 @@ StreamsCalculationTestCase _1sockets_8cores_tput_4 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{12, 4, 4, 4, 0, 0}}, @@ -1618,7 +1504,6 @@ StreamsCalculationTestCase _1sockets_8cores_tput_5 = { 6, 0, 0, - 0, "THROUGHPUT", {}, {{12, 4, 4, 4, 0, 0}}, @@ -1631,7 +1516,6 @@ StreamsCalculationTestCase _1sockets_8cores_tput_6 = { 8, 0, 0, - 0, "THROUGHPUT", {}, {{12, 4, 4, 4, 0, 0}}, @@ -1644,7 +1528,6 @@ StreamsCalculationTestCase _1sockets_8cores_tput_7 = { 0, 0, 1, - 0, "THROUGHPUT", {}, {{12, 4, 4, 4, 0, 0}}, @@ -1657,7 +1540,6 @@ StreamsCalculationTestCase _1sockets_8cores_tput_8 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{8, 4, 4, 0, 0, 0}}, @@ -1670,7 +1552,6 @@ StreamsCalculationTestCase _1sockets_6cores_latency_1 = { 0, 0, 0, - 0, "LATENCY", {}, {{12, 6, 0, 6, 0, 0}}, @@ -1683,7 +1564,6 @@ StreamsCalculationTestCase _1sockets_6cores_latency_2 = { 100, 0, 0, - 0, "LATENCY", {}, {{12, 6, 0, 6, 0, 0}}, @@ -1696,7 +1576,6 @@ StreamsCalculationTestCase _1sockets_6cores_latency_3 = { 0, 0, 0, - 0, "LATENCY", {}, {{6, 6, 0, 0, 0, 0}}, @@ -1709,7 +1588,6 @@ StreamsCalculationTestCase _1sockets_6cores_tput_1 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{12, 6, 0, 6, 0, 0}}, @@ -1722,7 +1600,6 @@ StreamsCalculationTestCase _1sockets_6cores_tput_2 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{12, 6, 0, 6, 0, 0}}, @@ -1735,7 +1612,6 @@ StreamsCalculationTestCase _1sockets_6cores_tput_3 = { 8, 0, 0, - 0, "THROUGHPUT", {}, {{12, 6, 0, 6, 0, 0}}, @@ -1748,7 +1624,6 @@ StreamsCalculationTestCase _1sockets_6cores_tput_4 = { 0, 0, 1, - 0, "THROUGHPUT", {}, {{12, 6, 0, 6, 0, 0}}, @@ -1761,7 +1636,6 @@ StreamsCalculationTestCase _1sockets_4cores_latency_1 = { 0, 0, 0, - 0, "LATENCY", {}, {{4, 4, 0, 0, 0, 0}}, @@ -1774,7 +1648,6 @@ StreamsCalculationTestCase _1sockets_4cores_tput_1 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{4, 4, 0, 0, 0, 0}}, @@ -1787,7 +1660,6 @@ StreamsCalculationTestCase _1sockets_4cores_tput_2 = { 0, 0, 8, - -1, "THROUGHPUT", {}, {{4, 4, 0, 0, 0, 0}}, @@ -1800,7 +1672,6 @@ StreamsCalculationTestCase _1sockets_4cores_tput_3 = { 0, 0, 8, - -1, "THROUGHPUT", {}, {{4, 4, 0, 0, 0, 0}}, @@ -1813,7 +1684,6 @@ StreamsCalculationTestCase _1sockets_ecores_latency_1 = { 0, 0, 0, - 0, "LATENCY", {}, {{16, 0, 16, 0, 0, 0}}, @@ -1826,7 +1696,6 @@ StreamsCalculationTestCase _1sockets_ecores_latency_2 = { 4, 0, 0, - 0, "LATENCY", {}, {{16, 0, 16, 0, 0, 0}}, @@ -1839,7 +1708,6 @@ StreamsCalculationTestCase _1sockets_ecores_latency_3 = { 0, 4, 0, - 0, "LATENCY", {}, {{16, 0, 16, 0, 0, 0}}, @@ -1852,7 +1720,6 @@ StreamsCalculationTestCase _1sockets_ecores_latency_4 = { 0, 0, 4, - 0, "LATENCY", {}, {{16, 0, 16, 0, 0, 0}}, @@ -1865,7 +1732,6 @@ StreamsCalculationTestCase _1sockets_ecores_tput_1 = { 0, 0, 1, - 0, "THROUGHPUT", {}, {{16, 0, 16, 0, 0, 0}}, @@ -1878,7 +1744,6 @@ StreamsCalculationTestCase _1sockets_ecores_tput_2 = { 0, 0, 4, - 0, "THROUGHPUT", {}, {{16, 0, 16, 0, 0, 0}}, @@ -1891,7 +1756,6 @@ StreamsCalculationTestCase _1sockets_ecores_tput_3 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{16, 0, 16, 0, 0, 0}}, @@ -1904,7 +1768,6 @@ StreamsCalculationTestCase _1sockets_ecores_tput_4 = { 0, 4, 0, - 0, "THROUGHPUT", {}, {{16, 0, 16, 0, 0, 0}}, @@ -1917,7 +1780,6 @@ StreamsCalculationTestCase _1sockets_ecores_tput_5 = { 0, 0, 4, - 0, "THROUGHPUT", {}, {{16, 0, 16, 0, 0, 0}}, @@ -1930,7 +1792,6 @@ StreamsCalculationTestCase _1sockets_mock_tput_1 = { 15, 0, 1, - 0, "THROUGHPUT", {}, {{20, 6, 7, 6, 0, 0}}, @@ -1943,7 +1804,6 @@ StreamsCalculationTestCase _1sockets_mock_tput_2 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{27, 27, 0, 0, -1, -1}, {19, 19, 0, 0, 0, 0}, {8, 8, 0, 0, 1, 1}}, @@ -1956,7 +1816,6 @@ StreamsCalculationTestCase _1sockets_mock_tput_3 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{19, 19, 0, 0, -1, -1}, {11, 11, 0, 0, 0, 0}, {8, 8, 0, 0, 1, 1}}, @@ -1969,7 +1828,6 @@ StreamsCalculationTestCase _1sockets_mock_tput_4 = { 0, 0, 0, - 0, "THROUGHPUT", {}, {{8, 8, 0, 0, 0, 0}}, @@ -1982,7 +1840,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_1 = { 20, 0, 0, - 0, "LATENCY", {}, {{60, 60, 0, 0, -1, -1}, {10, 10, 0, 0, 0, 0}, {20, 20, 0, 0, 1, 0}, {10, 10, 0, 0, 2, 1}, {20, 20, 0, 0, 3, 1}}, @@ -1994,7 +1851,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_2 = { 0, 0, 0, - 1, "LATENCY", {}, {{60, 60, 0, 0, -1, -1}, {20, 20, 0, 0, 1, 1}, {40, 40, 0, 0, 0, 0}}, @@ -2006,7 +1862,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_3 = { 0, 0, 0, - 1, "THROUGHPUT", {}, {{60, 60, 0, 0, -1, -1}, {20, 20, 0, 0, 1, 1}, {40, 40, 0, 0, 0, 0}}, @@ -2018,7 +1873,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_4 = { 10, 0, 0, - 1, "LATENCY", {}, {{60, 60, 0, 0, -1, -1}, {20, 20, 0, 0, 1, 1}, {40, 40, 0, 0, 0, 0}}, @@ -2030,7 +1884,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_5 = { 50, 0, 0, - 1, "LATENCY", {}, {{60, 60, 0, 0, -1, -1}, {20, 20, 0, 0, 1, 1}, {40, 40, 0, 0, 0, 0}}, @@ -2042,7 +1895,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_6 = { 0, 0, 0, - 1, "LATENCY", {}, {{60, 0, 60, 0, -1, -1}, {20, 0, 20, 0, 1, 1}, {40, 0, 40, 0, 0, 0}}, @@ -2054,7 +1906,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_7 = { 0, 0, 0, - 1, "THROUGHPUT", {}, {{60, 0, 60, 0, -1, -1}, {20, 0, 20, 0, 1, 1}, {40, 0, 40, 0, 0, 0}}, @@ -2066,7 +1917,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_8 = { 10, 0, 0, - 1, "LATENCY", {}, {{60, 0, 60, 0, -1, -1}, {20, 0, 20, 0, 1, 1}, {40, 0, 40, 0, 0, 0}}, @@ -2078,7 +1928,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_9 = { 50, 0, 0, - 1, "LATENCY", {}, {{60, 0, 60, 0, -1, -1}, {20, 0, 20, 0, 1, 1}, {40, 0, 40, 0, 0, 0}}, @@ -2090,7 +1939,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_10 = { 0, 0, 0, - 1, "LATENCY", {}, {{60, 30, 0, 30, -1, -1}, {20, 10, 0, 10, 1, 1}, {40, 20, 0, 20, 0, 0}}, @@ -2102,7 +1950,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_11 = { 0, 0, 0, - 1, "THROUGHPUT", {}, {{60, 30, 0, 30, -1, -1}, {20, 10, 0, 10, 1, 1}, {40, 20, 0, 20, 0, 0}}, @@ -2114,7 +1961,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_12 = { 15, 0, 0, - 1, "LATENCY", {}, {{60, 30, 0, 30, -1, -1}, {20, 10, 0, 10, 1, 1}, {40, 20, 0, 20, 0, 0}}, @@ -2126,7 +1972,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_13 = { 50, 0, 0, - 1, "LATENCY", {}, {{60, 30, 0, 30, -1, -1}, {20, 10, 0, 10, 1, 1}, {40, 20, 0, 20, 0, 0}}, @@ -2142,7 +1987,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_14 = { 0, 0, 0, - 3, "LATENCY", {}, {{200, 100, 0, 100, -1, -1}, @@ -2158,7 +2002,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_15 = { 0, 0, 0, - 3, "THROUGHPUT", {}, {{200, 100, 0, 100, -1, -1}, @@ -2174,7 +2017,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_16 = { 15, 0, 0, - 3, "LATENCY", {}, {{200, 100, 0, 100, -1, -1}, @@ -2190,7 +2032,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_17 = { 50, 0, 0, - 3, "LATENCY", {}, {{200, 100, 0, 100, -1, -1}, @@ -2209,7 +2050,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_18 = { 0, 0, 0, - 6, "LATENCY", {}, {{440, 220, 0, 220, -1, -1}, @@ -2229,7 +2069,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_19 = { 0, 0, 0, - 6, "THROUGHPUT", {}, {{440, 220, 0, 220, -1, -1}, @@ -2249,7 +2088,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_20 = { 25, 0, 0, - 6, "LATENCY", {}, {{440, 220, 0, 220, -1, -1}, @@ -2269,7 +2107,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_21 = { 50, 0, 0, - 6, "LATENCY", {}, {{440, 220, 0, 220, -1, -1}, @@ -2292,7 +2129,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_22 = { 0, 0, 0, - 0, "LATENCY", {ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL}, {{60, 30, 0, 30, -1, -1}, {40, 20, 0, 20, 0, 0}, {20, 10, 0, 10, 1, 1}}, @@ -2310,7 +2146,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_23 = { 0, 0, 0, - 0, "LATENCY", {}, {{60, 30, 0, 30, -1, -1}, {40, 20, 0, 20, 0, 0}, {20, 10, 0, 10, 1, 1}}, @@ -2322,7 +2157,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_24 = { 0, 0, 0, - 0, "LATENCY", {}, {{60, 30, 0, 30, -1, -1}, {40, 20, 0, 20, 0, 0}, {20, 10, 0, 10, 1, 1}}, @@ -2334,7 +2168,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_25 = { 0, 0, 0, - 0, "LATENCY", {ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL}, {{200, 100, 0, 100, -1, -1}, @@ -2355,7 +2188,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_26 = { 0, 0, 0, - 0, "LATENCY", {}, {{200, 100, 0, 100, -1, -1}, @@ -2375,7 +2207,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_27 = { 0, 0, 0, - 0, "LATENCY", {}, {{200, 100, 0, 100, -1, -1}, @@ -2395,7 +2226,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_28 = { 200, 0, 0, - 0, "LATENCY", {ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL}, {{200, 100, 0, 100, -1, -1}, @@ -2416,7 +2246,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_29 = { 200, 0, 0, - 0, "LATENCY", {}, {{200, 100, 0, 100, -1, -1}, @@ -2440,7 +2269,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_31 = { 140, 0, 0, - 0, "LATENCY", {ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL}, {{200, 100, 0, 100, -1, -1}, @@ -2461,7 +2289,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_32 = { 70, 0, 0, - 0, "LATENCY", {}, {{200, 100, 0, 100, -1, -1}, @@ -2477,7 +2304,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_33 = { 20, 0, 0, - 0, "LATENCY", {}, {{200, 100, 0, 100, -1, -1}, @@ -2493,7 +2319,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_34 = { 0, 0, 0, - 0, "LATENCY", {ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL}, {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 0, 0}, {24, 24, 0, 0, 1, 1}}, @@ -2505,7 +2330,6 @@ StreamsCalculationTestCase _1sockets_mock_latency_1 = { 0, 0, 14, - 0, "LATENCY", {ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL}, {{14, 6, 8, 0, 0, 0}}, @@ -2517,7 +2341,6 @@ StreamsCalculationTestCase _1sockets_mock_latency_2 = { 0, 0, 6, - 0, "LATENCY", {ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL}, {{14, 6, 8, 0, 0, 0}}, @@ -2529,7 +2352,6 @@ StreamsCalculationTestCase _1sockets_mock_latency_3 = { 0, 0, 14, - 0, "LATENCY", {}, {{14, 6, 8, 0, 0, 0}}, @@ -2541,7 +2363,6 @@ StreamsCalculationTestCase _1sockets_mock_latency_4 = { 0, 0, 6, - 0, "LATENCY", {}, {{14, 6, 8, 0, 0, 0}}, @@ -2553,7 +2374,6 @@ StreamsCalculationTestCase _1sockets_mock_latency_5 = { 0, 0, 14, - 0, "LATENCY", {}, {{14, 6, 8, 0, 0, 0}}, @@ -2565,7 +2385,6 @@ StreamsCalculationTestCase _1sockets_mock_latency_6 = { 0, 0, 6, - 0, "LATENCY", {}, {{14, 6, 8, 0, 0, 0}}, @@ -2577,14 +2396,13 @@ StreamsCalculationTestCase _2sockets_mock_latency_35 = { 200, 0, 0, - 3, "LATENCY", {}, {{200, 100, 0, 100, -1, -1}, + {20, 10, 0, 10, 3, 3}, {80, 40, 0, 40, 0, 0}, {60, 30, 0, 30, 1, 1}, - {40, 20, 0, 20, 2, 2}, - {20, 10, 0, 10, 3, 3}}, + {40, 20, 0, 20, 2, 2}}, {{1, ALL_PROC, 200, -1, -1}, {0, MAIN_CORE_PROC, 10, 3, 3}, {0, HYPER_THREADING_PROC, 10, 3, 3}, @@ -2601,14 +2419,13 @@ StreamsCalculationTestCase _2sockets_mock_latency_36 = { 200, 0, 0, - 3, "LATENCY", {}, {{200, 100, 0, 100, -1, -1}, + {20, 10, 0, 10, 3, 3}, {80, 40, 0, 40, 0, 0}, {60, 30, 0, 30, 1, 1}, - {40, 20, 0, 20, 2, 2}, - {20, 10, 0, 10, 3, 3}}, + {40, 20, 0, 20, 2, 2}}, {{1, ALL_PROC, 200, -1, -1}, {0, MAIN_CORE_PROC, 10, 3, 3}, {0, HYPER_THREADING_PROC, 10, 3, 3}, @@ -2625,10 +2442,9 @@ StreamsCalculationTestCase _2sockets_mock_latency_37 = { 0, 0, 0, - 1, "LATENCY", {ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL}, - {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 0, 0}, {24, 24, 0, 0, 1, 1}}, + {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 1, 1}, {24, 24, 0, 0, 0, 0}}, {{1, MAIN_CORE_PROC, 48, -1, -1}, {-1, MAIN_CORE_PROC, 24, 1, 1}, {-1, MAIN_CORE_PROC, 24, 0, 0}}, }; StreamsCalculationTestCase _2sockets_mock_latency_38 = { @@ -2637,7 +2453,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_38 = { 0, 0, 0, - 0, "LATENCY", {ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL}, {{256, 128, 0, 128, 0, 0}, @@ -2653,7 +2468,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_39 = { 0, 0, 0, - 0, "LATENCY", {}, {{104, 104, 0, 0, -1, -1}, {26, 26, 0, 0, 0, 0}, {26, 26, 0, 0, 1, 0}, {26, 26, 0, 0, 2, 1}, {26, 26, 0, 0, 3, 1}}, @@ -2665,7 +2479,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_40 = { 0, 0, 0, - 0, "LATENCY", {}, {{104, 104, 0, 0, -1, -1}, {26, 26, 0, 0, 1, 0}, {26, 26, 0, 0, 2, 1}, {26, 26, 0, 0, 3, 1}, {26, 26, 0, 0, 0, 0}}, @@ -2677,7 +2490,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_41 = { 0, 0, 0, - 1, "LATENCY", {}, {{104, 104, 0, 0, -1, -1}, {26, 26, 0, 0, 2, 1}, {26, 26, 0, 0, 3, 1}, {26, 26, 0, 0, 0, 0}, {26, 26, 0, 0, 1, 0}}, @@ -2689,7 +2501,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_42 = { 0, 0, 0, - 1, "LATENCY", {}, {{104, 104, 0, 0, -1, -1}, {26, 26, 0, 0, 3, 1}, {26, 26, 0, 0, 0, 0}, {26, 26, 0, 0, 1, 0}, {26, 26, 0, 0, 2, 1}}, @@ -2701,7 +2512,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_43 = { 0, 0, 0, - 0, "LATENCY", {}, {{208, 104, 0, 104, -1, -1}, @@ -2721,7 +2531,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_44 = { 0, 0, 0, - 1, "LATENCY", {}, {{208, 104, 0, 104, -1, -1}, @@ -2741,7 +2550,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_45 = { 0, 0, 0, - 0, "LATENCY", {}, {{208, 208, 0, 0, -1, -1}, {52, 52, 0, 0, 0, 0}, {52, 52, 0, 0, 1, 0}, {52, 52, 0, 0, 2, 1}, {52, 52, 0, 0, 3, 1}}, @@ -2753,7 +2561,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_46 = { 0, 0, 0, - 1, "LATENCY", {}, {{208, 208, 0, 0, -1, -1}, {52, 52, 0, 0, 2, 1}, {52, 52, 0, 0, 3, 1}, {52, 52, 0, 0, 0, 0}, {52, 52, 0, 0, 1, 0}}, @@ -2765,7 +2572,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_47 = { 0, 0, 0, - 0, "LATENCY", {}, {{416, 208, 0, 208, -1, -1}, @@ -2785,7 +2591,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_48 = { 0, 0, 0, - 1, "LATENCY", {}, {{416, 208, 0, 208, -1, -1}, @@ -2805,7 +2610,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_49 = { 80, 0, 0, - 1, "LATENCY", {}, {{416, 208, 0, 208, -1, -1}, @@ -2823,7 +2627,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_50 = { 80, 0, 0, - 1, "LATENCY", {}, {{208, 208, 0, 0, -1, -1}, {52, 52, 0, 0, 2, 1}, {52, 52, 0, 0, 3, 1}, {52, 52, 0, 0, 0, 0}, {52, 52, 0, 0, 1, 0}}, @@ -2835,7 +2638,6 @@ StreamsCalculationTestCase _2sockets_mock_latency_51 = { 16, 0, 0, - 0, "LATENCY", {}, {{16, 16, 0, 0, -1, -1}, {8, 8, 0, 0, 0, 0}, {8, 8, 0, 0, 1, 1}}, diff --git a/src/plugins/intel_cpu/tests/unit/streams_info/update_proc_table_test.cpp b/src/plugins/intel_cpu/tests/unit/streams_info/update_proc_table_test.cpp new file mode 100644 index 00000000000000..08c0cf2c9089e9 --- /dev/null +++ b/src/plugins/intel_cpu/tests/unit/streams_info/update_proc_table_test.cpp @@ -0,0 +1,72 @@ +// Copyright (C) 2018-2024 Intel Corporation +// SPDX-License-Identifier: Apache-2.0 +// + +#include + +#include "common_test_utils/test_common.hpp" +#include "cpu_streams_calculation.hpp" + +using namespace testing; + +namespace ov { + +namespace intel_cpu { + +struct LinuxSortProcTableTestCase { + int current_numa_node_id; + std::vector> _proc_type_table_input; + std::vector> _proc_type_table_output; +}; + +class LinuxSortProcTableTests : public ov::test::TestsCommon, + public testing::WithParamInterface> { +public: + void SetUp() override { + const auto& test_data = std::get<0>(GetParam()); + + std::vector> test_proc_type_table = test_data._proc_type_table_input; + + sort_table_by_numa_node_id(test_data.current_numa_node_id, test_proc_type_table); + + ASSERT_EQ(test_proc_type_table, test_data._proc_type_table_output); + } +}; + +LinuxSortProcTableTestCase proc_table_2sockets_24cores_hyperthreading_1 = { + 0, + {{48, 24, 0, 24, -1, -1}, {12, 6, 0, 6, 0, 0}, {12, 6, 0, 6, 1, 0}, {12, 6, 0, 6, 2, 1}, {12, 6, 0, 6, 3, 1}}, + {{48, 24, 0, 24, -1, -1}, {12, 6, 0, 6, 0, 0}, {12, 6, 0, 6, 1, 0}, {12, 6, 0, 6, 2, 1}, {12, 6, 0, 6, 3, 1}}, +}; +LinuxSortProcTableTestCase proc_table_2sockets_24cores_hyperthreading_2 = { + 1, + {{48, 24, 0, 24, -1, -1}, {12, 6, 0, 6, 0, 0}, {12, 6, 0, 6, 1, 0}, {12, 6, 0, 6, 2, 1}, {12, 6, 0, 6, 3, 1}}, + {{48, 24, 0, 24, -1, -1}, {12, 6, 0, 6, 1, 0}, {12, 6, 0, 6, 2, 1}, {12, 6, 0, 6, 3, 1}, {12, 6, 0, 6, 0, 0}}, +}; +LinuxSortProcTableTestCase proc_table_2sockets_24cores_hyperthreading_3 = { + 2, + {{48, 24, 0, 24, -1, -1}, {12, 6, 0, 6, 0, 0}, {12, 6, 0, 6, 1, 0}, {12, 6, 0, 6, 2, 1}, {12, 6, 0, 6, 3, 1}}, + {{48, 24, 0, 24, -1, -1}, {12, 6, 0, 6, 2, 1}, {12, 6, 0, 6, 3, 1}, {12, 6, 0, 6, 0, 0}, {12, 6, 0, 6, 1, 0}}, +}; +LinuxSortProcTableTestCase proc_table_2sockets_24cores_hyperthreading_4 = { + 3, + {{48, 24, 0, 24, -1, -1}, {12, 6, 0, 6, 0, 0}, {12, 6, 0, 6, 1, 0}, {12, 6, 0, 6, 2, 1}, {12, 6, 0, 6, 3, 1}}, + {{48, 24, 0, 24, -1, -1}, {12, 6, 0, 6, 3, 1}, {12, 6, 0, 6, 0, 0}, {12, 6, 0, 6, 1, 0}, {12, 6, 0, 6, 2, 1}}, +}; +LinuxSortProcTableTestCase proc_table_1sockets_mock = { + 3, + {{48, 24, 0, 24, 0, 0}}, + {{48, 24, 0, 24, 0, 0}}, +}; + +TEST_P(LinuxSortProcTableTests, UpdateProcTable) {} + +INSTANTIATE_TEST_SUITE_P(UpdateProcTableList, + LinuxSortProcTableTests, + testing::Values(proc_table_2sockets_24cores_hyperthreading_1, + proc_table_2sockets_24cores_hyperthreading_2, + proc_table_2sockets_24cores_hyperthreading_3, + proc_table_2sockets_24cores_hyperthreading_4, + proc_table_1sockets_mock)); +} // namespace intel_cpu +} // namespace ov From e68486452befa411bafb0d766550ae637e240480 Mon Sep 17 00:00:00 2001 From: "Shen, Wanglei" Date: Thu, 19 Dec 2024 02:11:45 +0800 Subject: [PATCH 12/30] fix code style issue --- src/inference/src/system_conf.cpp | 2 +- src/plugins/intel_cpu/src/cpu_streams_calculation.cpp | 3 ++- 2 files changed, 3 insertions(+), 2 deletions(-) diff --git a/src/inference/src/system_conf.cpp b/src/inference/src/system_conf.cpp index 8d1804e980b2c6..09db44dc70cc1a 100644 --- a/src/inference/src/system_conf.cpp +++ b/src/inference/src/system_conf.cpp @@ -448,7 +448,7 @@ int get_current_socket_id() { int get_current_numa_node_id() { CPU& cpu = cpu_info(); - int cur_processor_id = GetCurrentProcessorNumber();; + int cur_processor_id = GetCurrentProcessorNumber(); for (auto& row : cpu._cpu_mapping_table) { if (cur_processor_id == row[CPU_MAP_PROCESSOR_ID]) { diff --git a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp index 23d166efb44e52..06de0341be927e 100644 --- a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp +++ b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp @@ -210,7 +210,8 @@ std::vector> get_streams_info_table( ((input_streams_changed == true) && (input_streams == 1))) { n_streams = 1; stream_info[NUMBER_OF_STREAMS] = n_streams; - current_socket_id = proc_type_table.size() == 1 ? proc_type_table[0][PROC_SOCKET_ID] : proc_type_table[1][PROC_SOCKET_ID] ; + current_socket_id = + proc_type_table.size() == 1 ? proc_type_table[0][PROC_SOCKET_ID] : proc_type_table[1][PROC_SOCKET_ID]; if (input_threads > 0) { if (hint_model_distribution_policy.size() == 0) { n_threads_per_stream = std::min(input_threads, proc_type_table[0][ALL_PROC]); From d1f50d277753a609fd8f3849750852a8ab6b959c Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Tue, 24 Dec 2024 04:27:09 +0800 Subject: [PATCH 13/30] set cpu_pinning yes if user only set cpu_reservation yes --- src/plugins/intel_cpu/src/cpu_map_scheduling.cpp | 3 ++- src/plugins/intel_cpu/src/cpu_map_scheduling.hpp | 2 ++ src/plugins/intel_cpu/src/cpu_streams_calculation.cpp | 8 +++++--- .../tests/unit/streams_info/cpu_pinning_test.cpp | 1 + src/plugins/intel_gpu/src/runtime/execution_config.cpp | 5 +++++ 5 files changed, 15 insertions(+), 4 deletions(-) diff --git a/src/plugins/intel_cpu/src/cpu_map_scheduling.cpp b/src/plugins/intel_cpu/src/cpu_map_scheduling.cpp index 450180d837c661..55db84c7583f7c 100644 --- a/src/plugins/intel_cpu/src/cpu_map_scheduling.cpp +++ b/src/plugins/intel_cpu/src/cpu_map_scheduling.cpp @@ -72,6 +72,7 @@ std::vector> apply_hyper_threading(bool& input_ht_hint, bool get_cpu_pinning(bool& input_value, const bool input_changed, + const bool cpu_reservation, const std::vector>& proc_type_table, const std::vector>& streams_info_table) { bool result_value; @@ -90,7 +91,7 @@ bool get_cpu_pinning(bool& input_value, if ((streams_info_table[0][PROC_TYPE] == ALL_PROC) && (streams_info_table[1][PROC_TYPE] != EFFICIENT_CORE_PROC) && (streams_info_table[2][PROC_TYPE] == EFFICIENT_CORE_PROC)) { - result_value = false; + result_value = cpu_reservation; } } } diff --git a/src/plugins/intel_cpu/src/cpu_map_scheduling.hpp b/src/plugins/intel_cpu/src/cpu_map_scheduling.hpp index 9004647cd41e9f..c3889626eb99dd 100644 --- a/src/plugins/intel_cpu/src/cpu_map_scheduling.hpp +++ b/src/plugins/intel_cpu/src/cpu_map_scheduling.hpp @@ -44,12 +44,14 @@ std::vector> apply_hyper_threading(bool& input_ht_hint, * @brief whether pinning cpu cores according to enableCpuPinning property * @param[in] input_type indicate value of property enableCpuPinning. * @param[in] input_changed indicate if value is set by user. + * @param[in] cpu_reservation indicate if cpu need to be reserved * @param[in] proc_type_table indicate processors information of this platform * @param[in] streams_info_table indicate streams detail of this model * @return whether pinning threads to cpu cores */ bool get_cpu_pinning(bool& input_value, const bool input_changed, + const bool cpu_reservation, const std::vector>& proc_type_table, const std::vector>& streams_info_table); diff --git a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp index b9b21c652b9584..5cf819d72f4daf 100644 --- a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp +++ b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp @@ -693,15 +693,17 @@ std::vector> generate_stream_info(const int streams, ov::util::to_string(config.hintPerfMode), config.modelDistributionPolicy, proc_type_table); - // streams_info_table = {{1, 1, 56, 1, 1}, {-1, 1, 28, 1, 1}, {-1, 1, 28, 0, 0}}; if (config.modelDistributionPolicy.find(ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL) != config.modelDistributionPolicy.end()) { config.streamsRankTable = get_streams_rank_table(streams_info_table, config.streamsRankLevel, config.numSubStreams); } - auto cpu_pinning = - get_cpu_pinning(config.enableCpuPinning, config.changedCpuPinning, proc_type_table, streams_info_table); + auto cpu_pinning = get_cpu_pinning(config.enableCpuPinning, + config.changedCpuPinning, + config.enableCpuReservation, + proc_type_table, + streams_info_table); config.streamExecutorConfig = IStreamsExecutor::Config{"CPUStreamsExecutor", config.streams, diff --git a/src/plugins/intel_cpu/tests/unit/streams_info/cpu_pinning_test.cpp b/src/plugins/intel_cpu/tests/unit/streams_info/cpu_pinning_test.cpp index edbf4314dbf6ec..4a72ec8d7b2d94 100644 --- a/src/plugins/intel_cpu/tests/unit/streams_info/cpu_pinning_test.cpp +++ b/src/plugins/intel_cpu/tests/unit/streams_info/cpu_pinning_test.cpp @@ -29,6 +29,7 @@ class CpuPinningTests : public ov::test::TestsCommon, auto test_output = ov::intel_cpu::get_cpu_pinning(test_data.input_cpu_pinning, test_data.input_changed, + false, test_data.input_proc_type_table, test_data.input_stream_info_table); diff --git a/src/plugins/intel_gpu/src/runtime/execution_config.cpp b/src/plugins/intel_gpu/src/runtime/execution_config.cpp index a1773ca635546d..befb0974ec95b3 100644 --- a/src/plugins/intel_gpu/src/runtime/execution_config.cpp +++ b/src/plugins/intel_gpu/src/runtime/execution_config.cpp @@ -254,6 +254,11 @@ void ExecutionConfig::apply_user_properties(const cldnn::device_info& info) { set_property(ov::hint::enable_cpu_reservation(true)); } } + if (get_property(ov::hint::enable_cpu_reservation)) { + if (!is_set_by_user(ov::hint::enable_cpu_pinning)) { + set_property(ov::hint::enable_cpu_pinning(true)); + } + } // Enable KV-cache compression by default for non-systolic platforms if (!is_set_by_user(ov::hint::kv_cache_precision) && !info.supports_immad) { From bd4a1321365b4e42b6fcd1e1b10f936be15b6696 Mon Sep 17 00:00:00 2001 From: "Shen, Wanglei" Date: Wed, 25 Dec 2024 00:32:23 +0800 Subject: [PATCH 14/30] update for cpu reservation --- src/plugins/intel_cpu/src/cpu_streams_calculation.cpp | 8 ++++++-- 1 file changed, 6 insertions(+), 2 deletions(-) diff --git a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp index 06de0341be927e..9cd77b053064e2 100644 --- a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp +++ b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp @@ -210,8 +210,12 @@ std::vector> get_streams_info_table( ((input_streams_changed == true) && (input_streams == 1))) { n_streams = 1; stream_info[NUMBER_OF_STREAMS] = n_streams; - current_socket_id = - proc_type_table.size() == 1 ? proc_type_table[0][PROC_SOCKET_ID] : proc_type_table[1][PROC_SOCKET_ID]; + for (size_t n = 0; n < proc_socket_table.size(); n++) { + if (proc_socket_table[n][ALL_PROC] > 0) { + current_socket_id = proc_socket_table[n][PROC_SOCKET_ID]; + break; + } + } if (input_threads > 0) { if (hint_model_distribution_policy.size() == 0) { n_threads_per_stream = std::min(input_threads, proc_type_table[0][ALL_PROC]); From 93fcb21364ecaea1ac0a528bc7a6598a5358afed Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Tue, 24 Dec 2024 18:29:05 +0800 Subject: [PATCH 15/30] revert pr27873 --- .../intel_cpu/src/cpu_streams_calculation.cpp | 13 ++++++------- .../unit/streams_info/streams_info_table_test.cpp | 10 +++++----- 2 files changed, 11 insertions(+), 12 deletions(-) diff --git a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp index b6d8f8acd3c235..f044376c5d4d74 100644 --- a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp +++ b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp @@ -176,7 +176,11 @@ std::vector> get_streams_info_table( std::unordered_set socket_id_list(proc_type_table.size()); for (size_t i = 1; i < proc_type_table.size(); i++) { if (!socket_id_list.count(proc_type_table[i][PROC_SOCKET_ID])) { - proc_socket_table.push_back(proc_type_table[i]); + if (proc_type_table[i][PROC_SOCKET_ID] == input_current_socket_id) { + proc_socket_table.insert(proc_socket_table.begin(), proc_type_table[i]); + } else { + proc_socket_table.push_back(proc_type_table[i]); + } socket_id_list.insert(proc_type_table[i][PROC_SOCKET_ID]); } else { for (auto& row : proc_socket_table) { @@ -198,12 +202,7 @@ std::vector> get_streams_info_table( ((input_streams_changed == true) && (input_streams == 1))) { n_streams = 1; stream_info[NUMBER_OF_STREAMS] = n_streams; - for (size_t n = 0; n < proc_socket_table.size(); n++) { - if (proc_socket_table[n][ALL_PROC] > 0) { - current_socket_id = proc_socket_table[n][PROC_SOCKET_ID]; - break; - } - } + current_socket_id = input_current_socket_id == -1 ? get_current_socket_id() : input_current_socket_id; if (input_threads > 0) { if (hint_model_distribution_policy.size() == 0) { for (auto& row : proc_socket_table) { diff --git a/src/plugins/intel_cpu/tests/unit/streams_info/streams_info_table_test.cpp b/src/plugins/intel_cpu/tests/unit/streams_info/streams_info_table_test.cpp index 44eeb3ae26d90b..57f9f5c5d72a14 100644 --- a/src/plugins/intel_cpu/tests/unit/streams_info/streams_info_table_test.cpp +++ b/src/plugins/intel_cpu/tests/unit/streams_info/streams_info_table_test.cpp @@ -2591,10 +2591,10 @@ StreamsCalculationTestCase _2sockets_mock_latency_35 = { "LATENCY", {}, {{200, 100, 0, 100, -1, -1}, - {20, 10, 0, 10, 3, 3}, {80, 40, 0, 40, 0, 0}, {60, 30, 0, 30, 1, 1}, - {40, 20, 0, 20, 2, 2}}, + {40, 20, 0, 20, 2, 2}, + {20, 10, 0, 10, 3, 3}}, {{1, ALL_PROC, 20, 3, 3}, {0, MAIN_CORE_PROC, 10, 3, 3}, {0, HYPER_THREADING_PROC, 10, 3, 3}}, }; StreamsCalculationTestCase _2sockets_mock_latency_36 = { @@ -2607,10 +2607,10 @@ StreamsCalculationTestCase _2sockets_mock_latency_36 = { "LATENCY", {}, {{200, 100, 0, 100, -1, -1}, - {20, 10, 0, 10, 3, 3}, {80, 40, 0, 40, 0, 0}, {60, 30, 0, 30, 1, 1}, - {40, 20, 0, 20, 2, 2}}, + {40, 20, 0, 20, 2, 2}, + {20, 10, 0, 10, 3, 3}}, {{1, ALL_PROC, 20, 3, 3}, {0, MAIN_CORE_PROC, 10, 3, 3}, {0, HYPER_THREADING_PROC, 10, 3, 3}}, }; StreamsCalculationTestCase _2sockets_mock_latency_37 = { @@ -2622,7 +2622,7 @@ StreamsCalculationTestCase _2sockets_mock_latency_37 = { 1, "LATENCY", {ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL}, - {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 1, 1}, {24, 24, 0, 0, 0, 0}}, + {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 0, 0}, {24, 24, 0, 0, 1, 1}}, {{1, MAIN_CORE_PROC, 48, -1, -1}, {-1, MAIN_CORE_PROC, 24, 1, 1}, {-1, MAIN_CORE_PROC, 24, 0, 0}}, }; StreamsCalculationTestCase _2sockets_mock_latency_38 = { From 8cc37b11de6793e860766ead1677be23b36fa91a Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Fri, 3 Jan 2025 11:32:25 +0800 Subject: [PATCH 16/30] add enable_cpu_reservation condition in creating executor --- src/plugins/intel_gpu/src/plugin/compiled_model.cpp | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/src/plugins/intel_gpu/src/plugin/compiled_model.cpp b/src/plugins/intel_gpu/src/plugin/compiled_model.cpp index 9f699537004732..d2ef14106e2277 100644 --- a/src/plugins/intel_gpu/src/plugin/compiled_model.cpp +++ b/src/plugins/intel_gpu/src/plugin/compiled_model.cpp @@ -25,7 +25,9 @@ std::shared_ptr create_task_executor(const std::sh // exclusive_async_requests essentially disables the streams (and hence should be checked first) => aligned with // the CPU behavior return plugin->get_executor_manager()->get_executor("GPU"); - } else if (config.get_property(ov::hint::enable_cpu_pinning)) { + } else if (config.get_property(ov::hint::enable_cpu_pinning) || + config.get_property(ov::hint::enable_cpu_reservation)) { + bool enable_cpu_pinning = config.get_property(ov::hint::enable_cpu_pinning); bool enable_cpu_reservation = config.get_property(ov::hint::enable_cpu_reservation); return std::make_shared( ov::threading::IStreamsExecutor::Config{"Intel GPU plugin executor", @@ -33,7 +35,7 @@ std::shared_ptr create_task_executor(const std::sh 1, ov::hint::SchedulingCoreType::PCORE_ONLY, enable_cpu_reservation, - true}); + enable_cpu_pinning}); } else { return std::make_shared( ov::threading::IStreamsExecutor::Config{"Intel GPU plugin executor", config.get_property(ov::num_streams)}); From 34b1afffa7e01d36cbec393edc69fd0a3ff8d9f1 Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Mon, 6 Jan 2025 16:39:39 +0800 Subject: [PATCH 17/30] update pinning in windows --- src/plugins/intel_cpu/src/cpu_map_scheduling.cpp | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/src/plugins/intel_cpu/src/cpu_map_scheduling.cpp b/src/plugins/intel_cpu/src/cpu_map_scheduling.cpp index 55db84c7583f7c..b135194068e83c 100644 --- a/src/plugins/intel_cpu/src/cpu_map_scheduling.cpp +++ b/src/plugins/intel_cpu/src/cpu_map_scheduling.cpp @@ -80,7 +80,11 @@ bool get_cpu_pinning(bool& input_value, #if defined(__APPLE__) result_value = false; #elif defined(_WIN32) - result_value = ((input_changed) && (proc_type_table.size() == 1)) ? input_value : false; + if (proc_type_table.size() == 1) { + result_value = input_changed ? input_value : cpu_reservation; + } else { + result_value = false; + } #else if (input_changed) { result_value = input_value; From f3bcc0cbec1bbbe24dc4bbfff004b040b8fb68a0 Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Fri, 10 Jan 2025 15:20:41 +0800 Subject: [PATCH 18/30] add lock to guarantee thread safity --- .../cpu-device.rst | 1 + .../runtime/threading/istreams_executor.hpp | 18 +- .../include/openvino/runtime/properties.hpp | 7 +- .../src/dev/threading/istreams_executor.cpp | 27 +- .../intel_cpu/src/cpu_streams_calculation.cpp | 12 +- .../unit/streams_info/streams_e2e_test.cpp | 1281 ++++++++++++++++- 6 files changed, 1313 insertions(+), 33 deletions(-) diff --git a/docs/articles_en/openvino-workflow/running-inference/inference-devices-and-modes/cpu-device.rst b/docs/articles_en/openvino-workflow/running-inference/inference-devices-and-modes/cpu-device.rst index f1a914e6b9dac3..c5a6eb3d57915a 100644 --- a/docs/articles_en/openvino-workflow/running-inference/inference-devices-and-modes/cpu-device.rst +++ b/docs/articles_en/openvino-workflow/running-inference/inference-devices-and-modes/cpu-device.rst @@ -355,6 +355,7 @@ All parameters must be set before calling ``ov::Core::compile_model()`` in order - ``ov::hint::num_request`` - ``ov::hint::scheduling_core_type`` - ``ov::hint::enable_hyper_threading`` +- ``ov::hint::enable_cpu_reservation`` - ``ov::hint::enable_cpu_pinning`` - ``ov::num_streams`` - ``ov::affinity`` diff --git a/src/inference/dev_api/openvino/runtime/threading/istreams_executor.hpp b/src/inference/dev_api/openvino/runtime/threading/istreams_executor.hpp index 3630c2bb5a6ed7..e559f2ad4b3755 100644 --- a/src/inference/dev_api/openvino/runtime/threading/istreams_executor.hpp +++ b/src/inference/dev_api/openvino/runtime/threading/istreams_executor.hpp @@ -12,6 +12,7 @@ #include #include #include +#include #include "openvino/runtime/common.hpp" #include "openvino/runtime/properties.hpp" @@ -102,13 +103,14 @@ class OPENVINO_RUNTIME_API IStreamsExecutor : virtual public ITaskExecutor { ov::hint::SchedulingCoreType::ANY_CORE; //!< PCORE_ONLY and ECORE_ONLY are valid in hybrid core machine, //!< ANY_CORE is valid in all machines. Core type priority: //!< physical PCore, ECore, logical PCore - bool _cpu_reservation = false; //!< Whether to reserve current cores which will not be used by other plugin. - //!< If it is true, cpu_pinning defaults to true. + bool _cpu_reservation = false; //!< Whether to reserve current cores which will not be used by other plugin or + //!< compiled model. If it is true, cpu_pinning defaults to true. bool _cpu_pinning = false; //!< Whether to bind threads to cores. std::vector> _streams_info_table = {}; std::vector> _stream_processor_ids; int _sub_streams = 0; std::vector _rank = {}; + bool _add_lock = true; /** * @brief Get and reserve cpu ids based on configuration and hardware information, @@ -121,6 +123,8 @@ class OPENVINO_RUNTIME_API IStreamsExecutor : virtual public ITaskExecutor { */ void update_executor_config(); + void update_executor_config(bool lock); + /** * @brief Set _streams_info_table and _cpu_reservation in cpu streams executor config when nstreams = 0, * that is, only create one thread with TBB @@ -147,7 +151,8 @@ class OPENVINO_RUNTIME_API IStreamsExecutor : virtual public ITaskExecutor { bool cpu_reservation = false, bool cpu_pinning = false, std::vector> streams_info_table = {}, - std::vector rank = {}) + std::vector rank = {}, + bool add_lock = true) : _name{std::move(name)}, _streams{streams}, _threads_per_stream{threads_per_stream}, @@ -155,8 +160,9 @@ class OPENVINO_RUNTIME_API IStreamsExecutor : virtual public ITaskExecutor { _cpu_reservation{cpu_reservation}, _cpu_pinning{cpu_pinning}, _streams_info_table{std::move(streams_info_table)}, - _rank{rank} { - update_executor_config(); + _rank{rank}, + _add_lock(add_lock) { + update_executor_config(_add_lock); } // These APIs which includes set_property and get_property can not be removed until they will never be called by @@ -283,5 +289,7 @@ class OPENVINO_RUNTIME_API IStreamsExecutor : virtual public ITaskExecutor { virtual void execute(Task task) = 0; }; +static std::mutex _streams_executor_mutex; + } // namespace threading } // namespace ov diff --git a/src/inference/include/openvino/runtime/properties.hpp b/src/inference/include/openvino/runtime/properties.hpp index 5d9ec63ce0075c..b5f3b50f516675 100644 --- a/src/inference/include/openvino/runtime/properties.hpp +++ b/src/inference/include/openvino/runtime/properties.hpp @@ -483,10 +483,9 @@ static constexpr Property enable_cpu_pinning{"ENABLE_CPU_PINNING"}; * @brief This property allows CPU reservation during inference. * @ingroup ov_runtime_cpp_prop_api * - * Cpu Reservation means reserve cpus which will not be used by other plugin. Developer can use this property to - * enable or disable CPU reservation during inference on Windows and Linux. MacOS - * does not support CPU reservation, and this property is always disabled. - * This property defaults to false. + * Cpu Reservation means reserve cpus which will not be used by other plugin or compiled model. Developer can use this + * property to enable or disable CPU reservation during inference on Windows and Linux. MacOS does not support CPU + * reservation, and this property is always disabled. This property defaults to false. * * The following code is example to use this property. * diff --git a/src/inference/src/dev/threading/istreams_executor.cpp b/src/inference/src/dev/threading/istreams_executor.cpp index 4712ae3af193c4..2fce163c89eee7 100644 --- a/src/inference/src/dev/threading/istreams_executor.cpp +++ b/src/inference/src/dev/threading/istreams_executor.cpp @@ -159,23 +159,28 @@ void IStreamsExecutor::Config::update_executor_config() { const auto proc_type_table = get_proc_type_table(); bool streams_info_available = false; - if (proc_type_table.empty()) { - return; + if (_cpu_reservation && (proc_type_table.empty() || proc_type_table[0][ALL_PROC] == 0)) { + OPENVINO_THROW("proc_type_table is empty. No CPU resources available!"); } if (!_streams_info_table.empty()) { streams_info_available = true; std::vector threads_proc_type(HYPER_THREADING_PROC + 1, 0); + int threads_all = 0; for (size_t i = 0; i < _streams_info_table.size(); i++) { if (_streams_info_table[i][NUMBER_OF_STREAMS] > 0) { - threads_proc_type[_streams_info_table[i][PROC_TYPE]] += + int num_threads = _streams_info_table[i][THREADS_PER_STREAM] * _streams_info_table[i][NUMBER_OF_STREAMS]; + threads_proc_type[_streams_info_table[i][PROC_TYPE]] += num_threads; + threads_all += num_threads; } } + if (threads_all == 0) { + OPENVINO_THROW("streams_info_table is invalid!"); + } for (size_t i = ALL_PROC; i < threads_proc_type.size(); i++) { if (threads_proc_type[i] > proc_type_table[0][i]) { - streams_info_available = false; - break; + OPENVINO_THROW("Not enough CPU resources!"); } } } @@ -311,6 +316,17 @@ void IStreamsExecutor::Config::update_executor_config() { #endif } +void IStreamsExecutor::Config::update_executor_config(bool lock) { + if (lock) { + { + std::lock_guard lock{_streams_executor_mutex}; + update_executor_config(); + } + } else { + update_executor_config(); + } +} + void IStreamsExecutor::Config::set_config_zero_stream() { std::vector> proc_type_table = get_proc_type_table(); int core_type = MAIN_CORE_PROC; @@ -325,6 +341,7 @@ void IStreamsExecutor::Config::set_config_zero_stream() { socket_id = std::max(0, proc_type_table[0][PROC_SOCKET_ID]); } _streams_info_table.push_back({1, core_type, 1, numa_id, socket_id}); + _cpu_reservation = false; _cpu_pinning = false; } diff --git a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp index ed44c9c19e1eb8..1365b67d27ed66 100644 --- a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp +++ b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp @@ -727,15 +727,19 @@ std::vector> generate_stream_info(const int streams, ov::hint::SchedulingCoreType::ANY_CORE, config.enableCpuReservation, cpu_pinning, - streams_info_table}; - + streams_info_table, + {}, + false}; return proc_type_table; } void get_num_streams(const int streams, const std::shared_ptr& model, Config& config) { - std::vector> proc_type_table = get_proc_type_table(); + { + std::lock_guard lock{_streams_executor_mutex}; + std::vector> proc_type_table = get_proc_type_table(); - generate_stream_info(streams, -1, model, config, proc_type_table); + generate_stream_info(streams, -1, model, config, proc_type_table); + } } } // namespace intel_cpu diff --git a/src/plugins/intel_cpu/tests/unit/streams_info/streams_e2e_test.cpp b/src/plugins/intel_cpu/tests/unit/streams_info/streams_e2e_test.cpp index 9242fd7fd46bc9..6e223f28541a77 100644 --- a/src/plugins/intel_cpu/tests/unit/streams_info/streams_e2e_test.cpp +++ b/src/plugins/intel_cpu/tests/unit/streams_info/streams_e2e_test.cpp @@ -8,6 +8,7 @@ #include "cpu_map_scheduling.hpp" #include "cpu_streams_calculation.hpp" #include "openvino/runtime/system_conf.hpp" +#include "openvino/runtime/threading/cpu_streams_info.hpp" #include "os/cpu_map_info.hpp" using namespace testing; @@ -25,10 +26,12 @@ struct StreamGenerateionTestCase { ov::hint::SchedulingCoreType input_type; bool input_ht_value; bool input_ht_changed; + bool input_cpu_reservation; bool input_cpu_value; bool input_cpu_changed; ov::hint::PerformanceMode input_pm_hint; std::set hint_llm_distribution_policy; + std::vector> cpu_mapping_table; std::vector> input_proc_type_table; ov::hint::SchedulingCoreType output_type; bool output_ht_value; @@ -40,6 +43,7 @@ struct StreamGenerateionTestCase { void make_config(StreamGenerateionTestCase& test_data, ov::intel_cpu::Config& config) { config.schedulingCoreType = test_data.input_type; + config.enableCpuReservation = test_data.input_cpu_reservation; config.enableCpuPinning = test_data.input_cpu_value; config.changedCpuPinning = test_data.input_cpu_changed; config.enableHyperThreading = test_data.input_ht_value; @@ -62,21 +66,62 @@ class StreamGenerationTests : public ov::test::TestsCommon, make_config(test_data, config); CPU& cpu = cpu_info(); + cpu._cpu_mapping_table = test_data.cpu_mapping_table; cpu._proc_type_table = test_data.input_proc_type_table; + std::vector> res_proc_type_table = test_data.input_proc_type_table; - auto proc_type_table = ov::intel_cpu::generate_stream_info(test_data.input_stream, - test_data.input_numa_node_id, - nullptr, - config, - test_data.input_proc_type_table, - test_data.input_model_prefer); - - ASSERT_EQ(test_data.output_stream_info_table, config.streamExecutorConfig.get_streams_info_table()); - ASSERT_EQ(test_data.output_proc_type_table, proc_type_table); - ASSERT_EQ(test_data.output_cpu_value, config.streamExecutorConfig.get_cpu_pinning()); - ASSERT_EQ(test_data.output_ht_value, config.enableHyperThreading); - ASSERT_EQ(test_data.output_type, config.schedulingCoreType); - ASSERT_EQ(test_data.output_pm_hint, config.hintPerfMode); + if (cpu._cpu_mapping_table.empty()) { + EXPECT_THROW(ov::intel_cpu::generate_stream_info(test_data.input_stream, + test_data.input_numa_node_id, + nullptr, + config, + test_data.input_proc_type_table, + test_data.input_model_prefer), + ov::Exception); + } else { + auto proc_type_table = ov::intel_cpu::generate_stream_info(test_data.input_stream, + test_data.input_numa_node_id, + nullptr, + config, + test_data.input_proc_type_table, + test_data.input_model_prefer); + ASSERT_EQ(test_data.output_stream_info_table, config.streamExecutorConfig.get_streams_info_table()); + ASSERT_EQ(test_data.output_proc_type_table, proc_type_table); + ASSERT_EQ(test_data.output_cpu_value, config.streamExecutorConfig.get_cpu_pinning()); + ASSERT_EQ(test_data.output_ht_value, config.enableHyperThreading); + ASSERT_EQ(test_data.output_type, config.schedulingCoreType); + ASSERT_EQ(test_data.output_pm_hint, config.hintPerfMode); + if (config.enableCpuReservation) { + for (size_t i = 0; i < test_data.output_stream_info_table.size(); i++) { + if (test_data.output_stream_info_table[i][PROC_TYPE] >= MAIN_CORE_PROC && + test_data.output_stream_info_table[i][PROC_TYPE] <= HYPER_THREADING_PROC) { + int nstreams = test_data.output_stream_info_table[i][NUMBER_OF_STREAMS] > 0 + ? test_data.output_stream_info_table[i][NUMBER_OF_STREAMS] + : 1; + int nthreads = nstreams * test_data.output_stream_info_table[i][THREADS_PER_STREAM]; + if (res_proc_type_table.size() > 1) { + for (size_t j = 0; j < proc_type_table.size(); j++) { + if (res_proc_type_table[j][PROC_NUMA_NODE_ID] == + test_data.output_stream_info_table[i][STREAM_NUMA_NODE_ID] && + res_proc_type_table[j][PROC_SOCKET_ID] == + test_data.output_stream_info_table[i][STREAM_SOCKET_ID]) { + res_proc_type_table[j][test_data.output_stream_info_table[i][PROC_TYPE]] -= + nthreads; + res_proc_type_table[j][ALL_PROC] -= nthreads; + res_proc_type_table[0][test_data.output_stream_info_table[i][PROC_TYPE]] -= + nthreads; + res_proc_type_table[0][ALL_PROC] -= nthreads; + } + } + } else { + res_proc_type_table[0][test_data.output_stream_info_table[i][PROC_TYPE]] -= nthreads; + res_proc_type_table[0][ALL_PROC] -= nthreads; + } + } + } + ASSERT_EQ(res_proc_type_table, cpu._proc_type_table); + } + } } }; @@ -93,10 +138,23 @@ StreamGenerateionTestCase generation_latency_1sockets_14cores_1_pinning = { // (PCORE_ONLY/ECORE_ONLY/ANY_CORE) true, // param[in]: simulated setting for enableHyperThreading true, // param[in]: simulated settting for changedHyperThreading + false, // param[in]: simulated settting for enableCpuReservation true, // param[in]: simulated setting for enableCpuPinning true, // param[in]: simulated setting for changedCpuPinning ov::hint::PerformanceMode::LATENCY, // param[in]: simulated setting for performance mode (throughput/latency) - {}, // param[in]: simulated setting for model distribution policy + {}, // param[in]: simulated setting for model distribution policy + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, {1, 0, 0, 0, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 1, MAIN_CORE_PROC, 2, -1}, {3, 0, 0, 1, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 2, MAIN_CORE_PROC, 4, -1}, {5, 0, 0, 2, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 3, MAIN_CORE_PROC, 6, -1}, {7, 0, 0, 3, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 4, MAIN_CORE_PROC, 8, -1}, {9, 0, 0, 4, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 5, MAIN_CORE_PROC, 10, -1}, {11, 0, 0, 5, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 6, EFFICIENT_CORE_PROC, 12, -1}, {13, 0, 0, 7, EFFICIENT_CORE_PROC, 13, -1}, + {14, 0, 0, 8, EFFICIENT_CORE_PROC, 14, -1}, {15, 0, 0, 9, EFFICIENT_CORE_PROC, 15, -1}, + {16, 0, 0, 10, EFFICIENT_CORE_PROC, 16, -1}, {17, 0, 0, 11, EFFICIENT_CORE_PROC, 17, -1}, + {18, 0, 0, 12, EFFICIENT_CORE_PROC, 18, -1}, {19, 0, 0, 13, EFFICIENT_CORE_PROC, 19, -1}, + }, {{20, 6, 8, 6, 0, 0}}, // param[in]: simulated proc_type_table for platform which has one socket, 6 Pcores, 8 // Ecores and hyper threading enabled ov::hint::SchedulingCoreType::ANY_CORE, // param[expected out]: scheduling core type needs to be the same as input @@ -122,10 +180,27 @@ StreamGenerateionTestCase generation_latency_1sockets_14cores_2_pinning = { ov::hint::SchedulingCoreType::ANY_CORE, true, true, + false, true, true, ov::hint::PerformanceMode::LATENCY, {}, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, + {1, 0, 0, 1, MAIN_CORE_PROC, 1, -1}, + {2, 0, 0, 2, MAIN_CORE_PROC, 2, -1}, + {3, 0, 0, 3, MAIN_CORE_PROC, 3, -1}, + {4, 0, 0, 4, MAIN_CORE_PROC, 4, -1}, + {5, 0, 0, 5, MAIN_CORE_PROC, 5, -1}, + {6, 0, 0, 6, EFFICIENT_CORE_PROC, 6, -1}, + {7, 0, 0, 7, EFFICIENT_CORE_PROC, 7, -1}, + {8, 0, 0, 8, EFFICIENT_CORE_PROC, 8, -1}, + {9, 0, 0, 9, EFFICIENT_CORE_PROC, 9, -1}, + {10, 0, 0, 10, EFFICIENT_CORE_PROC, 10, -1}, + {11, 0, 0, 11, EFFICIENT_CORE_PROC, 11, -1}, + {12, 0, 0, 12, EFFICIENT_CORE_PROC, 12, -1}, + {13, 0, 0, 13, EFFICIENT_CORE_PROC, 13, -1}, + }, {{14, 6, 8, 0, 0, 0}}, ov::hint::SchedulingCoreType::ANY_CORE, false, @@ -145,10 +220,23 @@ StreamGenerateionTestCase generation_tput_1sockets_14cores_1_pinning = { ov::hint::SchedulingCoreType::ANY_CORE, true, true, + false, true, true, ov::hint::PerformanceMode::THROUGHPUT, {}, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, {1, 0, 0, 0, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 1, MAIN_CORE_PROC, 2, -1}, {3, 0, 0, 1, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 2, MAIN_CORE_PROC, 4, -1}, {5, 0, 0, 2, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 3, MAIN_CORE_PROC, 6, -1}, {7, 0, 0, 3, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 4, MAIN_CORE_PROC, 8, -1}, {9, 0, 0, 4, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 5, MAIN_CORE_PROC, 10, -1}, {11, 0, 0, 5, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 6, EFFICIENT_CORE_PROC, 12, -1}, {13, 0, 0, 7, EFFICIENT_CORE_PROC, 13, -1}, + {14, 0, 0, 8, EFFICIENT_CORE_PROC, 14, -1}, {15, 0, 0, 9, EFFICIENT_CORE_PROC, 15, -1}, + {16, 0, 0, 10, EFFICIENT_CORE_PROC, 16, -1}, {17, 0, 0, 11, EFFICIENT_CORE_PROC, 17, -1}, + {18, 0, 0, 12, EFFICIENT_CORE_PROC, 18, -1}, {19, 0, 0, 13, EFFICIENT_CORE_PROC, 19, -1}, + }, {{20, 6, 8, 6, 0, 0}}, ov::hint::SchedulingCoreType::ANY_CORE, true, @@ -168,10 +256,23 @@ StreamGenerateionTestCase generation_latency_1sockets_14cores_1_unpinning = { ov::hint::SchedulingCoreType::ANY_CORE, true, true, + false, true, true, ov::hint::PerformanceMode::LATENCY, {}, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, {1, 0, 0, 0, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 1, MAIN_CORE_PROC, 2, -1}, {3, 0, 0, 1, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 2, MAIN_CORE_PROC, 4, -1}, {5, 0, 0, 2, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 3, MAIN_CORE_PROC, 6, -1}, {7, 0, 0, 3, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 4, MAIN_CORE_PROC, 8, -1}, {9, 0, 0, 4, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 5, MAIN_CORE_PROC, 10, -1}, {11, 0, 0, 5, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 6, EFFICIENT_CORE_PROC, 12, -1}, {13, 0, 0, 7, EFFICIENT_CORE_PROC, 13, -1}, + {14, 0, 0, 8, EFFICIENT_CORE_PROC, 14, -1}, {15, 0, 0, 9, EFFICIENT_CORE_PROC, 15, -1}, + {16, 0, 0, 10, EFFICIENT_CORE_PROC, 16, -1}, {17, 0, 0, 11, EFFICIENT_CORE_PROC, 17, -1}, + {18, 0, 0, 12, EFFICIENT_CORE_PROC, 18, -1}, {19, 0, 0, 13, EFFICIENT_CORE_PROC, 19, -1}, + }, {{20, 6, 8, 6, 0, 0}}, ov::hint::SchedulingCoreType::ANY_CORE, true, @@ -194,10 +295,27 @@ StreamGenerateionTestCase generation_latency_1sockets_14cores_2_unpinning = { ov::hint::SchedulingCoreType::ANY_CORE, true, true, + false, true, true, ov::hint::PerformanceMode::LATENCY, {}, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, + {1, 0, 0, 1, MAIN_CORE_PROC, 1, -1}, + {2, 0, 0, 2, MAIN_CORE_PROC, 2, -1}, + {3, 0, 0, 3, MAIN_CORE_PROC, 3, -1}, + {4, 0, 0, 4, MAIN_CORE_PROC, 4, -1}, + {5, 0, 0, 5, MAIN_CORE_PROC, 5, -1}, + {6, 0, 0, 6, EFFICIENT_CORE_PROC, 6, -1}, + {7, 0, 0, 7, EFFICIENT_CORE_PROC, 7, -1}, + {8, 0, 0, 8, EFFICIENT_CORE_PROC, 8, -1}, + {9, 0, 0, 9, EFFICIENT_CORE_PROC, 9, -1}, + {10, 0, 0, 10, EFFICIENT_CORE_PROC, 10, -1}, + {11, 0, 0, 11, EFFICIENT_CORE_PROC, 11, -1}, + {12, 0, 0, 12, EFFICIENT_CORE_PROC, 12, -1}, + {13, 0, 0, 13, EFFICIENT_CORE_PROC, 13, -1}, + }, {{14, 6, 8, 0, 0, 0}}, ov::hint::SchedulingCoreType::ANY_CORE, false, @@ -217,10 +335,23 @@ StreamGenerateionTestCase generation_tput_1sockets_14cores_1_unpinning = { ov::hint::SchedulingCoreType::ANY_CORE, true, true, + false, true, true, ov::hint::PerformanceMode::THROUGHPUT, {}, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, {1, 0, 0, 0, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 1, MAIN_CORE_PROC, 2, -1}, {3, 0, 0, 1, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 2, MAIN_CORE_PROC, 4, -1}, {5, 0, 0, 2, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 3, MAIN_CORE_PROC, 6, -1}, {7, 0, 0, 3, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 4, MAIN_CORE_PROC, 8, -1}, {9, 0, 0, 4, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 5, MAIN_CORE_PROC, 10, -1}, {11, 0, 0, 5, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 6, EFFICIENT_CORE_PROC, 12, -1}, {13, 0, 0, 7, EFFICIENT_CORE_PROC, 13, -1}, + {14, 0, 0, 8, EFFICIENT_CORE_PROC, 14, -1}, {15, 0, 0, 9, EFFICIENT_CORE_PROC, 15, -1}, + {16, 0, 0, 10, EFFICIENT_CORE_PROC, 16, -1}, {17, 0, 0, 11, EFFICIENT_CORE_PROC, 17, -1}, + {18, 0, 0, 12, EFFICIENT_CORE_PROC, 18, -1}, {19, 0, 0, 13, EFFICIENT_CORE_PROC, 19, -1}, + }, {{20, 6, 8, 6, 0, 0}}, ov::hint::SchedulingCoreType::ANY_CORE, true, @@ -241,9 +372,66 @@ StreamGenerateionTestCase generation_latency_1sockets_14cores_3 = { true, true, false, + false, + true, + ov::hint::PerformanceMode::LATENCY, + {}, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, + {1, 0, 0, 1, MAIN_CORE_PROC, 1, -1}, + {2, 0, 0, 2, MAIN_CORE_PROC, 2, -1}, + {3, 0, 0, 3, MAIN_CORE_PROC, 3, -1}, + {4, 0, 0, 4, MAIN_CORE_PROC, 4, -1}, + {5, 0, 0, 5, MAIN_CORE_PROC, 5, -1}, + {6, 0, 0, 6, EFFICIENT_CORE_PROC, 6, -1}, + {7, 0, 0, 7, EFFICIENT_CORE_PROC, 7, -1}, + {8, 0, 0, 8, EFFICIENT_CORE_PROC, 8, -1}, + {9, 0, 0, 9, EFFICIENT_CORE_PROC, 9, -1}, + {10, 0, 0, 10, EFFICIENT_CORE_PROC, 10, -1}, + {11, 0, 0, 11, EFFICIENT_CORE_PROC, 11, -1}, + {12, 0, 0, 12, EFFICIENT_CORE_PROC, 12, -1}, + {13, 0, 0, 13, EFFICIENT_CORE_PROC, 13, -1}, + }, + {{14, 6, 8, 0, 0, 0}}, + ov::hint::SchedulingCoreType::PCORE_ONLY, + false, + false, + ov::hint::PerformanceMode::LATENCY, + {{6, 6, 0, 0, 0, 0}}, + {{1, MAIN_CORE_PROC, 6, 0, 0}}, +}; + +StreamGenerateionTestCase generation_latency_1sockets_14cores_3_reservation = { + 1, + false, + 0, + 0, + 0, + 0, + ov::hint::SchedulingCoreType::PCORE_ONLY, + true, + true, + true, + false, true, ov::hint::PerformanceMode::LATENCY, {}, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, + {1, 0, 0, 1, MAIN_CORE_PROC, 1, -1}, + {2, 0, 0, 2, MAIN_CORE_PROC, 2, -1}, + {3, 0, 0, 3, MAIN_CORE_PROC, 3, -1}, + {4, 0, 0, 4, MAIN_CORE_PROC, 4, -1}, + {5, 0, 0, 5, MAIN_CORE_PROC, 5, -1}, + {6, 0, 0, 6, EFFICIENT_CORE_PROC, 6, -1}, + {7, 0, 0, 7, EFFICIENT_CORE_PROC, 7, -1}, + {8, 0, 0, 8, EFFICIENT_CORE_PROC, 8, -1}, + {9, 0, 0, 9, EFFICIENT_CORE_PROC, 9, -1}, + {10, 0, 0, 10, EFFICIENT_CORE_PROC, 10, -1}, + {11, 0, 0, 11, EFFICIENT_CORE_PROC, 11, -1}, + {12, 0, 0, 12, EFFICIENT_CORE_PROC, 12, -1}, + {13, 0, 0, 13, EFFICIENT_CORE_PROC, 13, -1}, + }, {{14, 6, 8, 0, 0, 0}}, ov::hint::SchedulingCoreType::PCORE_ONLY, false, @@ -264,9 +452,22 @@ StreamGenerateionTestCase generation_latency_1sockets_14cores_4 = { true, true, false, + false, true, ov::hint::PerformanceMode::LATENCY, {}, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, {1, 0, 0, 0, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 1, MAIN_CORE_PROC, 2, -1}, {3, 0, 0, 1, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 2, MAIN_CORE_PROC, 4, -1}, {5, 0, 0, 2, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 3, MAIN_CORE_PROC, 6, -1}, {7, 0, 0, 3, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 4, MAIN_CORE_PROC, 8, -1}, {9, 0, 0, 4, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 5, MAIN_CORE_PROC, 10, -1}, {11, 0, 0, 5, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 6, EFFICIENT_CORE_PROC, 12, -1}, {13, 0, 0, 7, EFFICIENT_CORE_PROC, 13, -1}, + {14, 0, 0, 8, EFFICIENT_CORE_PROC, 14, -1}, {15, 0, 0, 9, EFFICIENT_CORE_PROC, 15, -1}, + {16, 0, 0, 10, EFFICIENT_CORE_PROC, 16, -1}, {17, 0, 0, 11, EFFICIENT_CORE_PROC, 17, -1}, + {18, 0, 0, 12, EFFICIENT_CORE_PROC, 18, -1}, {19, 0, 0, 13, EFFICIENT_CORE_PROC, 19, -1}, + }, {{20, 6, 8, 6, 0, 0}}, ov::hint::SchedulingCoreType::PCORE_ONLY, true, @@ -287,9 +488,22 @@ StreamGenerateionTestCase generation_latency_1sockets_14cores_5 = { false, true, false, + false, true, ov::hint::PerformanceMode::LATENCY, {}, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, {1, 0, 0, 0, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 1, MAIN_CORE_PROC, 2, -1}, {3, 0, 0, 1, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 2, MAIN_CORE_PROC, 4, -1}, {5, 0, 0, 2, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 3, MAIN_CORE_PROC, 6, -1}, {7, 0, 0, 3, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 4, MAIN_CORE_PROC, 8, -1}, {9, 0, 0, 4, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 5, MAIN_CORE_PROC, 10, -1}, {11, 0, 0, 5, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 6, EFFICIENT_CORE_PROC, 12, -1}, {13, 0, 0, 7, EFFICIENT_CORE_PROC, 13, -1}, + {14, 0, 0, 8, EFFICIENT_CORE_PROC, 14, -1}, {15, 0, 0, 9, EFFICIENT_CORE_PROC, 15, -1}, + {16, 0, 0, 10, EFFICIENT_CORE_PROC, 16, -1}, {17, 0, 0, 11, EFFICIENT_CORE_PROC, 17, -1}, + {18, 0, 0, 12, EFFICIENT_CORE_PROC, 18, -1}, {19, 0, 0, 13, EFFICIENT_CORE_PROC, 19, -1}, + }, {{20, 6, 8, 6, 0, 0}}, ov::hint::SchedulingCoreType::PCORE_ONLY, false, @@ -310,9 +524,134 @@ StreamGenerateionTestCase generation_latency_2sockets_48cores_6 = { false, true, false, + false, + true, + ov::hint::PerformanceMode::LATENCY, + {}, + { + {0, 0, 0, 0, HYPER_THREADING_PROC, 0, -1}, {1, 0, 0, 1, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 2, HYPER_THREADING_PROC, 2, -1}, {3, 0, 0, 3, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 4, HYPER_THREADING_PROC, 4, -1}, {5, 0, 0, 5, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 6, HYPER_THREADING_PROC, 6, -1}, {7, 0, 0, 7, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 8, HYPER_THREADING_PROC, 8, -1}, {9, 0, 0, 9, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 10, HYPER_THREADING_PROC, 10, -1}, {11, 0, 0, 11, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 12, HYPER_THREADING_PROC, 12, -1}, {13, 0, 0, 13, HYPER_THREADING_PROC, 13, -1}, + {14, 0, 0, 14, HYPER_THREADING_PROC, 14, -1}, {15, 0, 0, 15, HYPER_THREADING_PROC, 15, -1}, + {16, 0, 0, 16, HYPER_THREADING_PROC, 16, -1}, {17, 0, 0, 17, HYPER_THREADING_PROC, 17, -1}, + {18, 0, 0, 18, HYPER_THREADING_PROC, 18, -1}, {19, 0, 0, 19, HYPER_THREADING_PROC, 19, -1}, + {20, 0, 0, 20, HYPER_THREADING_PROC, 20, -1}, {21, 0, 0, 21, HYPER_THREADING_PROC, 21, -1}, + {22, 0, 0, 22, HYPER_THREADING_PROC, 22, -1}, {23, 0, 0, 23, HYPER_THREADING_PROC, 23, -1}, + {24, 1, 1, 24, HYPER_THREADING_PROC, 24, -1}, {25, 1, 1, 25, HYPER_THREADING_PROC, 25, -1}, + {26, 1, 1, 26, HYPER_THREADING_PROC, 26, -1}, {27, 1, 1, 27, HYPER_THREADING_PROC, 27, -1}, + {28, 1, 1, 28, HYPER_THREADING_PROC, 28, -1}, {29, 1, 1, 29, HYPER_THREADING_PROC, 29, -1}, + {30, 1, 1, 30, HYPER_THREADING_PROC, 30, -1}, {31, 1, 1, 31, HYPER_THREADING_PROC, 31, -1}, + {32, 1, 1, 32, HYPER_THREADING_PROC, 32, -1}, {33, 1, 1, 33, HYPER_THREADING_PROC, 33, -1}, + {34, 1, 1, 34, HYPER_THREADING_PROC, 34, -1}, {35, 1, 1, 35, HYPER_THREADING_PROC, 35, -1}, + {36, 1, 1, 36, HYPER_THREADING_PROC, 36, -1}, {37, 1, 1, 37, HYPER_THREADING_PROC, 37, -1}, + {38, 1, 1, 38, HYPER_THREADING_PROC, 38, -1}, {39, 1, 1, 39, HYPER_THREADING_PROC, 39, -1}, + {40, 1, 1, 40, HYPER_THREADING_PROC, 40, -1}, {41, 1, 1, 41, HYPER_THREADING_PROC, 41, -1}, + {42, 1, 1, 42, HYPER_THREADING_PROC, 42, -1}, {43, 1, 1, 43, HYPER_THREADING_PROC, 43, -1}, + {44, 1, 1, 44, HYPER_THREADING_PROC, 44, -1}, {45, 1, 1, 45, HYPER_THREADING_PROC, 45, -1}, + {46, 1, 1, 46, HYPER_THREADING_PROC, 46, -1}, {47, 1, 1, 47, HYPER_THREADING_PROC, 47, -1}, + {48, 0, 0, 48, MAIN_CORE_PROC, 48, -1}, {49, 0, 0, 49, MAIN_CORE_PROC, 49, -1}, + {50, 0, 0, 50, MAIN_CORE_PROC, 50, -1}, {51, 0, 0, 51, MAIN_CORE_PROC, 51, -1}, + {52, 0, 0, 52, MAIN_CORE_PROC, 52, -1}, {53, 0, 0, 53, MAIN_CORE_PROC, 53, -1}, + {54, 0, 0, 54, MAIN_CORE_PROC, 54, -1}, {55, 0, 0, 55, MAIN_CORE_PROC, 55, -1}, + {56, 0, 0, 56, MAIN_CORE_PROC, 56, -1}, {57, 0, 0, 57, MAIN_CORE_PROC, 57, -1}, + {58, 0, 0, 58, MAIN_CORE_PROC, 58, -1}, {59, 0, 0, 59, MAIN_CORE_PROC, 59, -1}, + {60, 0, 0, 60, MAIN_CORE_PROC, 60, -1}, {61, 0, 0, 61, MAIN_CORE_PROC, 61, -1}, + {62, 0, 0, 62, MAIN_CORE_PROC, 62, -1}, {63, 0, 0, 63, MAIN_CORE_PROC, 63, -1}, + {64, 0, 0, 64, MAIN_CORE_PROC, 64, -1}, {65, 0, 0, 65, MAIN_CORE_PROC, 65, -1}, + {66, 0, 0, 66, MAIN_CORE_PROC, 66, -1}, {67, 0, 0, 67, MAIN_CORE_PROC, 67, -1}, + {68, 0, 0, 68, MAIN_CORE_PROC, 68, -1}, {69, 0, 0, 69, MAIN_CORE_PROC, 69, -1}, + {70, 0, 0, 70, MAIN_CORE_PROC, 70, -1}, {71, 0, 0, 71, MAIN_CORE_PROC, 71, -1}, + {72, 1, 1, 72, MAIN_CORE_PROC, 72, -1}, {73, 1, 1, 73, MAIN_CORE_PROC, 73, -1}, + {74, 1, 1, 74, MAIN_CORE_PROC, 74, -1}, {75, 1, 1, 75, MAIN_CORE_PROC, 75, -1}, + {76, 1, 1, 76, MAIN_CORE_PROC, 76, -1}, {77, 1, 1, 77, MAIN_CORE_PROC, 77, -1}, + {78, 1, 1, 78, MAIN_CORE_PROC, 78, -1}, {79, 1, 1, 79, MAIN_CORE_PROC, 79, -1}, + {80, 1, 1, 80, MAIN_CORE_PROC, 80, -1}, {81, 1, 1, 81, MAIN_CORE_PROC, 81, -1}, + {82, 1, 1, 82, MAIN_CORE_PROC, 82, -1}, {83, 1, 1, 83, MAIN_CORE_PROC, 83, -1}, + {84, 1, 1, 84, MAIN_CORE_PROC, 84, -1}, {85, 1, 1, 85, MAIN_CORE_PROC, 85, -1}, + {86, 1, 1, 86, MAIN_CORE_PROC, 86, -1}, {87, 1, 1, 87, MAIN_CORE_PROC, 87, -1}, + {88, 1, 1, 88, MAIN_CORE_PROC, 88, -1}, {89, 1, 1, 89, MAIN_CORE_PROC, 89, -1}, + {90, 1, 1, 90, MAIN_CORE_PROC, 90, -1}, {91, 1, 1, 91, MAIN_CORE_PROC, 91, -1}, + {92, 1, 1, 92, MAIN_CORE_PROC, 92, -1}, {93, 1, 1, 93, MAIN_CORE_PROC, 93, -1}, + {94, 1, 1, 94, MAIN_CORE_PROC, 94, -1}, {95, 1, 1, 95, MAIN_CORE_PROC, 95, -1}, + }, + {{96, 48, 0, 48, -1, -1}, {48, 24, 0, 24, 0, 0}, {48, 24, 0, 24, 1, 1}}, + ov::hint::SchedulingCoreType::PCORE_ONLY, + false, + false, + ov::hint::PerformanceMode::LATENCY, + {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 0, 0}, {24, 24, 0, 0, 1, 1}}, + {{1, MAIN_CORE_PROC, 24, 0, 0}}, +}; + +StreamGenerateionTestCase generation_latency_2sockets_48cores_6_reservation = { + 1, + false, + 0, + 0, + 0, + 0, + ov::hint::SchedulingCoreType::PCORE_ONLY, + false, + true, + true, + false, true, ov::hint::PerformanceMode::LATENCY, {}, + { + {0, 0, 0, 0, HYPER_THREADING_PROC, 0, -1}, {1, 0, 0, 1, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 2, HYPER_THREADING_PROC, 2, -1}, {3, 0, 0, 3, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 4, HYPER_THREADING_PROC, 4, -1}, {5, 0, 0, 5, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 6, HYPER_THREADING_PROC, 6, -1}, {7, 0, 0, 7, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 8, HYPER_THREADING_PROC, 8, -1}, {9, 0, 0, 9, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 10, HYPER_THREADING_PROC, 10, -1}, {11, 0, 0, 11, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 12, HYPER_THREADING_PROC, 12, -1}, {13, 0, 0, 13, HYPER_THREADING_PROC, 13, -1}, + {14, 0, 0, 14, HYPER_THREADING_PROC, 14, -1}, {15, 0, 0, 15, HYPER_THREADING_PROC, 15, -1}, + {16, 0, 0, 16, HYPER_THREADING_PROC, 16, -1}, {17, 0, 0, 17, HYPER_THREADING_PROC, 17, -1}, + {18, 0, 0, 18, HYPER_THREADING_PROC, 18, -1}, {19, 0, 0, 19, HYPER_THREADING_PROC, 19, -1}, + {20, 0, 0, 20, HYPER_THREADING_PROC, 20, -1}, {21, 0, 0, 21, HYPER_THREADING_PROC, 21, -1}, + {22, 0, 0, 22, HYPER_THREADING_PROC, 22, -1}, {23, 0, 0, 23, HYPER_THREADING_PROC, 23, -1}, + {24, 1, 1, 24, HYPER_THREADING_PROC, 24, -1}, {25, 1, 1, 25, HYPER_THREADING_PROC, 25, -1}, + {26, 1, 1, 26, HYPER_THREADING_PROC, 26, -1}, {27, 1, 1, 27, HYPER_THREADING_PROC, 27, -1}, + {28, 1, 1, 28, HYPER_THREADING_PROC, 28, -1}, {29, 1, 1, 29, HYPER_THREADING_PROC, 29, -1}, + {30, 1, 1, 30, HYPER_THREADING_PROC, 30, -1}, {31, 1, 1, 31, HYPER_THREADING_PROC, 31, -1}, + {32, 1, 1, 32, HYPER_THREADING_PROC, 32, -1}, {33, 1, 1, 33, HYPER_THREADING_PROC, 33, -1}, + {34, 1, 1, 34, HYPER_THREADING_PROC, 34, -1}, {35, 1, 1, 35, HYPER_THREADING_PROC, 35, -1}, + {36, 1, 1, 36, HYPER_THREADING_PROC, 36, -1}, {37, 1, 1, 37, HYPER_THREADING_PROC, 37, -1}, + {38, 1, 1, 38, HYPER_THREADING_PROC, 38, -1}, {39, 1, 1, 39, HYPER_THREADING_PROC, 39, -1}, + {40, 1, 1, 40, HYPER_THREADING_PROC, 40, -1}, {41, 1, 1, 41, HYPER_THREADING_PROC, 41, -1}, + {42, 1, 1, 42, HYPER_THREADING_PROC, 42, -1}, {43, 1, 1, 43, HYPER_THREADING_PROC, 43, -1}, + {44, 1, 1, 44, HYPER_THREADING_PROC, 44, -1}, {45, 1, 1, 45, HYPER_THREADING_PROC, 45, -1}, + {46, 1, 1, 46, HYPER_THREADING_PROC, 46, -1}, {47, 1, 1, 47, HYPER_THREADING_PROC, 47, -1}, + {48, 0, 0, 48, MAIN_CORE_PROC, 48, -1}, {49, 0, 0, 49, MAIN_CORE_PROC, 49, -1}, + {50, 0, 0, 50, MAIN_CORE_PROC, 50, -1}, {51, 0, 0, 51, MAIN_CORE_PROC, 51, -1}, + {52, 0, 0, 52, MAIN_CORE_PROC, 52, -1}, {53, 0, 0, 53, MAIN_CORE_PROC, 53, -1}, + {54, 0, 0, 54, MAIN_CORE_PROC, 54, -1}, {55, 0, 0, 55, MAIN_CORE_PROC, 55, -1}, + {56, 0, 0, 56, MAIN_CORE_PROC, 56, -1}, {57, 0, 0, 57, MAIN_CORE_PROC, 57, -1}, + {58, 0, 0, 58, MAIN_CORE_PROC, 58, -1}, {59, 0, 0, 59, MAIN_CORE_PROC, 59, -1}, + {60, 0, 0, 60, MAIN_CORE_PROC, 60, -1}, {61, 0, 0, 61, MAIN_CORE_PROC, 61, -1}, + {62, 0, 0, 62, MAIN_CORE_PROC, 62, -1}, {63, 0, 0, 63, MAIN_CORE_PROC, 63, -1}, + {64, 0, 0, 64, MAIN_CORE_PROC, 64, -1}, {65, 0, 0, 65, MAIN_CORE_PROC, 65, -1}, + {66, 0, 0, 66, MAIN_CORE_PROC, 66, -1}, {67, 0, 0, 67, MAIN_CORE_PROC, 67, -1}, + {68, 0, 0, 68, MAIN_CORE_PROC, 68, -1}, {69, 0, 0, 69, MAIN_CORE_PROC, 69, -1}, + {70, 0, 0, 70, MAIN_CORE_PROC, 70, -1}, {71, 0, 0, 71, MAIN_CORE_PROC, 71, -1}, + {72, 1, 1, 72, MAIN_CORE_PROC, 72, -1}, {73, 1, 1, 73, MAIN_CORE_PROC, 73, -1}, + {74, 1, 1, 74, MAIN_CORE_PROC, 74, -1}, {75, 1, 1, 75, MAIN_CORE_PROC, 75, -1}, + {76, 1, 1, 76, MAIN_CORE_PROC, 76, -1}, {77, 1, 1, 77, MAIN_CORE_PROC, 77, -1}, + {78, 1, 1, 78, MAIN_CORE_PROC, 78, -1}, {79, 1, 1, 79, MAIN_CORE_PROC, 79, -1}, + {80, 1, 1, 80, MAIN_CORE_PROC, 80, -1}, {81, 1, 1, 81, MAIN_CORE_PROC, 81, -1}, + {82, 1, 1, 82, MAIN_CORE_PROC, 82, -1}, {83, 1, 1, 83, MAIN_CORE_PROC, 83, -1}, + {84, 1, 1, 84, MAIN_CORE_PROC, 84, -1}, {85, 1, 1, 85, MAIN_CORE_PROC, 85, -1}, + {86, 1, 1, 86, MAIN_CORE_PROC, 86, -1}, {87, 1, 1, 87, MAIN_CORE_PROC, 87, -1}, + {88, 1, 1, 88, MAIN_CORE_PROC, 88, -1}, {89, 1, 1, 89, MAIN_CORE_PROC, 89, -1}, + {90, 1, 1, 90, MAIN_CORE_PROC, 90, -1}, {91, 1, 1, 91, MAIN_CORE_PROC, 91, -1}, + {92, 1, 1, 92, MAIN_CORE_PROC, 92, -1}, {93, 1, 1, 93, MAIN_CORE_PROC, 93, -1}, + {94, 1, 1, 94, MAIN_CORE_PROC, 94, -1}, {95, 1, 1, 95, MAIN_CORE_PROC, 95, -1}, + }, {{96, 48, 0, 48, -1, -1}, {48, 24, 0, 24, 0, 0}, {48, 24, 0, 24, 1, 1}}, ov::hint::SchedulingCoreType::PCORE_ONLY, false, @@ -333,9 +672,36 @@ StreamGenerateionTestCase generation_latency_2sockets_48cores_7 = { true, true, false, + false, true, ov::hint::PerformanceMode::LATENCY, {}, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, {1, 0, 0, 1, MAIN_CORE_PROC, 1, -1}, + {2, 0, 0, 2, MAIN_CORE_PROC, 2, -1}, {3, 0, 0, 3, MAIN_CORE_PROC, 3, -1}, + {4, 0, 0, 4, MAIN_CORE_PROC, 4, -1}, {5, 0, 0, 5, MAIN_CORE_PROC, 5, -1}, + {6, 0, 0, 6, MAIN_CORE_PROC, 6, -1}, {7, 0, 0, 7, MAIN_CORE_PROC, 7, -1}, + {8, 0, 0, 8, MAIN_CORE_PROC, 8, -1}, {9, 0, 0, 9, MAIN_CORE_PROC, 9, -1}, + {10, 0, 0, 10, MAIN_CORE_PROC, 10, -1}, {11, 0, 0, 11, MAIN_CORE_PROC, 11, -1}, + {12, 0, 0, 12, MAIN_CORE_PROC, 12, -1}, {13, 0, 0, 13, MAIN_CORE_PROC, 13, -1}, + {14, 0, 0, 14, MAIN_CORE_PROC, 14, -1}, {15, 0, 0, 15, MAIN_CORE_PROC, 15, -1}, + {16, 0, 0, 16, MAIN_CORE_PROC, 16, -1}, {17, 0, 0, 17, MAIN_CORE_PROC, 17, -1}, + {18, 0, 0, 18, MAIN_CORE_PROC, 18, -1}, {19, 0, 0, 19, MAIN_CORE_PROC, 19, -1}, + {20, 0, 0, 20, MAIN_CORE_PROC, 20, -1}, {21, 0, 0, 21, MAIN_CORE_PROC, 21, -1}, + {22, 0, 0, 22, MAIN_CORE_PROC, 22, -1}, {23, 0, 0, 23, MAIN_CORE_PROC, 23, -1}, + {24, 1, 1, 24, MAIN_CORE_PROC, 24, -1}, {25, 1, 1, 25, MAIN_CORE_PROC, 25, -1}, + {26, 1, 1, 26, MAIN_CORE_PROC, 26, -1}, {27, 1, 1, 27, MAIN_CORE_PROC, 27, -1}, + {28, 1, 1, 28, MAIN_CORE_PROC, 28, -1}, {29, 1, 1, 29, MAIN_CORE_PROC, 29, -1}, + {30, 1, 1, 30, MAIN_CORE_PROC, 30, -1}, {31, 1, 1, 31, MAIN_CORE_PROC, 31, -1}, + {32, 1, 1, 32, MAIN_CORE_PROC, 32, -1}, {33, 1, 1, 33, MAIN_CORE_PROC, 33, -1}, + {34, 1, 1, 34, MAIN_CORE_PROC, 34, -1}, {35, 1, 1, 35, MAIN_CORE_PROC, 35, -1}, + {36, 1, 1, 36, MAIN_CORE_PROC, 36, -1}, {37, 1, 1, 37, MAIN_CORE_PROC, 37, -1}, + {38, 1, 1, 38, MAIN_CORE_PROC, 38, -1}, {39, 1, 1, 39, MAIN_CORE_PROC, 39, -1}, + {40, 1, 1, 40, MAIN_CORE_PROC, 40, -1}, {41, 1, 1, 41, MAIN_CORE_PROC, 41, -1}, + {42, 1, 1, 42, MAIN_CORE_PROC, 42, -1}, {43, 1, 1, 43, MAIN_CORE_PROC, 43, -1}, + {44, 1, 1, 44, MAIN_CORE_PROC, 44, -1}, {45, 1, 1, 45, MAIN_CORE_PROC, 45, -1}, + {46, 1, 1, 46, MAIN_CORE_PROC, 46, -1}, {47, 1, 1, 47, MAIN_CORE_PROC, 47, -1}, + }, {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 0, 0}, {24, 24, 0, 0, 1, 1}}, ov::hint::SchedulingCoreType::PCORE_ONLY, false, @@ -356,9 +722,60 @@ StreamGenerateionTestCase generation_latency_2sockets_48cores_8 = { false, true, false, + false, true, ov::hint::PerformanceMode::LATENCY, {}, + { + {0, 0, 0, 0, HYPER_THREADING_PROC, 0, -1}, {1, 0, 0, 1, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 2, HYPER_THREADING_PROC, 2, -1}, {3, 0, 0, 3, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 4, HYPER_THREADING_PROC, 4, -1}, {5, 0, 0, 5, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 6, HYPER_THREADING_PROC, 6, -1}, {7, 0, 0, 7, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 8, HYPER_THREADING_PROC, 8, -1}, {9, 0, 0, 9, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 10, HYPER_THREADING_PROC, 10, -1}, {11, 0, 0, 11, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 12, HYPER_THREADING_PROC, 12, -1}, {13, 0, 0, 13, HYPER_THREADING_PROC, 13, -1}, + {14, 0, 0, 14, HYPER_THREADING_PROC, 14, -1}, {15, 0, 0, 15, HYPER_THREADING_PROC, 15, -1}, + {16, 0, 0, 16, HYPER_THREADING_PROC, 16, -1}, {17, 0, 0, 17, HYPER_THREADING_PROC, 17, -1}, + {18, 0, 0, 18, HYPER_THREADING_PROC, 18, -1}, {19, 0, 0, 19, HYPER_THREADING_PROC, 19, -1}, + {20, 0, 0, 20, HYPER_THREADING_PROC, 20, -1}, {21, 0, 0, 21, HYPER_THREADING_PROC, 21, -1}, + {22, 0, 0, 22, HYPER_THREADING_PROC, 22, -1}, {23, 0, 0, 23, HYPER_THREADING_PROC, 23, -1}, + {24, 1, 1, 24, HYPER_THREADING_PROC, 24, -1}, {25, 1, 1, 25, HYPER_THREADING_PROC, 25, -1}, + {26, 1, 1, 26, HYPER_THREADING_PROC, 26, -1}, {27, 1, 1, 27, HYPER_THREADING_PROC, 27, -1}, + {28, 1, 1, 28, HYPER_THREADING_PROC, 28, -1}, {29, 1, 1, 29, HYPER_THREADING_PROC, 29, -1}, + {30, 1, 1, 30, HYPER_THREADING_PROC, 30, -1}, {31, 1, 1, 31, HYPER_THREADING_PROC, 31, -1}, + {32, 1, 1, 32, HYPER_THREADING_PROC, 32, -1}, {33, 1, 1, 33, HYPER_THREADING_PROC, 33, -1}, + {34, 1, 1, 34, HYPER_THREADING_PROC, 34, -1}, {35, 1, 1, 35, HYPER_THREADING_PROC, 35, -1}, + {36, 1, 1, 36, HYPER_THREADING_PROC, 36, -1}, {37, 1, 1, 37, HYPER_THREADING_PROC, 37, -1}, + {38, 1, 1, 38, HYPER_THREADING_PROC, 38, -1}, {39, 1, 1, 39, HYPER_THREADING_PROC, 39, -1}, + {40, 1, 1, 40, HYPER_THREADING_PROC, 40, -1}, {41, 1, 1, 41, HYPER_THREADING_PROC, 41, -1}, + {42, 1, 1, 42, HYPER_THREADING_PROC, 42, -1}, {43, 1, 1, 43, HYPER_THREADING_PROC, 43, -1}, + {44, 1, 1, 44, HYPER_THREADING_PROC, 44, -1}, {45, 1, 1, 45, HYPER_THREADING_PROC, 45, -1}, + {46, 1, 1, 46, HYPER_THREADING_PROC, 46, -1}, {47, 1, 1, 47, HYPER_THREADING_PROC, 47, -1}, + {48, 0, 0, 48, MAIN_CORE_PROC, 48, -1}, {49, 0, 0, 49, MAIN_CORE_PROC, 49, -1}, + {50, 0, 0, 50, MAIN_CORE_PROC, 50, -1}, {51, 0, 0, 51, MAIN_CORE_PROC, 51, -1}, + {52, 0, 0, 52, MAIN_CORE_PROC, 52, -1}, {53, 0, 0, 53, MAIN_CORE_PROC, 53, -1}, + {54, 0, 0, 54, MAIN_CORE_PROC, 54, -1}, {55, 0, 0, 55, MAIN_CORE_PROC, 55, -1}, + {56, 0, 0, 56, MAIN_CORE_PROC, 56, -1}, {57, 0, 0, 57, MAIN_CORE_PROC, 57, -1}, + {58, 0, 0, 58, MAIN_CORE_PROC, 58, -1}, {59, 0, 0, 59, MAIN_CORE_PROC, 59, -1}, + {60, 0, 0, 60, MAIN_CORE_PROC, 60, -1}, {61, 0, 0, 61, MAIN_CORE_PROC, 61, -1}, + {62, 0, 0, 62, MAIN_CORE_PROC, 62, -1}, {63, 0, 0, 63, MAIN_CORE_PROC, 63, -1}, + {64, 0, 0, 64, MAIN_CORE_PROC, 64, -1}, {65, 0, 0, 65, MAIN_CORE_PROC, 65, -1}, + {66, 0, 0, 66, MAIN_CORE_PROC, 66, -1}, {67, 0, 0, 67, MAIN_CORE_PROC, 67, -1}, + {68, 0, 0, 68, MAIN_CORE_PROC, 68, -1}, {69, 0, 0, 69, MAIN_CORE_PROC, 69, -1}, + {70, 0, 0, 70, MAIN_CORE_PROC, 70, -1}, {71, 0, 0, 71, MAIN_CORE_PROC, 71, -1}, + {72, 1, 1, 72, MAIN_CORE_PROC, 72, -1}, {73, 1, 1, 73, MAIN_CORE_PROC, 73, -1}, + {74, 1, 1, 74, MAIN_CORE_PROC, 74, -1}, {75, 1, 1, 75, MAIN_CORE_PROC, 75, -1}, + {76, 1, 1, 76, MAIN_CORE_PROC, 76, -1}, {77, 1, 1, 77, MAIN_CORE_PROC, 77, -1}, + {78, 1, 1, 78, MAIN_CORE_PROC, 78, -1}, {79, 1, 1, 79, MAIN_CORE_PROC, 79, -1}, + {80, 1, 1, 80, MAIN_CORE_PROC, 80, -1}, {81, 1, 1, 81, MAIN_CORE_PROC, 81, -1}, + {82, 1, 1, 82, MAIN_CORE_PROC, 82, -1}, {83, 1, 1, 83, MAIN_CORE_PROC, 83, -1}, + {84, 1, 1, 84, MAIN_CORE_PROC, 84, -1}, {85, 1, 1, 85, MAIN_CORE_PROC, 85, -1}, + {86, 1, 1, 86, MAIN_CORE_PROC, 86, -1}, {87, 1, 1, 87, MAIN_CORE_PROC, 87, -1}, + {88, 1, 1, 88, MAIN_CORE_PROC, 88, -1}, {89, 1, 1, 89, MAIN_CORE_PROC, 89, -1}, + {90, 1, 1, 90, MAIN_CORE_PROC, 90, -1}, {91, 1, 1, 91, MAIN_CORE_PROC, 91, -1}, + {92, 1, 1, 92, MAIN_CORE_PROC, 92, -1}, {93, 1, 1, 93, MAIN_CORE_PROC, 93, -1}, + {94, 1, 1, 94, MAIN_CORE_PROC, 94, -1}, {95, 1, 1, 95, MAIN_CORE_PROC, 95, -1}, + }, {{96, 48, 0, 48, -1, -1}, {48, 24, 0, 24, 0, 0}, {48, 24, 0, 24, 1, 1}}, ov::hint::SchedulingCoreType::PCORE_ONLY, false, @@ -379,9 +796,36 @@ StreamGenerateionTestCase generation_latency_2sockets_48cores_9 = { true, true, false, + false, true, ov::hint::PerformanceMode::LATENCY, {}, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, {1, 0, 0, 1, MAIN_CORE_PROC, 1, -1}, + {2, 0, 0, 2, MAIN_CORE_PROC, 2, -1}, {3, 0, 0, 3, MAIN_CORE_PROC, 3, -1}, + {4, 0, 0, 4, MAIN_CORE_PROC, 4, -1}, {5, 0, 0, 5, MAIN_CORE_PROC, 5, -1}, + {6, 0, 0, 6, MAIN_CORE_PROC, 6, -1}, {7, 0, 0, 7, MAIN_CORE_PROC, 7, -1}, + {8, 0, 0, 8, MAIN_CORE_PROC, 8, -1}, {9, 0, 0, 9, MAIN_CORE_PROC, 9, -1}, + {10, 0, 0, 10, MAIN_CORE_PROC, 10, -1}, {11, 0, 0, 11, MAIN_CORE_PROC, 11, -1}, + {12, 0, 0, 12, MAIN_CORE_PROC, 12, -1}, {13, 0, 0, 13, MAIN_CORE_PROC, 13, -1}, + {14, 0, 0, 14, MAIN_CORE_PROC, 14, -1}, {15, 0, 0, 15, MAIN_CORE_PROC, 15, -1}, + {16, 0, 0, 16, MAIN_CORE_PROC, 16, -1}, {17, 0, 0, 17, MAIN_CORE_PROC, 17, -1}, + {18, 0, 0, 18, MAIN_CORE_PROC, 18, -1}, {19, 0, 0, 19, MAIN_CORE_PROC, 19, -1}, + {20, 0, 0, 20, MAIN_CORE_PROC, 20, -1}, {21, 0, 0, 21, MAIN_CORE_PROC, 21, -1}, + {22, 0, 0, 22, MAIN_CORE_PROC, 22, -1}, {23, 0, 0, 23, MAIN_CORE_PROC, 23, -1}, + {24, 1, 1, 24, MAIN_CORE_PROC, 24, -1}, {25, 1, 1, 25, MAIN_CORE_PROC, 25, -1}, + {26, 1, 1, 26, MAIN_CORE_PROC, 26, -1}, {27, 1, 1, 27, MAIN_CORE_PROC, 27, -1}, + {28, 1, 1, 28, MAIN_CORE_PROC, 28, -1}, {29, 1, 1, 29, MAIN_CORE_PROC, 29, -1}, + {30, 1, 1, 30, MAIN_CORE_PROC, 30, -1}, {31, 1, 1, 31, MAIN_CORE_PROC, 31, -1}, + {32, 1, 1, 32, MAIN_CORE_PROC, 32, -1}, {33, 1, 1, 33, MAIN_CORE_PROC, 33, -1}, + {34, 1, 1, 34, MAIN_CORE_PROC, 34, -1}, {35, 1, 1, 35, MAIN_CORE_PROC, 35, -1}, + {36, 1, 1, 36, MAIN_CORE_PROC, 36, -1}, {37, 1, 1, 37, MAIN_CORE_PROC, 37, -1}, + {38, 1, 1, 38, MAIN_CORE_PROC, 38, -1}, {39, 1, 1, 39, MAIN_CORE_PROC, 39, -1}, + {40, 1, 1, 40, MAIN_CORE_PROC, 40, -1}, {41, 1, 1, 41, MAIN_CORE_PROC, 41, -1}, + {42, 1, 1, 42, MAIN_CORE_PROC, 42, -1}, {43, 1, 1, 43, MAIN_CORE_PROC, 43, -1}, + {44, 1, 1, 44, MAIN_CORE_PROC, 44, -1}, {45, 1, 1, 45, MAIN_CORE_PROC, 45, -1}, + {46, 1, 1, 46, MAIN_CORE_PROC, 46, -1}, {47, 1, 1, 47, MAIN_CORE_PROC, 47, -1}, + }, {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 0, 0}, {24, 24, 0, 0, 1, 1}}, ov::hint::SchedulingCoreType::PCORE_ONLY, false, @@ -402,9 +846,60 @@ StreamGenerateionTestCase generation_latency_2sockets_48cores_10 = { false, true, false, + false, true, ov::hint::PerformanceMode::LATENCY, {ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL}, + { + {0, 0, 0, 0, HYPER_THREADING_PROC, 0, -1}, {1, 0, 0, 1, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 2, HYPER_THREADING_PROC, 2, -1}, {3, 0, 0, 3, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 4, HYPER_THREADING_PROC, 4, -1}, {5, 0, 0, 5, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 6, HYPER_THREADING_PROC, 6, -1}, {7, 0, 0, 7, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 8, HYPER_THREADING_PROC, 8, -1}, {9, 0, 0, 9, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 10, HYPER_THREADING_PROC, 10, -1}, {11, 0, 0, 11, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 12, HYPER_THREADING_PROC, 12, -1}, {13, 0, 0, 13, HYPER_THREADING_PROC, 13, -1}, + {14, 0, 0, 14, HYPER_THREADING_PROC, 14, -1}, {15, 0, 0, 15, HYPER_THREADING_PROC, 15, -1}, + {16, 0, 0, 16, HYPER_THREADING_PROC, 16, -1}, {17, 0, 0, 17, HYPER_THREADING_PROC, 17, -1}, + {18, 0, 0, 18, HYPER_THREADING_PROC, 18, -1}, {19, 0, 0, 19, HYPER_THREADING_PROC, 19, -1}, + {20, 0, 0, 20, HYPER_THREADING_PROC, 20, -1}, {21, 0, 0, 21, HYPER_THREADING_PROC, 21, -1}, + {22, 0, 0, 22, HYPER_THREADING_PROC, 22, -1}, {23, 0, 0, 23, HYPER_THREADING_PROC, 23, -1}, + {24, 1, 1, 24, HYPER_THREADING_PROC, 24, -1}, {25, 1, 1, 25, HYPER_THREADING_PROC, 25, -1}, + {26, 1, 1, 26, HYPER_THREADING_PROC, 26, -1}, {27, 1, 1, 27, HYPER_THREADING_PROC, 27, -1}, + {28, 1, 1, 28, HYPER_THREADING_PROC, 28, -1}, {29, 1, 1, 29, HYPER_THREADING_PROC, 29, -1}, + {30, 1, 1, 30, HYPER_THREADING_PROC, 30, -1}, {31, 1, 1, 31, HYPER_THREADING_PROC, 31, -1}, + {32, 1, 1, 32, HYPER_THREADING_PROC, 32, -1}, {33, 1, 1, 33, HYPER_THREADING_PROC, 33, -1}, + {34, 1, 1, 34, HYPER_THREADING_PROC, 34, -1}, {35, 1, 1, 35, HYPER_THREADING_PROC, 35, -1}, + {36, 1, 1, 36, HYPER_THREADING_PROC, 36, -1}, {37, 1, 1, 37, HYPER_THREADING_PROC, 37, -1}, + {38, 1, 1, 38, HYPER_THREADING_PROC, 38, -1}, {39, 1, 1, 39, HYPER_THREADING_PROC, 39, -1}, + {40, 1, 1, 40, HYPER_THREADING_PROC, 40, -1}, {41, 1, 1, 41, HYPER_THREADING_PROC, 41, -1}, + {42, 1, 1, 42, HYPER_THREADING_PROC, 42, -1}, {43, 1, 1, 43, HYPER_THREADING_PROC, 43, -1}, + {44, 1, 1, 44, HYPER_THREADING_PROC, 44, -1}, {45, 1, 1, 45, HYPER_THREADING_PROC, 45, -1}, + {46, 1, 1, 46, HYPER_THREADING_PROC, 46, -1}, {47, 1, 1, 47, HYPER_THREADING_PROC, 47, -1}, + {48, 0, 0, 48, MAIN_CORE_PROC, 48, -1}, {49, 0, 0, 49, MAIN_CORE_PROC, 49, -1}, + {50, 0, 0, 50, MAIN_CORE_PROC, 50, -1}, {51, 0, 0, 51, MAIN_CORE_PROC, 51, -1}, + {52, 0, 0, 52, MAIN_CORE_PROC, 52, -1}, {53, 0, 0, 53, MAIN_CORE_PROC, 53, -1}, + {54, 0, 0, 54, MAIN_CORE_PROC, 54, -1}, {55, 0, 0, 55, MAIN_CORE_PROC, 55, -1}, + {56, 0, 0, 56, MAIN_CORE_PROC, 56, -1}, {57, 0, 0, 57, MAIN_CORE_PROC, 57, -1}, + {58, 0, 0, 58, MAIN_CORE_PROC, 58, -1}, {59, 0, 0, 59, MAIN_CORE_PROC, 59, -1}, + {60, 0, 0, 60, MAIN_CORE_PROC, 60, -1}, {61, 0, 0, 61, MAIN_CORE_PROC, 61, -1}, + {62, 0, 0, 62, MAIN_CORE_PROC, 62, -1}, {63, 0, 0, 63, MAIN_CORE_PROC, 63, -1}, + {64, 0, 0, 64, MAIN_CORE_PROC, 64, -1}, {65, 0, 0, 65, MAIN_CORE_PROC, 65, -1}, + {66, 0, 0, 66, MAIN_CORE_PROC, 66, -1}, {67, 0, 0, 67, MAIN_CORE_PROC, 67, -1}, + {68, 0, 0, 68, MAIN_CORE_PROC, 68, -1}, {69, 0, 0, 69, MAIN_CORE_PROC, 69, -1}, + {70, 0, 0, 70, MAIN_CORE_PROC, 70, -1}, {71, 0, 0, 71, MAIN_CORE_PROC, 71, -1}, + {72, 1, 1, 72, MAIN_CORE_PROC, 72, -1}, {73, 1, 1, 73, MAIN_CORE_PROC, 73, -1}, + {74, 1, 1, 74, MAIN_CORE_PROC, 74, -1}, {75, 1, 1, 75, MAIN_CORE_PROC, 75, -1}, + {76, 1, 1, 76, MAIN_CORE_PROC, 76, -1}, {77, 1, 1, 77, MAIN_CORE_PROC, 77, -1}, + {78, 1, 1, 78, MAIN_CORE_PROC, 78, -1}, {79, 1, 1, 79, MAIN_CORE_PROC, 79, -1}, + {80, 1, 1, 80, MAIN_CORE_PROC, 80, -1}, {81, 1, 1, 81, MAIN_CORE_PROC, 81, -1}, + {82, 1, 1, 82, MAIN_CORE_PROC, 82, -1}, {83, 1, 1, 83, MAIN_CORE_PROC, 83, -1}, + {84, 1, 1, 84, MAIN_CORE_PROC, 84, -1}, {85, 1, 1, 85, MAIN_CORE_PROC, 85, -1}, + {86, 1, 1, 86, MAIN_CORE_PROC, 86, -1}, {87, 1, 1, 87, MAIN_CORE_PROC, 87, -1}, + {88, 1, 1, 88, MAIN_CORE_PROC, 88, -1}, {89, 1, 1, 89, MAIN_CORE_PROC, 89, -1}, + {90, 1, 1, 90, MAIN_CORE_PROC, 90, -1}, {91, 1, 1, 91, MAIN_CORE_PROC, 91, -1}, + {92, 1, 1, 92, MAIN_CORE_PROC, 92, -1}, {93, 1, 1, 93, MAIN_CORE_PROC, 93, -1}, + {94, 1, 1, 94, MAIN_CORE_PROC, 94, -1}, {95, 1, 1, 95, MAIN_CORE_PROC, 95, -1}, + }, {{96, 48, 0, 48, -1, -1}, {48, 24, 0, 24, 0, 0}, {48, 24, 0, 24, 1, 1}}, ov::hint::SchedulingCoreType::PCORE_ONLY, false, @@ -425,9 +920,36 @@ StreamGenerateionTestCase generation_latency_2sockets_48cores_11 = { true, true, false, + false, true, ov::hint::PerformanceMode::LATENCY, {ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL}, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, {1, 0, 0, 1, MAIN_CORE_PROC, 1, -1}, + {2, 0, 0, 2, MAIN_CORE_PROC, 2, -1}, {3, 0, 0, 3, MAIN_CORE_PROC, 3, -1}, + {4, 0, 0, 4, MAIN_CORE_PROC, 4, -1}, {5, 0, 0, 5, MAIN_CORE_PROC, 5, -1}, + {6, 0, 0, 6, MAIN_CORE_PROC, 6, -1}, {7, 0, 0, 7, MAIN_CORE_PROC, 7, -1}, + {8, 0, 0, 8, MAIN_CORE_PROC, 8, -1}, {9, 0, 0, 9, MAIN_CORE_PROC, 9, -1}, + {10, 0, 0, 10, MAIN_CORE_PROC, 10, -1}, {11, 0, 0, 11, MAIN_CORE_PROC, 11, -1}, + {12, 0, 0, 12, MAIN_CORE_PROC, 12, -1}, {13, 0, 0, 13, MAIN_CORE_PROC, 13, -1}, + {14, 0, 0, 14, MAIN_CORE_PROC, 14, -1}, {15, 0, 0, 15, MAIN_CORE_PROC, 15, -1}, + {16, 0, 0, 16, MAIN_CORE_PROC, 16, -1}, {17, 0, 0, 17, MAIN_CORE_PROC, 17, -1}, + {18, 0, 0, 18, MAIN_CORE_PROC, 18, -1}, {19, 0, 0, 19, MAIN_CORE_PROC, 19, -1}, + {20, 0, 0, 20, MAIN_CORE_PROC, 20, -1}, {21, 0, 0, 21, MAIN_CORE_PROC, 21, -1}, + {22, 0, 0, 22, MAIN_CORE_PROC, 22, -1}, {23, 0, 0, 23, MAIN_CORE_PROC, 23, -1}, + {24, 1, 1, 24, MAIN_CORE_PROC, 24, -1}, {25, 1, 1, 25, MAIN_CORE_PROC, 25, -1}, + {26, 1, 1, 26, MAIN_CORE_PROC, 26, -1}, {27, 1, 1, 27, MAIN_CORE_PROC, 27, -1}, + {28, 1, 1, 28, MAIN_CORE_PROC, 28, -1}, {29, 1, 1, 29, MAIN_CORE_PROC, 29, -1}, + {30, 1, 1, 30, MAIN_CORE_PROC, 30, -1}, {31, 1, 1, 31, MAIN_CORE_PROC, 31, -1}, + {32, 1, 1, 32, MAIN_CORE_PROC, 32, -1}, {33, 1, 1, 33, MAIN_CORE_PROC, 33, -1}, + {34, 1, 1, 34, MAIN_CORE_PROC, 34, -1}, {35, 1, 1, 35, MAIN_CORE_PROC, 35, -1}, + {36, 1, 1, 36, MAIN_CORE_PROC, 36, -1}, {37, 1, 1, 37, MAIN_CORE_PROC, 37, -1}, + {38, 1, 1, 38, MAIN_CORE_PROC, 38, -1}, {39, 1, 1, 39, MAIN_CORE_PROC, 39, -1}, + {40, 1, 1, 40, MAIN_CORE_PROC, 40, -1}, {41, 1, 1, 41, MAIN_CORE_PROC, 41, -1}, + {42, 1, 1, 42, MAIN_CORE_PROC, 42, -1}, {43, 1, 1, 43, MAIN_CORE_PROC, 43, -1}, + {44, 1, 1, 44, MAIN_CORE_PROC, 44, -1}, {45, 1, 1, 45, MAIN_CORE_PROC, 45, -1}, + {46, 1, 1, 46, MAIN_CORE_PROC, 46, -1}, {47, 1, 1, 47, MAIN_CORE_PROC, 47, -1}, + }, {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 0, 0}, {24, 24, 0, 0, 1, 1}}, ov::hint::SchedulingCoreType::PCORE_ONLY, false, @@ -448,9 +970,22 @@ StreamGenerateionTestCase generation_tput_1sockets_14cores_2 = { false, true, false, + false, true, ov::hint::PerformanceMode::THROUGHPUT, {}, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, {1, 0, 0, 0, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 1, MAIN_CORE_PROC, 2, -1}, {3, 0, 0, 1, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 2, MAIN_CORE_PROC, 4, -1}, {5, 0, 0, 2, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 3, MAIN_CORE_PROC, 6, -1}, {7, 0, 0, 3, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 4, MAIN_CORE_PROC, 8, -1}, {9, 0, 0, 4, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 5, MAIN_CORE_PROC, 10, -1}, {11, 0, 0, 5, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 6, EFFICIENT_CORE_PROC, 12, -1}, {13, 0, 0, 7, EFFICIENT_CORE_PROC, 13, -1}, + {14, 0, 0, 8, EFFICIENT_CORE_PROC, 14, -1}, {15, 0, 0, 9, EFFICIENT_CORE_PROC, 15, -1}, + {16, 0, 0, 10, EFFICIENT_CORE_PROC, 16, -1}, {17, 0, 0, 11, EFFICIENT_CORE_PROC, 17, -1}, + {18, 0, 0, 12, EFFICIENT_CORE_PROC, 18, -1}, {19, 0, 0, 13, EFFICIENT_CORE_PROC, 19, -1}, + }, {{20, 6, 8, 6, 0, 0}}, ov::hint::SchedulingCoreType::PCORE_ONLY, false, @@ -471,9 +1006,22 @@ StreamGenerateionTestCase generation_tput_1sockets_14cores_3 = { true, true, false, + false, true, ov::hint::PerformanceMode::THROUGHPUT, {}, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, {1, 0, 0, 0, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 1, MAIN_CORE_PROC, 2, -1}, {3, 0, 0, 1, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 2, MAIN_CORE_PROC, 4, -1}, {5, 0, 0, 2, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 3, MAIN_CORE_PROC, 6, -1}, {7, 0, 0, 3, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 4, MAIN_CORE_PROC, 8, -1}, {9, 0, 0, 4, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 5, MAIN_CORE_PROC, 10, -1}, {11, 0, 0, 5, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 6, EFFICIENT_CORE_PROC, 12, -1}, {13, 0, 0, 7, EFFICIENT_CORE_PROC, 13, -1}, + {14, 0, 0, 8, EFFICIENT_CORE_PROC, 14, -1}, {15, 0, 0, 9, EFFICIENT_CORE_PROC, 15, -1}, + {16, 0, 0, 10, EFFICIENT_CORE_PROC, 16, -1}, {17, 0, 0, 11, EFFICIENT_CORE_PROC, 17, -1}, + {18, 0, 0, 12, EFFICIENT_CORE_PROC, 18, -1}, {19, 0, 0, 13, EFFICIENT_CORE_PROC, 19, -1}, + }, {{20, 6, 8, 6, 0, 0}}, ov::hint::SchedulingCoreType::PCORE_ONLY, true, @@ -494,9 +1042,22 @@ StreamGenerateionTestCase generation_tput_1sockets_14cores_4 = { true, true, false, + false, true, ov::hint::PerformanceMode::THROUGHPUT, {}, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, {1, 0, 0, 0, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 1, MAIN_CORE_PROC, 2, -1}, {3, 0, 0, 1, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 2, MAIN_CORE_PROC, 4, -1}, {5, 0, 0, 2, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 3, MAIN_CORE_PROC, 6, -1}, {7, 0, 0, 3, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 4, MAIN_CORE_PROC, 8, -1}, {9, 0, 0, 4, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 5, MAIN_CORE_PROC, 10, -1}, {11, 0, 0, 5, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 6, EFFICIENT_CORE_PROC, 12, -1}, {13, 0, 0, 7, EFFICIENT_CORE_PROC, 13, -1}, + {14, 0, 0, 8, EFFICIENT_CORE_PROC, 14, -1}, {15, 0, 0, 9, EFFICIENT_CORE_PROC, 15, -1}, + {16, 0, 0, 10, EFFICIENT_CORE_PROC, 16, -1}, {17, 0, 0, 11, EFFICIENT_CORE_PROC, 17, -1}, + {18, 0, 0, 12, EFFICIENT_CORE_PROC, 18, -1}, {19, 0, 0, 13, EFFICIENT_CORE_PROC, 19, -1}, + }, {{20, 6, 8, 6, 0, 0}}, ov::hint::SchedulingCoreType::PCORE_ONLY, true, @@ -517,9 +1078,60 @@ StreamGenerateionTestCase generation_tput_2sockets_48cores_5 = { true, true, false, + false, true, ov::hint::PerformanceMode::THROUGHPUT, {}, + { + {0, 0, 0, 0, HYPER_THREADING_PROC, 0, -1}, {1, 0, 0, 1, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 2, HYPER_THREADING_PROC, 2, -1}, {3, 0, 0, 3, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 4, HYPER_THREADING_PROC, 4, -1}, {5, 0, 0, 5, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 6, HYPER_THREADING_PROC, 6, -1}, {7, 0, 0, 7, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 8, HYPER_THREADING_PROC, 8, -1}, {9, 0, 0, 9, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 10, HYPER_THREADING_PROC, 10, -1}, {11, 0, 0, 11, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 12, HYPER_THREADING_PROC, 12, -1}, {13, 0, 0, 13, HYPER_THREADING_PROC, 13, -1}, + {14, 0, 0, 14, HYPER_THREADING_PROC, 14, -1}, {15, 0, 0, 15, HYPER_THREADING_PROC, 15, -1}, + {16, 0, 0, 16, HYPER_THREADING_PROC, 16, -1}, {17, 0, 0, 17, HYPER_THREADING_PROC, 17, -1}, + {18, 0, 0, 18, HYPER_THREADING_PROC, 18, -1}, {19, 0, 0, 19, HYPER_THREADING_PROC, 19, -1}, + {20, 0, 0, 20, HYPER_THREADING_PROC, 20, -1}, {21, 0, 0, 21, HYPER_THREADING_PROC, 21, -1}, + {22, 0, 0, 22, HYPER_THREADING_PROC, 22, -1}, {23, 0, 0, 23, HYPER_THREADING_PROC, 23, -1}, + {24, 1, 1, 24, HYPER_THREADING_PROC, 24, -1}, {25, 1, 1, 25, HYPER_THREADING_PROC, 25, -1}, + {26, 1, 1, 26, HYPER_THREADING_PROC, 26, -1}, {27, 1, 1, 27, HYPER_THREADING_PROC, 27, -1}, + {28, 1, 1, 28, HYPER_THREADING_PROC, 28, -1}, {29, 1, 1, 29, HYPER_THREADING_PROC, 29, -1}, + {30, 1, 1, 30, HYPER_THREADING_PROC, 30, -1}, {31, 1, 1, 31, HYPER_THREADING_PROC, 31, -1}, + {32, 1, 1, 32, HYPER_THREADING_PROC, 32, -1}, {33, 1, 1, 33, HYPER_THREADING_PROC, 33, -1}, + {34, 1, 1, 34, HYPER_THREADING_PROC, 34, -1}, {35, 1, 1, 35, HYPER_THREADING_PROC, 35, -1}, + {36, 1, 1, 36, HYPER_THREADING_PROC, 36, -1}, {37, 1, 1, 37, HYPER_THREADING_PROC, 37, -1}, + {38, 1, 1, 38, HYPER_THREADING_PROC, 38, -1}, {39, 1, 1, 39, HYPER_THREADING_PROC, 39, -1}, + {40, 1, 1, 40, HYPER_THREADING_PROC, 40, -1}, {41, 1, 1, 41, HYPER_THREADING_PROC, 41, -1}, + {42, 1, 1, 42, HYPER_THREADING_PROC, 42, -1}, {43, 1, 1, 43, HYPER_THREADING_PROC, 43, -1}, + {44, 1, 1, 44, HYPER_THREADING_PROC, 44, -1}, {45, 1, 1, 45, HYPER_THREADING_PROC, 45, -1}, + {46, 1, 1, 46, HYPER_THREADING_PROC, 46, -1}, {47, 1, 1, 47, HYPER_THREADING_PROC, 47, -1}, + {48, 0, 0, 48, MAIN_CORE_PROC, 48, -1}, {49, 0, 0, 49, MAIN_CORE_PROC, 49, -1}, + {50, 0, 0, 50, MAIN_CORE_PROC, 50, -1}, {51, 0, 0, 51, MAIN_CORE_PROC, 51, -1}, + {52, 0, 0, 52, MAIN_CORE_PROC, 52, -1}, {53, 0, 0, 53, MAIN_CORE_PROC, 53, -1}, + {54, 0, 0, 54, MAIN_CORE_PROC, 54, -1}, {55, 0, 0, 55, MAIN_CORE_PROC, 55, -1}, + {56, 0, 0, 56, MAIN_CORE_PROC, 56, -1}, {57, 0, 0, 57, MAIN_CORE_PROC, 57, -1}, + {58, 0, 0, 58, MAIN_CORE_PROC, 58, -1}, {59, 0, 0, 59, MAIN_CORE_PROC, 59, -1}, + {60, 0, 0, 60, MAIN_CORE_PROC, 60, -1}, {61, 0, 0, 61, MAIN_CORE_PROC, 61, -1}, + {62, 0, 0, 62, MAIN_CORE_PROC, 62, -1}, {63, 0, 0, 63, MAIN_CORE_PROC, 63, -1}, + {64, 0, 0, 64, MAIN_CORE_PROC, 64, -1}, {65, 0, 0, 65, MAIN_CORE_PROC, 65, -1}, + {66, 0, 0, 66, MAIN_CORE_PROC, 66, -1}, {67, 0, 0, 67, MAIN_CORE_PROC, 67, -1}, + {68, 0, 0, 68, MAIN_CORE_PROC, 68, -1}, {69, 0, 0, 69, MAIN_CORE_PROC, 69, -1}, + {70, 0, 0, 70, MAIN_CORE_PROC, 70, -1}, {71, 0, 0, 71, MAIN_CORE_PROC, 71, -1}, + {72, 1, 1, 72, MAIN_CORE_PROC, 72, -1}, {73, 1, 1, 73, MAIN_CORE_PROC, 73, -1}, + {74, 1, 1, 74, MAIN_CORE_PROC, 74, -1}, {75, 1, 1, 75, MAIN_CORE_PROC, 75, -1}, + {76, 1, 1, 76, MAIN_CORE_PROC, 76, -1}, {77, 1, 1, 77, MAIN_CORE_PROC, 77, -1}, + {78, 1, 1, 78, MAIN_CORE_PROC, 78, -1}, {79, 1, 1, 79, MAIN_CORE_PROC, 79, -1}, + {80, 1, 1, 80, MAIN_CORE_PROC, 80, -1}, {81, 1, 1, 81, MAIN_CORE_PROC, 81, -1}, + {82, 1, 1, 82, MAIN_CORE_PROC, 82, -1}, {83, 1, 1, 83, MAIN_CORE_PROC, 83, -1}, + {84, 1, 1, 84, MAIN_CORE_PROC, 84, -1}, {85, 1, 1, 85, MAIN_CORE_PROC, 85, -1}, + {86, 1, 1, 86, MAIN_CORE_PROC, 86, -1}, {87, 1, 1, 87, MAIN_CORE_PROC, 87, -1}, + {88, 1, 1, 88, MAIN_CORE_PROC, 88, -1}, {89, 1, 1, 89, MAIN_CORE_PROC, 89, -1}, + {90, 1, 1, 90, MAIN_CORE_PROC, 90, -1}, {91, 1, 1, 91, MAIN_CORE_PROC, 91, -1}, + {92, 1, 1, 92, MAIN_CORE_PROC, 92, -1}, {93, 1, 1, 93, MAIN_CORE_PROC, 93, -1}, + {94, 1, 1, 94, MAIN_CORE_PROC, 94, -1}, {95, 1, 1, 95, MAIN_CORE_PROC, 95, -1}, + }, {{96, 48, 0, 48, -1, -1}, {48, 24, 0, 24, 0, 0}, {48, 24, 0, 24, 1, 1}}, ov::hint::SchedulingCoreType::ANY_CORE, true, @@ -543,9 +1155,60 @@ StreamGenerateionTestCase generation_tput_2sockets_48cores_6 = { false, true, false, + false, true, ov::hint::PerformanceMode::THROUGHPUT, {}, + { + {0, 0, 0, 0, HYPER_THREADING_PROC, 0, -1}, {1, 0, 0, 1, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 2, HYPER_THREADING_PROC, 2, -1}, {3, 0, 0, 3, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 4, HYPER_THREADING_PROC, 4, -1}, {5, 0, 0, 5, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 6, HYPER_THREADING_PROC, 6, -1}, {7, 0, 0, 7, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 8, HYPER_THREADING_PROC, 8, -1}, {9, 0, 0, 9, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 10, HYPER_THREADING_PROC, 10, -1}, {11, 0, 0, 11, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 12, HYPER_THREADING_PROC, 12, -1}, {13, 0, 0, 13, HYPER_THREADING_PROC, 13, -1}, + {14, 0, 0, 14, HYPER_THREADING_PROC, 14, -1}, {15, 0, 0, 15, HYPER_THREADING_PROC, 15, -1}, + {16, 0, 0, 16, HYPER_THREADING_PROC, 16, -1}, {17, 0, 0, 17, HYPER_THREADING_PROC, 17, -1}, + {18, 0, 0, 18, HYPER_THREADING_PROC, 18, -1}, {19, 0, 0, 19, HYPER_THREADING_PROC, 19, -1}, + {20, 0, 0, 20, HYPER_THREADING_PROC, 20, -1}, {21, 0, 0, 21, HYPER_THREADING_PROC, 21, -1}, + {22, 0, 0, 22, HYPER_THREADING_PROC, 22, -1}, {23, 0, 0, 23, HYPER_THREADING_PROC, 23, -1}, + {24, 1, 1, 24, HYPER_THREADING_PROC, 24, -1}, {25, 1, 1, 25, HYPER_THREADING_PROC, 25, -1}, + {26, 1, 1, 26, HYPER_THREADING_PROC, 26, -1}, {27, 1, 1, 27, HYPER_THREADING_PROC, 27, -1}, + {28, 1, 1, 28, HYPER_THREADING_PROC, 28, -1}, {29, 1, 1, 29, HYPER_THREADING_PROC, 29, -1}, + {30, 1, 1, 30, HYPER_THREADING_PROC, 30, -1}, {31, 1, 1, 31, HYPER_THREADING_PROC, 31, -1}, + {32, 1, 1, 32, HYPER_THREADING_PROC, 32, -1}, {33, 1, 1, 33, HYPER_THREADING_PROC, 33, -1}, + {34, 1, 1, 34, HYPER_THREADING_PROC, 34, -1}, {35, 1, 1, 35, HYPER_THREADING_PROC, 35, -1}, + {36, 1, 1, 36, HYPER_THREADING_PROC, 36, -1}, {37, 1, 1, 37, HYPER_THREADING_PROC, 37, -1}, + {38, 1, 1, 38, HYPER_THREADING_PROC, 38, -1}, {39, 1, 1, 39, HYPER_THREADING_PROC, 39, -1}, + {40, 1, 1, 40, HYPER_THREADING_PROC, 40, -1}, {41, 1, 1, 41, HYPER_THREADING_PROC, 41, -1}, + {42, 1, 1, 42, HYPER_THREADING_PROC, 42, -1}, {43, 1, 1, 43, HYPER_THREADING_PROC, 43, -1}, + {44, 1, 1, 44, HYPER_THREADING_PROC, 44, -1}, {45, 1, 1, 45, HYPER_THREADING_PROC, 45, -1}, + {46, 1, 1, 46, HYPER_THREADING_PROC, 46, -1}, {47, 1, 1, 47, HYPER_THREADING_PROC, 47, -1}, + {48, 0, 0, 48, MAIN_CORE_PROC, 48, -1}, {49, 0, 0, 49, MAIN_CORE_PROC, 49, -1}, + {50, 0, 0, 50, MAIN_CORE_PROC, 50, -1}, {51, 0, 0, 51, MAIN_CORE_PROC, 51, -1}, + {52, 0, 0, 52, MAIN_CORE_PROC, 52, -1}, {53, 0, 0, 53, MAIN_CORE_PROC, 53, -1}, + {54, 0, 0, 54, MAIN_CORE_PROC, 54, -1}, {55, 0, 0, 55, MAIN_CORE_PROC, 55, -1}, + {56, 0, 0, 56, MAIN_CORE_PROC, 56, -1}, {57, 0, 0, 57, MAIN_CORE_PROC, 57, -1}, + {58, 0, 0, 58, MAIN_CORE_PROC, 58, -1}, {59, 0, 0, 59, MAIN_CORE_PROC, 59, -1}, + {60, 0, 0, 60, MAIN_CORE_PROC, 60, -1}, {61, 0, 0, 61, MAIN_CORE_PROC, 61, -1}, + {62, 0, 0, 62, MAIN_CORE_PROC, 62, -1}, {63, 0, 0, 63, MAIN_CORE_PROC, 63, -1}, + {64, 0, 0, 64, MAIN_CORE_PROC, 64, -1}, {65, 0, 0, 65, MAIN_CORE_PROC, 65, -1}, + {66, 0, 0, 66, MAIN_CORE_PROC, 66, -1}, {67, 0, 0, 67, MAIN_CORE_PROC, 67, -1}, + {68, 0, 0, 68, MAIN_CORE_PROC, 68, -1}, {69, 0, 0, 69, MAIN_CORE_PROC, 69, -1}, + {70, 0, 0, 70, MAIN_CORE_PROC, 70, -1}, {71, 0, 0, 71, MAIN_CORE_PROC, 71, -1}, + {72, 1, 1, 72, MAIN_CORE_PROC, 72, -1}, {73, 1, 1, 73, MAIN_CORE_PROC, 73, -1}, + {74, 1, 1, 74, MAIN_CORE_PROC, 74, -1}, {75, 1, 1, 75, MAIN_CORE_PROC, 75, -1}, + {76, 1, 1, 76, MAIN_CORE_PROC, 76, -1}, {77, 1, 1, 77, MAIN_CORE_PROC, 77, -1}, + {78, 1, 1, 78, MAIN_CORE_PROC, 78, -1}, {79, 1, 1, 79, MAIN_CORE_PROC, 79, -1}, + {80, 1, 1, 80, MAIN_CORE_PROC, 80, -1}, {81, 1, 1, 81, MAIN_CORE_PROC, 81, -1}, + {82, 1, 1, 82, MAIN_CORE_PROC, 82, -1}, {83, 1, 1, 83, MAIN_CORE_PROC, 83, -1}, + {84, 1, 1, 84, MAIN_CORE_PROC, 84, -1}, {85, 1, 1, 85, MAIN_CORE_PROC, 85, -1}, + {86, 1, 1, 86, MAIN_CORE_PROC, 86, -1}, {87, 1, 1, 87, MAIN_CORE_PROC, 87, -1}, + {88, 1, 1, 88, MAIN_CORE_PROC, 88, -1}, {89, 1, 1, 89, MAIN_CORE_PROC, 89, -1}, + {90, 1, 1, 90, MAIN_CORE_PROC, 90, -1}, {91, 1, 1, 91, MAIN_CORE_PROC, 91, -1}, + {92, 1, 1, 92, MAIN_CORE_PROC, 92, -1}, {93, 1, 1, 93, MAIN_CORE_PROC, 93, -1}, + {94, 1, 1, 94, MAIN_CORE_PROC, 94, -1}, {95, 1, 1, 95, MAIN_CORE_PROC, 95, -1}, + }, {{96, 48, 0, 48, -1, -1}, {48, 24, 0, 24, 0, 0}, {48, 24, 0, 24, 1, 1}}, ov::hint::SchedulingCoreType::ANY_CORE, false, @@ -566,9 +1229,60 @@ StreamGenerateionTestCase generation_tput_2sockets_48cores_7 = { false, true, false, + false, true, ov::hint::PerformanceMode::THROUGHPUT, {}, + { + {0, 0, 0, 0, HYPER_THREADING_PROC, 0, -1}, {1, 0, 0, 1, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 2, HYPER_THREADING_PROC, 2, -1}, {3, 0, 0, 3, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 4, HYPER_THREADING_PROC, 4, -1}, {5, 0, 0, 5, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 6, HYPER_THREADING_PROC, 6, -1}, {7, 0, 0, 7, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 8, HYPER_THREADING_PROC, 8, -1}, {9, 0, 0, 9, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 10, HYPER_THREADING_PROC, 10, -1}, {11, 0, 0, 11, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 12, HYPER_THREADING_PROC, 12, -1}, {13, 0, 0, 13, HYPER_THREADING_PROC, 13, -1}, + {14, 0, 0, 14, HYPER_THREADING_PROC, 14, -1}, {15, 0, 0, 15, HYPER_THREADING_PROC, 15, -1}, + {16, 0, 0, 16, HYPER_THREADING_PROC, 16, -1}, {17, 0, 0, 17, HYPER_THREADING_PROC, 17, -1}, + {18, 0, 0, 18, HYPER_THREADING_PROC, 18, -1}, {19, 0, 0, 19, HYPER_THREADING_PROC, 19, -1}, + {20, 0, 0, 20, HYPER_THREADING_PROC, 20, -1}, {21, 0, 0, 21, HYPER_THREADING_PROC, 21, -1}, + {22, 0, 0, 22, HYPER_THREADING_PROC, 22, -1}, {23, 0, 0, 23, HYPER_THREADING_PROC, 23, -1}, + {24, 1, 1, 24, HYPER_THREADING_PROC, 24, -1}, {25, 1, 1, 25, HYPER_THREADING_PROC, 25, -1}, + {26, 1, 1, 26, HYPER_THREADING_PROC, 26, -1}, {27, 1, 1, 27, HYPER_THREADING_PROC, 27, -1}, + {28, 1, 1, 28, HYPER_THREADING_PROC, 28, -1}, {29, 1, 1, 29, HYPER_THREADING_PROC, 29, -1}, + {30, 1, 1, 30, HYPER_THREADING_PROC, 30, -1}, {31, 1, 1, 31, HYPER_THREADING_PROC, 31, -1}, + {32, 1, 1, 32, HYPER_THREADING_PROC, 32, -1}, {33, 1, 1, 33, HYPER_THREADING_PROC, 33, -1}, + {34, 1, 1, 34, HYPER_THREADING_PROC, 34, -1}, {35, 1, 1, 35, HYPER_THREADING_PROC, 35, -1}, + {36, 1, 1, 36, HYPER_THREADING_PROC, 36, -1}, {37, 1, 1, 37, HYPER_THREADING_PROC, 37, -1}, + {38, 1, 1, 38, HYPER_THREADING_PROC, 38, -1}, {39, 1, 1, 39, HYPER_THREADING_PROC, 39, -1}, + {40, 1, 1, 40, HYPER_THREADING_PROC, 40, -1}, {41, 1, 1, 41, HYPER_THREADING_PROC, 41, -1}, + {42, 1, 1, 42, HYPER_THREADING_PROC, 42, -1}, {43, 1, 1, 43, HYPER_THREADING_PROC, 43, -1}, + {44, 1, 1, 44, HYPER_THREADING_PROC, 44, -1}, {45, 1, 1, 45, HYPER_THREADING_PROC, 45, -1}, + {46, 1, 1, 46, HYPER_THREADING_PROC, 46, -1}, {47, 1, 1, 47, HYPER_THREADING_PROC, 47, -1}, + {48, 0, 0, 48, MAIN_CORE_PROC, 48, -1}, {49, 0, 0, 49, MAIN_CORE_PROC, 49, -1}, + {50, 0, 0, 50, MAIN_CORE_PROC, 50, -1}, {51, 0, 0, 51, MAIN_CORE_PROC, 51, -1}, + {52, 0, 0, 52, MAIN_CORE_PROC, 52, -1}, {53, 0, 0, 53, MAIN_CORE_PROC, 53, -1}, + {54, 0, 0, 54, MAIN_CORE_PROC, 54, -1}, {55, 0, 0, 55, MAIN_CORE_PROC, 55, -1}, + {56, 0, 0, 56, MAIN_CORE_PROC, 56, -1}, {57, 0, 0, 57, MAIN_CORE_PROC, 57, -1}, + {58, 0, 0, 58, MAIN_CORE_PROC, 58, -1}, {59, 0, 0, 59, MAIN_CORE_PROC, 59, -1}, + {60, 0, 0, 60, MAIN_CORE_PROC, 60, -1}, {61, 0, 0, 61, MAIN_CORE_PROC, 61, -1}, + {62, 0, 0, 62, MAIN_CORE_PROC, 62, -1}, {63, 0, 0, 63, MAIN_CORE_PROC, 63, -1}, + {64, 0, 0, 64, MAIN_CORE_PROC, 64, -1}, {65, 0, 0, 65, MAIN_CORE_PROC, 65, -1}, + {66, 0, 0, 66, MAIN_CORE_PROC, 66, -1}, {67, 0, 0, 67, MAIN_CORE_PROC, 67, -1}, + {68, 0, 0, 68, MAIN_CORE_PROC, 68, -1}, {69, 0, 0, 69, MAIN_CORE_PROC, 69, -1}, + {70, 0, 0, 70, MAIN_CORE_PROC, 70, -1}, {71, 0, 0, 71, MAIN_CORE_PROC, 71, -1}, + {72, 1, 1, 72, MAIN_CORE_PROC, 72, -1}, {73, 1, 1, 73, MAIN_CORE_PROC, 73, -1}, + {74, 1, 1, 74, MAIN_CORE_PROC, 74, -1}, {75, 1, 1, 75, MAIN_CORE_PROC, 75, -1}, + {76, 1, 1, 76, MAIN_CORE_PROC, 76, -1}, {77, 1, 1, 77, MAIN_CORE_PROC, 77, -1}, + {78, 1, 1, 78, MAIN_CORE_PROC, 78, -1}, {79, 1, 1, 79, MAIN_CORE_PROC, 79, -1}, + {80, 1, 1, 80, MAIN_CORE_PROC, 80, -1}, {81, 1, 1, 81, MAIN_CORE_PROC, 81, -1}, + {82, 1, 1, 82, MAIN_CORE_PROC, 82, -1}, {83, 1, 1, 83, MAIN_CORE_PROC, 83, -1}, + {84, 1, 1, 84, MAIN_CORE_PROC, 84, -1}, {85, 1, 1, 85, MAIN_CORE_PROC, 85, -1}, + {86, 1, 1, 86, MAIN_CORE_PROC, 86, -1}, {87, 1, 1, 87, MAIN_CORE_PROC, 87, -1}, + {88, 1, 1, 88, MAIN_CORE_PROC, 88, -1}, {89, 1, 1, 89, MAIN_CORE_PROC, 89, -1}, + {90, 1, 1, 90, MAIN_CORE_PROC, 90, -1}, {91, 1, 1, 91, MAIN_CORE_PROC, 91, -1}, + {92, 1, 1, 92, MAIN_CORE_PROC, 92, -1}, {93, 1, 1, 93, MAIN_CORE_PROC, 93, -1}, + {94, 1, 1, 94, MAIN_CORE_PROC, 94, -1}, {95, 1, 1, 95, MAIN_CORE_PROC, 95, -1}, + }, {{96, 48, 0, 48, -1, -1}, {48, 24, 0, 24, 0, 0}, {48, 24, 0, 24, 1, 1}}, ov::hint::SchedulingCoreType::ANY_CORE, false, @@ -589,9 +1303,134 @@ StreamGenerateionTestCase generation_tput_2sockets_48cores_8 = { false, true, false, + false, true, ov::hint::PerformanceMode::THROUGHPUT, {}, + { + {0, 0, 0, 0, HYPER_THREADING_PROC, 0, -1}, {1, 0, 0, 1, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 2, HYPER_THREADING_PROC, 2, -1}, {3, 0, 0, 3, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 4, HYPER_THREADING_PROC, 4, -1}, {5, 0, 0, 5, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 6, HYPER_THREADING_PROC, 6, -1}, {7, 0, 0, 7, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 8, HYPER_THREADING_PROC, 8, -1}, {9, 0, 0, 9, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 10, HYPER_THREADING_PROC, 10, -1}, {11, 0, 0, 11, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 12, HYPER_THREADING_PROC, 12, -1}, {13, 0, 0, 13, HYPER_THREADING_PROC, 13, -1}, + {14, 0, 0, 14, HYPER_THREADING_PROC, 14, -1}, {15, 0, 0, 15, HYPER_THREADING_PROC, 15, -1}, + {16, 0, 0, 16, HYPER_THREADING_PROC, 16, -1}, {17, 0, 0, 17, HYPER_THREADING_PROC, 17, -1}, + {18, 0, 0, 18, HYPER_THREADING_PROC, 18, -1}, {19, 0, 0, 19, HYPER_THREADING_PROC, 19, -1}, + {20, 0, 0, 20, HYPER_THREADING_PROC, 20, -1}, {21, 0, 0, 21, HYPER_THREADING_PROC, 21, -1}, + {22, 0, 0, 22, HYPER_THREADING_PROC, 22, -1}, {23, 0, 0, 23, HYPER_THREADING_PROC, 23, -1}, + {24, 1, 1, 24, HYPER_THREADING_PROC, 24, -1}, {25, 1, 1, 25, HYPER_THREADING_PROC, 25, -1}, + {26, 1, 1, 26, HYPER_THREADING_PROC, 26, -1}, {27, 1, 1, 27, HYPER_THREADING_PROC, 27, -1}, + {28, 1, 1, 28, HYPER_THREADING_PROC, 28, -1}, {29, 1, 1, 29, HYPER_THREADING_PROC, 29, -1}, + {30, 1, 1, 30, HYPER_THREADING_PROC, 30, -1}, {31, 1, 1, 31, HYPER_THREADING_PROC, 31, -1}, + {32, 1, 1, 32, HYPER_THREADING_PROC, 32, -1}, {33, 1, 1, 33, HYPER_THREADING_PROC, 33, -1}, + {34, 1, 1, 34, HYPER_THREADING_PROC, 34, -1}, {35, 1, 1, 35, HYPER_THREADING_PROC, 35, -1}, + {36, 1, 1, 36, HYPER_THREADING_PROC, 36, -1}, {37, 1, 1, 37, HYPER_THREADING_PROC, 37, -1}, + {38, 1, 1, 38, HYPER_THREADING_PROC, 38, -1}, {39, 1, 1, 39, HYPER_THREADING_PROC, 39, -1}, + {40, 1, 1, 40, HYPER_THREADING_PROC, 40, -1}, {41, 1, 1, 41, HYPER_THREADING_PROC, 41, -1}, + {42, 1, 1, 42, HYPER_THREADING_PROC, 42, -1}, {43, 1, 1, 43, HYPER_THREADING_PROC, 43, -1}, + {44, 1, 1, 44, HYPER_THREADING_PROC, 44, -1}, {45, 1, 1, 45, HYPER_THREADING_PROC, 45, -1}, + {46, 1, 1, 46, HYPER_THREADING_PROC, 46, -1}, {47, 1, 1, 47, HYPER_THREADING_PROC, 47, -1}, + {48, 0, 0, 48, MAIN_CORE_PROC, 48, -1}, {49, 0, 0, 49, MAIN_CORE_PROC, 49, -1}, + {50, 0, 0, 50, MAIN_CORE_PROC, 50, -1}, {51, 0, 0, 51, MAIN_CORE_PROC, 51, -1}, + {52, 0, 0, 52, MAIN_CORE_PROC, 52, -1}, {53, 0, 0, 53, MAIN_CORE_PROC, 53, -1}, + {54, 0, 0, 54, MAIN_CORE_PROC, 54, -1}, {55, 0, 0, 55, MAIN_CORE_PROC, 55, -1}, + {56, 0, 0, 56, MAIN_CORE_PROC, 56, -1}, {57, 0, 0, 57, MAIN_CORE_PROC, 57, -1}, + {58, 0, 0, 58, MAIN_CORE_PROC, 58, -1}, {59, 0, 0, 59, MAIN_CORE_PROC, 59, -1}, + {60, 0, 0, 60, MAIN_CORE_PROC, 60, -1}, {61, 0, 0, 61, MAIN_CORE_PROC, 61, -1}, + {62, 0, 0, 62, MAIN_CORE_PROC, 62, -1}, {63, 0, 0, 63, MAIN_CORE_PROC, 63, -1}, + {64, 0, 0, 64, MAIN_CORE_PROC, 64, -1}, {65, 0, 0, 65, MAIN_CORE_PROC, 65, -1}, + {66, 0, 0, 66, MAIN_CORE_PROC, 66, -1}, {67, 0, 0, 67, MAIN_CORE_PROC, 67, -1}, + {68, 0, 0, 68, MAIN_CORE_PROC, 68, -1}, {69, 0, 0, 69, MAIN_CORE_PROC, 69, -1}, + {70, 0, 0, 70, MAIN_CORE_PROC, 70, -1}, {71, 0, 0, 71, MAIN_CORE_PROC, 71, -1}, + {72, 1, 1, 72, MAIN_CORE_PROC, 72, -1}, {73, 1, 1, 73, MAIN_CORE_PROC, 73, -1}, + {74, 1, 1, 74, MAIN_CORE_PROC, 74, -1}, {75, 1, 1, 75, MAIN_CORE_PROC, 75, -1}, + {76, 1, 1, 76, MAIN_CORE_PROC, 76, -1}, {77, 1, 1, 77, MAIN_CORE_PROC, 77, -1}, + {78, 1, 1, 78, MAIN_CORE_PROC, 78, -1}, {79, 1, 1, 79, MAIN_CORE_PROC, 79, -1}, + {80, 1, 1, 80, MAIN_CORE_PROC, 80, -1}, {81, 1, 1, 81, MAIN_CORE_PROC, 81, -1}, + {82, 1, 1, 82, MAIN_CORE_PROC, 82, -1}, {83, 1, 1, 83, MAIN_CORE_PROC, 83, -1}, + {84, 1, 1, 84, MAIN_CORE_PROC, 84, -1}, {85, 1, 1, 85, MAIN_CORE_PROC, 85, -1}, + {86, 1, 1, 86, MAIN_CORE_PROC, 86, -1}, {87, 1, 1, 87, MAIN_CORE_PROC, 87, -1}, + {88, 1, 1, 88, MAIN_CORE_PROC, 88, -1}, {89, 1, 1, 89, MAIN_CORE_PROC, 89, -1}, + {90, 1, 1, 90, MAIN_CORE_PROC, 90, -1}, {91, 1, 1, 91, MAIN_CORE_PROC, 91, -1}, + {92, 1, 1, 92, MAIN_CORE_PROC, 92, -1}, {93, 1, 1, 93, MAIN_CORE_PROC, 93, -1}, + {94, 1, 1, 94, MAIN_CORE_PROC, 94, -1}, {95, 1, 1, 95, MAIN_CORE_PROC, 95, -1}, + }, + {{96, 48, 0, 48, -1, -1}, {48, 24, 0, 24, 0, 0}, {48, 24, 0, 24, 1, 1}}, + ov::hint::SchedulingCoreType::ANY_CORE, + false, + false, + ov::hint::PerformanceMode::THROUGHPUT, + {{48, 48, 0, 0, -1, -1}, {24, 24, 0, 0, 0, 0}, {24, 24, 0, 0, 1, 1}}, + {{2, MAIN_CORE_PROC, 10, 0, 0}}, +}; + +StreamGenerateionTestCase generation_tput_2sockets_48cores_8_reservation = { + 2, + true, + 20, + 0, + 1, + 0, + ov::hint::SchedulingCoreType::ANY_CORE, + false, + true, + true, + false, + true, + ov::hint::PerformanceMode::THROUGHPUT, + {}, + { + {0, 0, 0, 0, HYPER_THREADING_PROC, 0, -1}, {1, 0, 0, 1, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 2, HYPER_THREADING_PROC, 2, -1}, {3, 0, 0, 3, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 4, HYPER_THREADING_PROC, 4, -1}, {5, 0, 0, 5, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 6, HYPER_THREADING_PROC, 6, -1}, {7, 0, 0, 7, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 8, HYPER_THREADING_PROC, 8, -1}, {9, 0, 0, 9, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 10, HYPER_THREADING_PROC, 10, -1}, {11, 0, 0, 11, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 12, HYPER_THREADING_PROC, 12, -1}, {13, 0, 0, 13, HYPER_THREADING_PROC, 13, -1}, + {14, 0, 0, 14, HYPER_THREADING_PROC, 14, -1}, {15, 0, 0, 15, HYPER_THREADING_PROC, 15, -1}, + {16, 0, 0, 16, HYPER_THREADING_PROC, 16, -1}, {17, 0, 0, 17, HYPER_THREADING_PROC, 17, -1}, + {18, 0, 0, 18, HYPER_THREADING_PROC, 18, -1}, {19, 0, 0, 19, HYPER_THREADING_PROC, 19, -1}, + {20, 0, 0, 20, HYPER_THREADING_PROC, 20, -1}, {21, 0, 0, 21, HYPER_THREADING_PROC, 21, -1}, + {22, 0, 0, 22, HYPER_THREADING_PROC, 22, -1}, {23, 0, 0, 23, HYPER_THREADING_PROC, 23, -1}, + {24, 1, 1, 24, HYPER_THREADING_PROC, 24, -1}, {25, 1, 1, 25, HYPER_THREADING_PROC, 25, -1}, + {26, 1, 1, 26, HYPER_THREADING_PROC, 26, -1}, {27, 1, 1, 27, HYPER_THREADING_PROC, 27, -1}, + {28, 1, 1, 28, HYPER_THREADING_PROC, 28, -1}, {29, 1, 1, 29, HYPER_THREADING_PROC, 29, -1}, + {30, 1, 1, 30, HYPER_THREADING_PROC, 30, -1}, {31, 1, 1, 31, HYPER_THREADING_PROC, 31, -1}, + {32, 1, 1, 32, HYPER_THREADING_PROC, 32, -1}, {33, 1, 1, 33, HYPER_THREADING_PROC, 33, -1}, + {34, 1, 1, 34, HYPER_THREADING_PROC, 34, -1}, {35, 1, 1, 35, HYPER_THREADING_PROC, 35, -1}, + {36, 1, 1, 36, HYPER_THREADING_PROC, 36, -1}, {37, 1, 1, 37, HYPER_THREADING_PROC, 37, -1}, + {38, 1, 1, 38, HYPER_THREADING_PROC, 38, -1}, {39, 1, 1, 39, HYPER_THREADING_PROC, 39, -1}, + {40, 1, 1, 40, HYPER_THREADING_PROC, 40, -1}, {41, 1, 1, 41, HYPER_THREADING_PROC, 41, -1}, + {42, 1, 1, 42, HYPER_THREADING_PROC, 42, -1}, {43, 1, 1, 43, HYPER_THREADING_PROC, 43, -1}, + {44, 1, 1, 44, HYPER_THREADING_PROC, 44, -1}, {45, 1, 1, 45, HYPER_THREADING_PROC, 45, -1}, + {46, 1, 1, 46, HYPER_THREADING_PROC, 46, -1}, {47, 1, 1, 47, HYPER_THREADING_PROC, 47, -1}, + {48, 0, 0, 48, MAIN_CORE_PROC, 48, -1}, {49, 0, 0, 49, MAIN_CORE_PROC, 49, -1}, + {50, 0, 0, 50, MAIN_CORE_PROC, 50, -1}, {51, 0, 0, 51, MAIN_CORE_PROC, 51, -1}, + {52, 0, 0, 52, MAIN_CORE_PROC, 52, -1}, {53, 0, 0, 53, MAIN_CORE_PROC, 53, -1}, + {54, 0, 0, 54, MAIN_CORE_PROC, 54, -1}, {55, 0, 0, 55, MAIN_CORE_PROC, 55, -1}, + {56, 0, 0, 56, MAIN_CORE_PROC, 56, -1}, {57, 0, 0, 57, MAIN_CORE_PROC, 57, -1}, + {58, 0, 0, 58, MAIN_CORE_PROC, 58, -1}, {59, 0, 0, 59, MAIN_CORE_PROC, 59, -1}, + {60, 0, 0, 60, MAIN_CORE_PROC, 60, -1}, {61, 0, 0, 61, MAIN_CORE_PROC, 61, -1}, + {62, 0, 0, 62, MAIN_CORE_PROC, 62, -1}, {63, 0, 0, 63, MAIN_CORE_PROC, 63, -1}, + {64, 0, 0, 64, MAIN_CORE_PROC, 64, -1}, {65, 0, 0, 65, MAIN_CORE_PROC, 65, -1}, + {66, 0, 0, 66, MAIN_CORE_PROC, 66, -1}, {67, 0, 0, 67, MAIN_CORE_PROC, 67, -1}, + {68, 0, 0, 68, MAIN_CORE_PROC, 68, -1}, {69, 0, 0, 69, MAIN_CORE_PROC, 69, -1}, + {70, 0, 0, 70, MAIN_CORE_PROC, 70, -1}, {71, 0, 0, 71, MAIN_CORE_PROC, 71, -1}, + {72, 1, 1, 72, MAIN_CORE_PROC, 72, -1}, {73, 1, 1, 73, MAIN_CORE_PROC, 73, -1}, + {74, 1, 1, 74, MAIN_CORE_PROC, 74, -1}, {75, 1, 1, 75, MAIN_CORE_PROC, 75, -1}, + {76, 1, 1, 76, MAIN_CORE_PROC, 76, -1}, {77, 1, 1, 77, MAIN_CORE_PROC, 77, -1}, + {78, 1, 1, 78, MAIN_CORE_PROC, 78, -1}, {79, 1, 1, 79, MAIN_CORE_PROC, 79, -1}, + {80, 1, 1, 80, MAIN_CORE_PROC, 80, -1}, {81, 1, 1, 81, MAIN_CORE_PROC, 81, -1}, + {82, 1, 1, 82, MAIN_CORE_PROC, 82, -1}, {83, 1, 1, 83, MAIN_CORE_PROC, 83, -1}, + {84, 1, 1, 84, MAIN_CORE_PROC, 84, -1}, {85, 1, 1, 85, MAIN_CORE_PROC, 85, -1}, + {86, 1, 1, 86, MAIN_CORE_PROC, 86, -1}, {87, 1, 1, 87, MAIN_CORE_PROC, 87, -1}, + {88, 1, 1, 88, MAIN_CORE_PROC, 88, -1}, {89, 1, 1, 89, MAIN_CORE_PROC, 89, -1}, + {90, 1, 1, 90, MAIN_CORE_PROC, 90, -1}, {91, 1, 1, 91, MAIN_CORE_PROC, 91, -1}, + {92, 1, 1, 92, MAIN_CORE_PROC, 92, -1}, {93, 1, 1, 93, MAIN_CORE_PROC, 93, -1}, + {94, 1, 1, 94, MAIN_CORE_PROC, 94, -1}, {95, 1, 1, 95, MAIN_CORE_PROC, 95, -1}, + }, {{96, 48, 0, 48, -1, -1}, {48, 24, 0, 24, 0, 0}, {48, 24, 0, 24, 1, 1}}, ov::hint::SchedulingCoreType::ANY_CORE, false, @@ -612,9 +1451,60 @@ StreamGenerateionTestCase generation_tput_2sockets_48cores_9 = { true, false, false, + false, true, ov::hint::PerformanceMode::THROUGHPUT, {}, + { + {0, 0, 0, 0, HYPER_THREADING_PROC, 0, -1}, {1, 0, 0, 1, HYPER_THREADING_PROC, 1, -1}, + {2, 0, 0, 2, HYPER_THREADING_PROC, 2, -1}, {3, 0, 0, 3, HYPER_THREADING_PROC, 3, -1}, + {4, 0, 0, 4, HYPER_THREADING_PROC, 4, -1}, {5, 0, 0, 5, HYPER_THREADING_PROC, 5, -1}, + {6, 0, 0, 6, HYPER_THREADING_PROC, 6, -1}, {7, 0, 0, 7, HYPER_THREADING_PROC, 7, -1}, + {8, 0, 0, 8, HYPER_THREADING_PROC, 8, -1}, {9, 0, 0, 9, HYPER_THREADING_PROC, 9, -1}, + {10, 0, 0, 10, HYPER_THREADING_PROC, 10, -1}, {11, 0, 0, 11, HYPER_THREADING_PROC, 11, -1}, + {12, 0, 0, 12, HYPER_THREADING_PROC, 12, -1}, {13, 0, 0, 13, HYPER_THREADING_PROC, 13, -1}, + {14, 0, 0, 14, HYPER_THREADING_PROC, 14, -1}, {15, 0, 0, 15, HYPER_THREADING_PROC, 15, -1}, + {16, 0, 0, 16, HYPER_THREADING_PROC, 16, -1}, {17, 0, 0, 17, HYPER_THREADING_PROC, 17, -1}, + {18, 0, 0, 18, HYPER_THREADING_PROC, 18, -1}, {19, 0, 0, 19, HYPER_THREADING_PROC, 19, -1}, + {20, 0, 0, 20, HYPER_THREADING_PROC, 20, -1}, {21, 0, 0, 21, HYPER_THREADING_PROC, 21, -1}, + {22, 0, 0, 22, HYPER_THREADING_PROC, 22, -1}, {23, 0, 0, 23, HYPER_THREADING_PROC, 23, -1}, + {24, 1, 1, 24, HYPER_THREADING_PROC, 24, -1}, {25, 1, 1, 25, HYPER_THREADING_PROC, 25, -1}, + {26, 1, 1, 26, HYPER_THREADING_PROC, 26, -1}, {27, 1, 1, 27, HYPER_THREADING_PROC, 27, -1}, + {28, 1, 1, 28, HYPER_THREADING_PROC, 28, -1}, {29, 1, 1, 29, HYPER_THREADING_PROC, 29, -1}, + {30, 1, 1, 30, HYPER_THREADING_PROC, 30, -1}, {31, 1, 1, 31, HYPER_THREADING_PROC, 31, -1}, + {32, 1, 1, 32, HYPER_THREADING_PROC, 32, -1}, {33, 1, 1, 33, HYPER_THREADING_PROC, 33, -1}, + {34, 1, 1, 34, HYPER_THREADING_PROC, 34, -1}, {35, 1, 1, 35, HYPER_THREADING_PROC, 35, -1}, + {36, 1, 1, 36, HYPER_THREADING_PROC, 36, -1}, {37, 1, 1, 37, HYPER_THREADING_PROC, 37, -1}, + {38, 1, 1, 38, HYPER_THREADING_PROC, 38, -1}, {39, 1, 1, 39, HYPER_THREADING_PROC, 39, -1}, + {40, 1, 1, 40, HYPER_THREADING_PROC, 40, -1}, {41, 1, 1, 41, HYPER_THREADING_PROC, 41, -1}, + {42, 1, 1, 42, HYPER_THREADING_PROC, 42, -1}, {43, 1, 1, 43, HYPER_THREADING_PROC, 43, -1}, + {44, 1, 1, 44, HYPER_THREADING_PROC, 44, -1}, {45, 1, 1, 45, HYPER_THREADING_PROC, 45, -1}, + {46, 1, 1, 46, HYPER_THREADING_PROC, 46, -1}, {47, 1, 1, 47, HYPER_THREADING_PROC, 47, -1}, + {48, 0, 0, 48, MAIN_CORE_PROC, 48, -1}, {49, 0, 0, 49, MAIN_CORE_PROC, 49, -1}, + {50, 0, 0, 50, MAIN_CORE_PROC, 50, -1}, {51, 0, 0, 51, MAIN_CORE_PROC, 51, -1}, + {52, 0, 0, 52, MAIN_CORE_PROC, 52, -1}, {53, 0, 0, 53, MAIN_CORE_PROC, 53, -1}, + {54, 0, 0, 54, MAIN_CORE_PROC, 54, -1}, {55, 0, 0, 55, MAIN_CORE_PROC, 55, -1}, + {56, 0, 0, 56, MAIN_CORE_PROC, 56, -1}, {57, 0, 0, 57, MAIN_CORE_PROC, 57, -1}, + {58, 0, 0, 58, MAIN_CORE_PROC, 58, -1}, {59, 0, 0, 59, MAIN_CORE_PROC, 59, -1}, + {60, 0, 0, 60, MAIN_CORE_PROC, 60, -1}, {61, 0, 0, 61, MAIN_CORE_PROC, 61, -1}, + {62, 0, 0, 62, MAIN_CORE_PROC, 62, -1}, {63, 0, 0, 63, MAIN_CORE_PROC, 63, -1}, + {64, 0, 0, 64, MAIN_CORE_PROC, 64, -1}, {65, 0, 0, 65, MAIN_CORE_PROC, 65, -1}, + {66, 0, 0, 66, MAIN_CORE_PROC, 66, -1}, {67, 0, 0, 67, MAIN_CORE_PROC, 67, -1}, + {68, 0, 0, 68, MAIN_CORE_PROC, 68, -1}, {69, 0, 0, 69, MAIN_CORE_PROC, 69, -1}, + {70, 0, 0, 70, MAIN_CORE_PROC, 70, -1}, {71, 0, 0, 71, MAIN_CORE_PROC, 71, -1}, + {72, 1, 1, 72, MAIN_CORE_PROC, 72, -1}, {73, 1, 1, 73, MAIN_CORE_PROC, 73, -1}, + {74, 1, 1, 74, MAIN_CORE_PROC, 74, -1}, {75, 1, 1, 75, MAIN_CORE_PROC, 75, -1}, + {76, 1, 1, 76, MAIN_CORE_PROC, 76, -1}, {77, 1, 1, 77, MAIN_CORE_PROC, 77, -1}, + {78, 1, 1, 78, MAIN_CORE_PROC, 78, -1}, {79, 1, 1, 79, MAIN_CORE_PROC, 79, -1}, + {80, 1, 1, 80, MAIN_CORE_PROC, 80, -1}, {81, 1, 1, 81, MAIN_CORE_PROC, 81, -1}, + {82, 1, 1, 82, MAIN_CORE_PROC, 82, -1}, {83, 1, 1, 83, MAIN_CORE_PROC, 83, -1}, + {84, 1, 1, 84, MAIN_CORE_PROC, 84, -1}, {85, 1, 1, 85, MAIN_CORE_PROC, 85, -1}, + {86, 1, 1, 86, MAIN_CORE_PROC, 86, -1}, {87, 1, 1, 87, MAIN_CORE_PROC, 87, -1}, + {88, 1, 1, 88, MAIN_CORE_PROC, 88, -1}, {89, 1, 1, 89, MAIN_CORE_PROC, 89, -1}, + {90, 1, 1, 90, MAIN_CORE_PROC, 90, -1}, {91, 1, 1, 91, MAIN_CORE_PROC, 91, -1}, + {92, 1, 1, 92, MAIN_CORE_PROC, 92, -1}, {93, 1, 1, 93, MAIN_CORE_PROC, 93, -1}, + {94, 1, 1, 94, MAIN_CORE_PROC, 94, -1}, {95, 1, 1, 95, MAIN_CORE_PROC, 95, -1}, + }, {{96, 48, 0, 48, -1, -1}, {48, 24, 0, 24, 0, 0}, {48, 24, 0, 24, 1, 1}}, ov::hint::SchedulingCoreType::ANY_CORE, false, @@ -633,10 +1523,61 @@ StreamGenerateionTestCase generation_latency_1sockets_96cores_pinning = { ov::hint::SchedulingCoreType::ANY_CORE, false, false, + false, true, true, ov::hint::PerformanceMode::LATENCY, {}, + { + {0, 0, 0, 0, EFFICIENT_CORE_PROC, 0, -1}, {1, 0, 0, 1, EFFICIENT_CORE_PROC, 1, -1}, + {2, 0, 0, 2, EFFICIENT_CORE_PROC, 2, -1}, {3, 0, 0, 3, EFFICIENT_CORE_PROC, 3, -1}, + {4, 0, 0, 4, EFFICIENT_CORE_PROC, 4, -1}, {5, 0, 0, 5, EFFICIENT_CORE_PROC, 5, -1}, + {6, 0, 0, 6, EFFICIENT_CORE_PROC, 6, -1}, {7, 0, 0, 7, EFFICIENT_CORE_PROC, 7, -1}, + {8, 0, 0, 8, EFFICIENT_CORE_PROC, 8, -1}, {9, 0, 0, 9, EFFICIENT_CORE_PROC, 9, -1}, + {10, 0, 0, 10, EFFICIENT_CORE_PROC, 10, -1}, {11, 0, 0, 11, EFFICIENT_CORE_PROC, 11, -1}, + {12, 0, 0, 12, EFFICIENT_CORE_PROC, 12, -1}, {13, 0, 0, 13, EFFICIENT_CORE_PROC, 13, -1}, + {14, 0, 0, 14, EFFICIENT_CORE_PROC, 14, -1}, {15, 0, 0, 15, EFFICIENT_CORE_PROC, 15, -1}, + {16, 0, 0, 16, EFFICIENT_CORE_PROC, 16, -1}, {17, 0, 0, 17, EFFICIENT_CORE_PROC, 17, -1}, + {18, 0, 0, 18, EFFICIENT_CORE_PROC, 18, -1}, {19, 0, 0, 19, EFFICIENT_CORE_PROC, 19, -1}, + {20, 0, 0, 20, EFFICIENT_CORE_PROC, 20, -1}, {21, 0, 0, 21, EFFICIENT_CORE_PROC, 21, -1}, + {22, 0, 0, 22, EFFICIENT_CORE_PROC, 22, -1}, {23, 0, 0, 23, EFFICIENT_CORE_PROC, 23, -1}, + {24, 0, 0, 24, EFFICIENT_CORE_PROC, 24, -1}, {25, 0, 0, 25, EFFICIENT_CORE_PROC, 25, -1}, + {26, 0, 0, 26, EFFICIENT_CORE_PROC, 26, -1}, {27, 0, 0, 27, EFFICIENT_CORE_PROC, 27, -1}, + {28, 0, 0, 28, EFFICIENT_CORE_PROC, 28, -1}, {29, 0, 0, 29, EFFICIENT_CORE_PROC, 29, -1}, + {30, 0, 0, 30, EFFICIENT_CORE_PROC, 30, -1}, {31, 0, 0, 31, EFFICIENT_CORE_PROC, 31, -1}, + {32, 0, 0, 32, EFFICIENT_CORE_PROC, 32, -1}, {33, 0, 0, 33, EFFICIENT_CORE_PROC, 33, -1}, + {34, 0, 0, 34, EFFICIENT_CORE_PROC, 34, -1}, {35, 0, 0, 35, EFFICIENT_CORE_PROC, 35, -1}, + {36, 0, 0, 36, EFFICIENT_CORE_PROC, 36, -1}, {37, 0, 0, 37, EFFICIENT_CORE_PROC, 37, -1}, + {38, 0, 0, 38, EFFICIENT_CORE_PROC, 38, -1}, {39, 0, 0, 39, EFFICIENT_CORE_PROC, 39, -1}, + {40, 0, 0, 40, EFFICIENT_CORE_PROC, 40, -1}, {41, 0, 0, 41, EFFICIENT_CORE_PROC, 41, -1}, + {42, 0, 0, 42, EFFICIENT_CORE_PROC, 42, -1}, {43, 0, 0, 43, EFFICIENT_CORE_PROC, 43, -1}, + {44, 0, 0, 44, EFFICIENT_CORE_PROC, 44, -1}, {45, 0, 0, 45, EFFICIENT_CORE_PROC, 45, -1}, + {46, 0, 0, 46, EFFICIENT_CORE_PROC, 46, -1}, {47, 0, 0, 47, EFFICIENT_CORE_PROC, 47, -1}, + {48, 0, 0, 48, EFFICIENT_CORE_PROC, 48, -1}, {49, 0, 0, 49, EFFICIENT_CORE_PROC, 49, -1}, + {50, 0, 0, 50, EFFICIENT_CORE_PROC, 50, -1}, {51, 0, 0, 51, EFFICIENT_CORE_PROC, 51, -1}, + {52, 0, 0, 52, EFFICIENT_CORE_PROC, 52, -1}, {53, 0, 0, 53, EFFICIENT_CORE_PROC, 53, -1}, + {54, 0, 0, 54, EFFICIENT_CORE_PROC, 54, -1}, {55, 0, 0, 55, EFFICIENT_CORE_PROC, 55, -1}, + {56, 0, 0, 56, EFFICIENT_CORE_PROC, 56, -1}, {57, 0, 0, 57, EFFICIENT_CORE_PROC, 57, -1}, + {58, 0, 0, 58, EFFICIENT_CORE_PROC, 58, -1}, {59, 0, 0, 59, EFFICIENT_CORE_PROC, 59, -1}, + {60, 0, 0, 60, EFFICIENT_CORE_PROC, 60, -1}, {61, 0, 0, 61, EFFICIENT_CORE_PROC, 61, -1}, + {62, 0, 0, 62, EFFICIENT_CORE_PROC, 62, -1}, {63, 0, 0, 63, EFFICIENT_CORE_PROC, 63, -1}, + {64, 0, 0, 64, EFFICIENT_CORE_PROC, 64, -1}, {65, 0, 0, 65, EFFICIENT_CORE_PROC, 65, -1}, + {66, 0, 0, 66, EFFICIENT_CORE_PROC, 66, -1}, {67, 0, 0, 67, EFFICIENT_CORE_PROC, 67, -1}, + {68, 0, 0, 68, EFFICIENT_CORE_PROC, 68, -1}, {69, 0, 0, 69, EFFICIENT_CORE_PROC, 69, -1}, + {70, 0, 0, 70, EFFICIENT_CORE_PROC, 70, -1}, {71, 0, 0, 71, EFFICIENT_CORE_PROC, 71, -1}, + {72, 0, 0, 72, EFFICIENT_CORE_PROC, 72, -1}, {73, 0, 0, 73, EFFICIENT_CORE_PROC, 73, -1}, + {74, 0, 0, 74, EFFICIENT_CORE_PROC, 74, -1}, {75, 0, 0, 75, EFFICIENT_CORE_PROC, 75, -1}, + {76, 0, 0, 76, EFFICIENT_CORE_PROC, 76, -1}, {77, 0, 0, 77, EFFICIENT_CORE_PROC, 77, -1}, + {78, 0, 0, 78, EFFICIENT_CORE_PROC, 78, -1}, {79, 0, 0, 79, EFFICIENT_CORE_PROC, 79, -1}, + {80, 0, 0, 80, EFFICIENT_CORE_PROC, 80, -1}, {81, 0, 0, 81, EFFICIENT_CORE_PROC, 81, -1}, + {82, 0, 0, 82, EFFICIENT_CORE_PROC, 82, -1}, {83, 0, 0, 83, EFFICIENT_CORE_PROC, 83, -1}, + {84, 0, 0, 84, EFFICIENT_CORE_PROC, 84, -1}, {85, 0, 0, 85, EFFICIENT_CORE_PROC, 85, -1}, + {86, 0, 0, 86, EFFICIENT_CORE_PROC, 86, -1}, {87, 0, 0, 87, EFFICIENT_CORE_PROC, 87, -1}, + {88, 0, 0, 88, EFFICIENT_CORE_PROC, 88, -1}, {89, 0, 0, 89, EFFICIENT_CORE_PROC, 89, -1}, + {90, 0, 0, 90, EFFICIENT_CORE_PROC, 90, -1}, {91, 0, 0, 91, EFFICIENT_CORE_PROC, 91, -1}, + {92, 0, 0, 92, EFFICIENT_CORE_PROC, 92, -1}, {93, 0, 0, 93, EFFICIENT_CORE_PROC, 93, -1}, + {94, 0, 0, 94, EFFICIENT_CORE_PROC, 94, -1}, {95, 0, 0, 95, EFFICIENT_CORE_PROC, 95, -1}, + }, {{96, 0, 96, 0, 0, 0}}, ov::hint::SchedulingCoreType::ANY_CORE, false, @@ -655,10 +1596,61 @@ StreamGenerateionTestCase generation_tput_1sockets_96cores_pinning = { ov::hint::SchedulingCoreType::ANY_CORE, false, false, + false, true, true, ov::hint::PerformanceMode::THROUGHPUT, {}, + { + {0, 0, 0, 0, EFFICIENT_CORE_PROC, 0, -1}, {1, 0, 0, 1, EFFICIENT_CORE_PROC, 1, -1}, + {2, 0, 0, 2, EFFICIENT_CORE_PROC, 2, -1}, {3, 0, 0, 3, EFFICIENT_CORE_PROC, 3, -1}, + {4, 0, 0, 4, EFFICIENT_CORE_PROC, 4, -1}, {5, 0, 0, 5, EFFICIENT_CORE_PROC, 5, -1}, + {6, 0, 0, 6, EFFICIENT_CORE_PROC, 6, -1}, {7, 0, 0, 7, EFFICIENT_CORE_PROC, 7, -1}, + {8, 0, 0, 8, EFFICIENT_CORE_PROC, 8, -1}, {9, 0, 0, 9, EFFICIENT_CORE_PROC, 9, -1}, + {10, 0, 0, 10, EFFICIENT_CORE_PROC, 10, -1}, {11, 0, 0, 11, EFFICIENT_CORE_PROC, 11, -1}, + {12, 0, 0, 12, EFFICIENT_CORE_PROC, 12, -1}, {13, 0, 0, 13, EFFICIENT_CORE_PROC, 13, -1}, + {14, 0, 0, 14, EFFICIENT_CORE_PROC, 14, -1}, {15, 0, 0, 15, EFFICIENT_CORE_PROC, 15, -1}, + {16, 0, 0, 16, EFFICIENT_CORE_PROC, 16, -1}, {17, 0, 0, 17, EFFICIENT_CORE_PROC, 17, -1}, + {18, 0, 0, 18, EFFICIENT_CORE_PROC, 18, -1}, {19, 0, 0, 19, EFFICIENT_CORE_PROC, 19, -1}, + {20, 0, 0, 20, EFFICIENT_CORE_PROC, 20, -1}, {21, 0, 0, 21, EFFICIENT_CORE_PROC, 21, -1}, + {22, 0, 0, 22, EFFICIENT_CORE_PROC, 22, -1}, {23, 0, 0, 23, EFFICIENT_CORE_PROC, 23, -1}, + {24, 0, 0, 24, EFFICIENT_CORE_PROC, 24, -1}, {25, 0, 0, 25, EFFICIENT_CORE_PROC, 25, -1}, + {26, 0, 0, 26, EFFICIENT_CORE_PROC, 26, -1}, {27, 0, 0, 27, EFFICIENT_CORE_PROC, 27, -1}, + {28, 0, 0, 28, EFFICIENT_CORE_PROC, 28, -1}, {29, 0, 0, 29, EFFICIENT_CORE_PROC, 29, -1}, + {30, 0, 0, 30, EFFICIENT_CORE_PROC, 30, -1}, {31, 0, 0, 31, EFFICIENT_CORE_PROC, 31, -1}, + {32, 0, 0, 32, EFFICIENT_CORE_PROC, 32, -1}, {33, 0, 0, 33, EFFICIENT_CORE_PROC, 33, -1}, + {34, 0, 0, 34, EFFICIENT_CORE_PROC, 34, -1}, {35, 0, 0, 35, EFFICIENT_CORE_PROC, 35, -1}, + {36, 0, 0, 36, EFFICIENT_CORE_PROC, 36, -1}, {37, 0, 0, 37, EFFICIENT_CORE_PROC, 37, -1}, + {38, 0, 0, 38, EFFICIENT_CORE_PROC, 38, -1}, {39, 0, 0, 39, EFFICIENT_CORE_PROC, 39, -1}, + {40, 0, 0, 40, EFFICIENT_CORE_PROC, 40, -1}, {41, 0, 0, 41, EFFICIENT_CORE_PROC, 41, -1}, + {42, 0, 0, 42, EFFICIENT_CORE_PROC, 42, -1}, {43, 0, 0, 43, EFFICIENT_CORE_PROC, 43, -1}, + {44, 0, 0, 44, EFFICIENT_CORE_PROC, 44, -1}, {45, 0, 0, 45, EFFICIENT_CORE_PROC, 45, -1}, + {46, 0, 0, 46, EFFICIENT_CORE_PROC, 46, -1}, {47, 0, 0, 47, EFFICIENT_CORE_PROC, 47, -1}, + {48, 0, 0, 48, EFFICIENT_CORE_PROC, 48, -1}, {49, 0, 0, 49, EFFICIENT_CORE_PROC, 49, -1}, + {50, 0, 0, 50, EFFICIENT_CORE_PROC, 50, -1}, {51, 0, 0, 51, EFFICIENT_CORE_PROC, 51, -1}, + {52, 0, 0, 52, EFFICIENT_CORE_PROC, 52, -1}, {53, 0, 0, 53, EFFICIENT_CORE_PROC, 53, -1}, + {54, 0, 0, 54, EFFICIENT_CORE_PROC, 54, -1}, {55, 0, 0, 55, EFFICIENT_CORE_PROC, 55, -1}, + {56, 0, 0, 56, EFFICIENT_CORE_PROC, 56, -1}, {57, 0, 0, 57, EFFICIENT_CORE_PROC, 57, -1}, + {58, 0, 0, 58, EFFICIENT_CORE_PROC, 58, -1}, {59, 0, 0, 59, EFFICIENT_CORE_PROC, 59, -1}, + {60, 0, 0, 60, EFFICIENT_CORE_PROC, 60, -1}, {61, 0, 0, 61, EFFICIENT_CORE_PROC, 61, -1}, + {62, 0, 0, 62, EFFICIENT_CORE_PROC, 62, -1}, {63, 0, 0, 63, EFFICIENT_CORE_PROC, 63, -1}, + {64, 0, 0, 64, EFFICIENT_CORE_PROC, 64, -1}, {65, 0, 0, 65, EFFICIENT_CORE_PROC, 65, -1}, + {66, 0, 0, 66, EFFICIENT_CORE_PROC, 66, -1}, {67, 0, 0, 67, EFFICIENT_CORE_PROC, 67, -1}, + {68, 0, 0, 68, EFFICIENT_CORE_PROC, 68, -1}, {69, 0, 0, 69, EFFICIENT_CORE_PROC, 69, -1}, + {70, 0, 0, 70, EFFICIENT_CORE_PROC, 70, -1}, {71, 0, 0, 71, EFFICIENT_CORE_PROC, 71, -1}, + {72, 0, 0, 72, EFFICIENT_CORE_PROC, 72, -1}, {73, 0, 0, 73, EFFICIENT_CORE_PROC, 73, -1}, + {74, 0, 0, 74, EFFICIENT_CORE_PROC, 74, -1}, {75, 0, 0, 75, EFFICIENT_CORE_PROC, 75, -1}, + {76, 0, 0, 76, EFFICIENT_CORE_PROC, 76, -1}, {77, 0, 0, 77, EFFICIENT_CORE_PROC, 77, -1}, + {78, 0, 0, 78, EFFICIENT_CORE_PROC, 78, -1}, {79, 0, 0, 79, EFFICIENT_CORE_PROC, 79, -1}, + {80, 0, 0, 80, EFFICIENT_CORE_PROC, 80, -1}, {81, 0, 0, 81, EFFICIENT_CORE_PROC, 81, -1}, + {82, 0, 0, 82, EFFICIENT_CORE_PROC, 82, -1}, {83, 0, 0, 83, EFFICIENT_CORE_PROC, 83, -1}, + {84, 0, 0, 84, EFFICIENT_CORE_PROC, 84, -1}, {85, 0, 0, 85, EFFICIENT_CORE_PROC, 85, -1}, + {86, 0, 0, 86, EFFICIENT_CORE_PROC, 86, -1}, {87, 0, 0, 87, EFFICIENT_CORE_PROC, 87, -1}, + {88, 0, 0, 88, EFFICIENT_CORE_PROC, 88, -1}, {89, 0, 0, 89, EFFICIENT_CORE_PROC, 89, -1}, + {90, 0, 0, 90, EFFICIENT_CORE_PROC, 90, -1}, {91, 0, 0, 91, EFFICIENT_CORE_PROC, 91, -1}, + {92, 0, 0, 92, EFFICIENT_CORE_PROC, 92, -1}, {93, 0, 0, 93, EFFICIENT_CORE_PROC, 93, -1}, + {94, 0, 0, 94, EFFICIENT_CORE_PROC, 94, -1}, {95, 0, 0, 95, EFFICIENT_CORE_PROC, 95, -1}, + }, {{96, 0, 96, 0, 0, 0}}, ov::hint::SchedulingCoreType::ANY_CORE, false, @@ -677,10 +1669,61 @@ StreamGenerateionTestCase generation_tput_1sockets_96cores_2_pinning = { ov::hint::SchedulingCoreType::PCORE_ONLY, true, true, + false, true, true, ov::hint::PerformanceMode::THROUGHPUT, {}, + { + {0, 0, 0, 0, EFFICIENT_CORE_PROC, 0, -1}, {1, 0, 0, 1, EFFICIENT_CORE_PROC, 1, -1}, + {2, 0, 0, 2, EFFICIENT_CORE_PROC, 2, -1}, {3, 0, 0, 3, EFFICIENT_CORE_PROC, 3, -1}, + {4, 0, 0, 4, EFFICIENT_CORE_PROC, 4, -1}, {5, 0, 0, 5, EFFICIENT_CORE_PROC, 5, -1}, + {6, 0, 0, 6, EFFICIENT_CORE_PROC, 6, -1}, {7, 0, 0, 7, EFFICIENT_CORE_PROC, 7, -1}, + {8, 0, 0, 8, EFFICIENT_CORE_PROC, 8, -1}, {9, 0, 0, 9, EFFICIENT_CORE_PROC, 9, -1}, + {10, 0, 0, 10, EFFICIENT_CORE_PROC, 10, -1}, {11, 0, 0, 11, EFFICIENT_CORE_PROC, 11, -1}, + {12, 0, 0, 12, EFFICIENT_CORE_PROC, 12, -1}, {13, 0, 0, 13, EFFICIENT_CORE_PROC, 13, -1}, + {14, 0, 0, 14, EFFICIENT_CORE_PROC, 14, -1}, {15, 0, 0, 15, EFFICIENT_CORE_PROC, 15, -1}, + {16, 0, 0, 16, EFFICIENT_CORE_PROC, 16, -1}, {17, 0, 0, 17, EFFICIENT_CORE_PROC, 17, -1}, + {18, 0, 0, 18, EFFICIENT_CORE_PROC, 18, -1}, {19, 0, 0, 19, EFFICIENT_CORE_PROC, 19, -1}, + {20, 0, 0, 20, EFFICIENT_CORE_PROC, 20, -1}, {21, 0, 0, 21, EFFICIENT_CORE_PROC, 21, -1}, + {22, 0, 0, 22, EFFICIENT_CORE_PROC, 22, -1}, {23, 0, 0, 23, EFFICIENT_CORE_PROC, 23, -1}, + {24, 0, 0, 24, EFFICIENT_CORE_PROC, 24, -1}, {25, 0, 0, 25, EFFICIENT_CORE_PROC, 25, -1}, + {26, 0, 0, 26, EFFICIENT_CORE_PROC, 26, -1}, {27, 0, 0, 27, EFFICIENT_CORE_PROC, 27, -1}, + {28, 0, 0, 28, EFFICIENT_CORE_PROC, 28, -1}, {29, 0, 0, 29, EFFICIENT_CORE_PROC, 29, -1}, + {30, 0, 0, 30, EFFICIENT_CORE_PROC, 30, -1}, {31, 0, 0, 31, EFFICIENT_CORE_PROC, 31, -1}, + {32, 0, 0, 32, EFFICIENT_CORE_PROC, 32, -1}, {33, 0, 0, 33, EFFICIENT_CORE_PROC, 33, -1}, + {34, 0, 0, 34, EFFICIENT_CORE_PROC, 34, -1}, {35, 0, 0, 35, EFFICIENT_CORE_PROC, 35, -1}, + {36, 0, 0, 36, EFFICIENT_CORE_PROC, 36, -1}, {37, 0, 0, 37, EFFICIENT_CORE_PROC, 37, -1}, + {38, 0, 0, 38, EFFICIENT_CORE_PROC, 38, -1}, {39, 0, 0, 39, EFFICIENT_CORE_PROC, 39, -1}, + {40, 0, 0, 40, EFFICIENT_CORE_PROC, 40, -1}, {41, 0, 0, 41, EFFICIENT_CORE_PROC, 41, -1}, + {42, 0, 0, 42, EFFICIENT_CORE_PROC, 42, -1}, {43, 0, 0, 43, EFFICIENT_CORE_PROC, 43, -1}, + {44, 0, 0, 44, EFFICIENT_CORE_PROC, 44, -1}, {45, 0, 0, 45, EFFICIENT_CORE_PROC, 45, -1}, + {46, 0, 0, 46, EFFICIENT_CORE_PROC, 46, -1}, {47, 0, 0, 47, EFFICIENT_CORE_PROC, 47, -1}, + {48, 0, 0, 48, EFFICIENT_CORE_PROC, 48, -1}, {49, 0, 0, 49, EFFICIENT_CORE_PROC, 49, -1}, + {50, 0, 0, 50, EFFICIENT_CORE_PROC, 50, -1}, {51, 0, 0, 51, EFFICIENT_CORE_PROC, 51, -1}, + {52, 0, 0, 52, EFFICIENT_CORE_PROC, 52, -1}, {53, 0, 0, 53, EFFICIENT_CORE_PROC, 53, -1}, + {54, 0, 0, 54, EFFICIENT_CORE_PROC, 54, -1}, {55, 0, 0, 55, EFFICIENT_CORE_PROC, 55, -1}, + {56, 0, 0, 56, EFFICIENT_CORE_PROC, 56, -1}, {57, 0, 0, 57, EFFICIENT_CORE_PROC, 57, -1}, + {58, 0, 0, 58, EFFICIENT_CORE_PROC, 58, -1}, {59, 0, 0, 59, EFFICIENT_CORE_PROC, 59, -1}, + {60, 0, 0, 60, EFFICIENT_CORE_PROC, 60, -1}, {61, 0, 0, 61, EFFICIENT_CORE_PROC, 61, -1}, + {62, 0, 0, 62, EFFICIENT_CORE_PROC, 62, -1}, {63, 0, 0, 63, EFFICIENT_CORE_PROC, 63, -1}, + {64, 0, 0, 64, EFFICIENT_CORE_PROC, 64, -1}, {65, 0, 0, 65, EFFICIENT_CORE_PROC, 65, -1}, + {66, 0, 0, 66, EFFICIENT_CORE_PROC, 66, -1}, {67, 0, 0, 67, EFFICIENT_CORE_PROC, 67, -1}, + {68, 0, 0, 68, EFFICIENT_CORE_PROC, 68, -1}, {69, 0, 0, 69, EFFICIENT_CORE_PROC, 69, -1}, + {70, 0, 0, 70, EFFICIENT_CORE_PROC, 70, -1}, {71, 0, 0, 71, EFFICIENT_CORE_PROC, 71, -1}, + {72, 0, 0, 72, EFFICIENT_CORE_PROC, 72, -1}, {73, 0, 0, 73, EFFICIENT_CORE_PROC, 73, -1}, + {74, 0, 0, 74, EFFICIENT_CORE_PROC, 74, -1}, {75, 0, 0, 75, EFFICIENT_CORE_PROC, 75, -1}, + {76, 0, 0, 76, EFFICIENT_CORE_PROC, 76, -1}, {77, 0, 0, 77, EFFICIENT_CORE_PROC, 77, -1}, + {78, 0, 0, 78, EFFICIENT_CORE_PROC, 78, -1}, {79, 0, 0, 79, EFFICIENT_CORE_PROC, 79, -1}, + {80, 0, 0, 80, EFFICIENT_CORE_PROC, 80, -1}, {81, 0, 0, 81, EFFICIENT_CORE_PROC, 81, -1}, + {82, 0, 0, 82, EFFICIENT_CORE_PROC, 82, -1}, {83, 0, 0, 83, EFFICIENT_CORE_PROC, 83, -1}, + {84, 0, 0, 84, EFFICIENT_CORE_PROC, 84, -1}, {85, 0, 0, 85, EFFICIENT_CORE_PROC, 85, -1}, + {86, 0, 0, 86, EFFICIENT_CORE_PROC, 86, -1}, {87, 0, 0, 87, EFFICIENT_CORE_PROC, 87, -1}, + {88, 0, 0, 88, EFFICIENT_CORE_PROC, 88, -1}, {89, 0, 0, 89, EFFICIENT_CORE_PROC, 89, -1}, + {90, 0, 0, 90, EFFICIENT_CORE_PROC, 90, -1}, {91, 0, 0, 91, EFFICIENT_CORE_PROC, 91, -1}, + {92, 0, 0, 92, EFFICIENT_CORE_PROC, 92, -1}, {93, 0, 0, 93, EFFICIENT_CORE_PROC, 93, -1}, + {94, 0, 0, 94, EFFICIENT_CORE_PROC, 94, -1}, {95, 0, 0, 95, EFFICIENT_CORE_PROC, 95, -1}, + }, {{96, 0, 96, 0, 0, 0}}, ov::hint::SchedulingCoreType::ANY_CORE, false, @@ -699,10 +1742,61 @@ StreamGenerateionTestCase generation_latency_1sockets_96cores_unpinning = { ov::hint::SchedulingCoreType::ANY_CORE, false, false, + false, true, true, ov::hint::PerformanceMode::LATENCY, {}, + { + {0, 0, 0, 0, EFFICIENT_CORE_PROC, 0, -1}, {1, 0, 0, 1, EFFICIENT_CORE_PROC, 1, -1}, + {2, 0, 0, 2, EFFICIENT_CORE_PROC, 2, -1}, {3, 0, 0, 3, EFFICIENT_CORE_PROC, 3, -1}, + {4, 0, 0, 4, EFFICIENT_CORE_PROC, 4, -1}, {5, 0, 0, 5, EFFICIENT_CORE_PROC, 5, -1}, + {6, 0, 0, 6, EFFICIENT_CORE_PROC, 6, -1}, {7, 0, 0, 7, EFFICIENT_CORE_PROC, 7, -1}, + {8, 0, 0, 8, EFFICIENT_CORE_PROC, 8, -1}, {9, 0, 0, 9, EFFICIENT_CORE_PROC, 9, -1}, + {10, 0, 0, 10, EFFICIENT_CORE_PROC, 10, -1}, {11, 0, 0, 11, EFFICIENT_CORE_PROC, 11, -1}, + {12, 0, 0, 12, EFFICIENT_CORE_PROC, 12, -1}, {13, 0, 0, 13, EFFICIENT_CORE_PROC, 13, -1}, + {14, 0, 0, 14, EFFICIENT_CORE_PROC, 14, -1}, {15, 0, 0, 15, EFFICIENT_CORE_PROC, 15, -1}, + {16, 0, 0, 16, EFFICIENT_CORE_PROC, 16, -1}, {17, 0, 0, 17, EFFICIENT_CORE_PROC, 17, -1}, + {18, 0, 0, 18, EFFICIENT_CORE_PROC, 18, -1}, {19, 0, 0, 19, EFFICIENT_CORE_PROC, 19, -1}, + {20, 0, 0, 20, EFFICIENT_CORE_PROC, 20, -1}, {21, 0, 0, 21, EFFICIENT_CORE_PROC, 21, -1}, + {22, 0, 0, 22, EFFICIENT_CORE_PROC, 22, -1}, {23, 0, 0, 23, EFFICIENT_CORE_PROC, 23, -1}, + {24, 0, 0, 24, EFFICIENT_CORE_PROC, 24, -1}, {25, 0, 0, 25, EFFICIENT_CORE_PROC, 25, -1}, + {26, 0, 0, 26, EFFICIENT_CORE_PROC, 26, -1}, {27, 0, 0, 27, EFFICIENT_CORE_PROC, 27, -1}, + {28, 0, 0, 28, EFFICIENT_CORE_PROC, 28, -1}, {29, 0, 0, 29, EFFICIENT_CORE_PROC, 29, -1}, + {30, 0, 0, 30, EFFICIENT_CORE_PROC, 30, -1}, {31, 0, 0, 31, EFFICIENT_CORE_PROC, 31, -1}, + {32, 0, 0, 32, EFFICIENT_CORE_PROC, 32, -1}, {33, 0, 0, 33, EFFICIENT_CORE_PROC, 33, -1}, + {34, 0, 0, 34, EFFICIENT_CORE_PROC, 34, -1}, {35, 0, 0, 35, EFFICIENT_CORE_PROC, 35, -1}, + {36, 0, 0, 36, EFFICIENT_CORE_PROC, 36, -1}, {37, 0, 0, 37, EFFICIENT_CORE_PROC, 37, -1}, + {38, 0, 0, 38, EFFICIENT_CORE_PROC, 38, -1}, {39, 0, 0, 39, EFFICIENT_CORE_PROC, 39, -1}, + {40, 0, 0, 40, EFFICIENT_CORE_PROC, 40, -1}, {41, 0, 0, 41, EFFICIENT_CORE_PROC, 41, -1}, + {42, 0, 0, 42, EFFICIENT_CORE_PROC, 42, -1}, {43, 0, 0, 43, EFFICIENT_CORE_PROC, 43, -1}, + {44, 0, 0, 44, EFFICIENT_CORE_PROC, 44, -1}, {45, 0, 0, 45, EFFICIENT_CORE_PROC, 45, -1}, + {46, 0, 0, 46, EFFICIENT_CORE_PROC, 46, -1}, {47, 0, 0, 47, EFFICIENT_CORE_PROC, 47, -1}, + {48, 0, 0, 48, EFFICIENT_CORE_PROC, 48, -1}, {49, 0, 0, 49, EFFICIENT_CORE_PROC, 49, -1}, + {50, 0, 0, 50, EFFICIENT_CORE_PROC, 50, -1}, {51, 0, 0, 51, EFFICIENT_CORE_PROC, 51, -1}, + {52, 0, 0, 52, EFFICIENT_CORE_PROC, 52, -1}, {53, 0, 0, 53, EFFICIENT_CORE_PROC, 53, -1}, + {54, 0, 0, 54, EFFICIENT_CORE_PROC, 54, -1}, {55, 0, 0, 55, EFFICIENT_CORE_PROC, 55, -1}, + {56, 0, 0, 56, EFFICIENT_CORE_PROC, 56, -1}, {57, 0, 0, 57, EFFICIENT_CORE_PROC, 57, -1}, + {58, 0, 0, 58, EFFICIENT_CORE_PROC, 58, -1}, {59, 0, 0, 59, EFFICIENT_CORE_PROC, 59, -1}, + {60, 0, 0, 60, EFFICIENT_CORE_PROC, 60, -1}, {61, 0, 0, 61, EFFICIENT_CORE_PROC, 61, -1}, + {62, 0, 0, 62, EFFICIENT_CORE_PROC, 62, -1}, {63, 0, 0, 63, EFFICIENT_CORE_PROC, 63, -1}, + {64, 0, 0, 64, EFFICIENT_CORE_PROC, 64, -1}, {65, 0, 0, 65, EFFICIENT_CORE_PROC, 65, -1}, + {66, 0, 0, 66, EFFICIENT_CORE_PROC, 66, -1}, {67, 0, 0, 67, EFFICIENT_CORE_PROC, 67, -1}, + {68, 0, 0, 68, EFFICIENT_CORE_PROC, 68, -1}, {69, 0, 0, 69, EFFICIENT_CORE_PROC, 69, -1}, + {70, 0, 0, 70, EFFICIENT_CORE_PROC, 70, -1}, {71, 0, 0, 71, EFFICIENT_CORE_PROC, 71, -1}, + {72, 0, 0, 72, EFFICIENT_CORE_PROC, 72, -1}, {73, 0, 0, 73, EFFICIENT_CORE_PROC, 73, -1}, + {74, 0, 0, 74, EFFICIENT_CORE_PROC, 74, -1}, {75, 0, 0, 75, EFFICIENT_CORE_PROC, 75, -1}, + {76, 0, 0, 76, EFFICIENT_CORE_PROC, 76, -1}, {77, 0, 0, 77, EFFICIENT_CORE_PROC, 77, -1}, + {78, 0, 0, 78, EFFICIENT_CORE_PROC, 78, -1}, {79, 0, 0, 79, EFFICIENT_CORE_PROC, 79, -1}, + {80, 0, 0, 80, EFFICIENT_CORE_PROC, 80, -1}, {81, 0, 0, 81, EFFICIENT_CORE_PROC, 81, -1}, + {82, 0, 0, 82, EFFICIENT_CORE_PROC, 82, -1}, {83, 0, 0, 83, EFFICIENT_CORE_PROC, 83, -1}, + {84, 0, 0, 84, EFFICIENT_CORE_PROC, 84, -1}, {85, 0, 0, 85, EFFICIENT_CORE_PROC, 85, -1}, + {86, 0, 0, 86, EFFICIENT_CORE_PROC, 86, -1}, {87, 0, 0, 87, EFFICIENT_CORE_PROC, 87, -1}, + {88, 0, 0, 88, EFFICIENT_CORE_PROC, 88, -1}, {89, 0, 0, 89, EFFICIENT_CORE_PROC, 89, -1}, + {90, 0, 0, 90, EFFICIENT_CORE_PROC, 90, -1}, {91, 0, 0, 91, EFFICIENT_CORE_PROC, 91, -1}, + {92, 0, 0, 92, EFFICIENT_CORE_PROC, 92, -1}, {93, 0, 0, 93, EFFICIENT_CORE_PROC, 93, -1}, + {94, 0, 0, 94, EFFICIENT_CORE_PROC, 94, -1}, {95, 0, 0, 95, EFFICIENT_CORE_PROC, 95, -1}, + }, {{96, 0, 96, 0, 0, 0}}, ov::hint::SchedulingCoreType::ANY_CORE, false, @@ -723,8 +1817,59 @@ StreamGenerateionTestCase generation_tput_1sockets_96cores_unpinning = { false, false, false, + false, ov::hint::PerformanceMode::THROUGHPUT, {}, + { + {0, 0, 0, 0, EFFICIENT_CORE_PROC, 0, -1}, {1, 0, 0, 1, EFFICIENT_CORE_PROC, 1, -1}, + {2, 0, 0, 2, EFFICIENT_CORE_PROC, 2, -1}, {3, 0, 0, 3, EFFICIENT_CORE_PROC, 3, -1}, + {4, 0, 0, 4, EFFICIENT_CORE_PROC, 4, -1}, {5, 0, 0, 5, EFFICIENT_CORE_PROC, 5, -1}, + {6, 0, 0, 6, EFFICIENT_CORE_PROC, 6, -1}, {7, 0, 0, 7, EFFICIENT_CORE_PROC, 7, -1}, + {8, 0, 0, 8, EFFICIENT_CORE_PROC, 8, -1}, {9, 0, 0, 9, EFFICIENT_CORE_PROC, 9, -1}, + {10, 0, 0, 10, EFFICIENT_CORE_PROC, 10, -1}, {11, 0, 0, 11, EFFICIENT_CORE_PROC, 11, -1}, + {12, 0, 0, 12, EFFICIENT_CORE_PROC, 12, -1}, {13, 0, 0, 13, EFFICIENT_CORE_PROC, 13, -1}, + {14, 0, 0, 14, EFFICIENT_CORE_PROC, 14, -1}, {15, 0, 0, 15, EFFICIENT_CORE_PROC, 15, -1}, + {16, 0, 0, 16, EFFICIENT_CORE_PROC, 16, -1}, {17, 0, 0, 17, EFFICIENT_CORE_PROC, 17, -1}, + {18, 0, 0, 18, EFFICIENT_CORE_PROC, 18, -1}, {19, 0, 0, 19, EFFICIENT_CORE_PROC, 19, -1}, + {20, 0, 0, 20, EFFICIENT_CORE_PROC, 20, -1}, {21, 0, 0, 21, EFFICIENT_CORE_PROC, 21, -1}, + {22, 0, 0, 22, EFFICIENT_CORE_PROC, 22, -1}, {23, 0, 0, 23, EFFICIENT_CORE_PROC, 23, -1}, + {24, 0, 0, 24, EFFICIENT_CORE_PROC, 24, -1}, {25, 0, 0, 25, EFFICIENT_CORE_PROC, 25, -1}, + {26, 0, 0, 26, EFFICIENT_CORE_PROC, 26, -1}, {27, 0, 0, 27, EFFICIENT_CORE_PROC, 27, -1}, + {28, 0, 0, 28, EFFICIENT_CORE_PROC, 28, -1}, {29, 0, 0, 29, EFFICIENT_CORE_PROC, 29, -1}, + {30, 0, 0, 30, EFFICIENT_CORE_PROC, 30, -1}, {31, 0, 0, 31, EFFICIENT_CORE_PROC, 31, -1}, + {32, 0, 0, 32, EFFICIENT_CORE_PROC, 32, -1}, {33, 0, 0, 33, EFFICIENT_CORE_PROC, 33, -1}, + {34, 0, 0, 34, EFFICIENT_CORE_PROC, 34, -1}, {35, 0, 0, 35, EFFICIENT_CORE_PROC, 35, -1}, + {36, 0, 0, 36, EFFICIENT_CORE_PROC, 36, -1}, {37, 0, 0, 37, EFFICIENT_CORE_PROC, 37, -1}, + {38, 0, 0, 38, EFFICIENT_CORE_PROC, 38, -1}, {39, 0, 0, 39, EFFICIENT_CORE_PROC, 39, -1}, + {40, 0, 0, 40, EFFICIENT_CORE_PROC, 40, -1}, {41, 0, 0, 41, EFFICIENT_CORE_PROC, 41, -1}, + {42, 0, 0, 42, EFFICIENT_CORE_PROC, 42, -1}, {43, 0, 0, 43, EFFICIENT_CORE_PROC, 43, -1}, + {44, 0, 0, 44, EFFICIENT_CORE_PROC, 44, -1}, {45, 0, 0, 45, EFFICIENT_CORE_PROC, 45, -1}, + {46, 0, 0, 46, EFFICIENT_CORE_PROC, 46, -1}, {47, 0, 0, 47, EFFICIENT_CORE_PROC, 47, -1}, + {48, 0, 0, 48, EFFICIENT_CORE_PROC, 48, -1}, {49, 0, 0, 49, EFFICIENT_CORE_PROC, 49, -1}, + {50, 0, 0, 50, EFFICIENT_CORE_PROC, 50, -1}, {51, 0, 0, 51, EFFICIENT_CORE_PROC, 51, -1}, + {52, 0, 0, 52, EFFICIENT_CORE_PROC, 52, -1}, {53, 0, 0, 53, EFFICIENT_CORE_PROC, 53, -1}, + {54, 0, 0, 54, EFFICIENT_CORE_PROC, 54, -1}, {55, 0, 0, 55, EFFICIENT_CORE_PROC, 55, -1}, + {56, 0, 0, 56, EFFICIENT_CORE_PROC, 56, -1}, {57, 0, 0, 57, EFFICIENT_CORE_PROC, 57, -1}, + {58, 0, 0, 58, EFFICIENT_CORE_PROC, 58, -1}, {59, 0, 0, 59, EFFICIENT_CORE_PROC, 59, -1}, + {60, 0, 0, 60, EFFICIENT_CORE_PROC, 60, -1}, {61, 0, 0, 61, EFFICIENT_CORE_PROC, 61, -1}, + {62, 0, 0, 62, EFFICIENT_CORE_PROC, 62, -1}, {63, 0, 0, 63, EFFICIENT_CORE_PROC, 63, -1}, + {64, 0, 0, 64, EFFICIENT_CORE_PROC, 64, -1}, {65, 0, 0, 65, EFFICIENT_CORE_PROC, 65, -1}, + {66, 0, 0, 66, EFFICIENT_CORE_PROC, 66, -1}, {67, 0, 0, 67, EFFICIENT_CORE_PROC, 67, -1}, + {68, 0, 0, 68, EFFICIENT_CORE_PROC, 68, -1}, {69, 0, 0, 69, EFFICIENT_CORE_PROC, 69, -1}, + {70, 0, 0, 70, EFFICIENT_CORE_PROC, 70, -1}, {71, 0, 0, 71, EFFICIENT_CORE_PROC, 71, -1}, + {72, 0, 0, 72, EFFICIENT_CORE_PROC, 72, -1}, {73, 0, 0, 73, EFFICIENT_CORE_PROC, 73, -1}, + {74, 0, 0, 74, EFFICIENT_CORE_PROC, 74, -1}, {75, 0, 0, 75, EFFICIENT_CORE_PROC, 75, -1}, + {76, 0, 0, 76, EFFICIENT_CORE_PROC, 76, -1}, {77, 0, 0, 77, EFFICIENT_CORE_PROC, 77, -1}, + {78, 0, 0, 78, EFFICIENT_CORE_PROC, 78, -1}, {79, 0, 0, 79, EFFICIENT_CORE_PROC, 79, -1}, + {80, 0, 0, 80, EFFICIENT_CORE_PROC, 80, -1}, {81, 0, 0, 81, EFFICIENT_CORE_PROC, 81, -1}, + {82, 0, 0, 82, EFFICIENT_CORE_PROC, 82, -1}, {83, 0, 0, 83, EFFICIENT_CORE_PROC, 83, -1}, + {84, 0, 0, 84, EFFICIENT_CORE_PROC, 84, -1}, {85, 0, 0, 85, EFFICIENT_CORE_PROC, 85, -1}, + {86, 0, 0, 86, EFFICIENT_CORE_PROC, 86, -1}, {87, 0, 0, 87, EFFICIENT_CORE_PROC, 87, -1}, + {88, 0, 0, 88, EFFICIENT_CORE_PROC, 88, -1}, {89, 0, 0, 89, EFFICIENT_CORE_PROC, 89, -1}, + {90, 0, 0, 90, EFFICIENT_CORE_PROC, 90, -1}, {91, 0, 0, 91, EFFICIENT_CORE_PROC, 91, -1}, + {92, 0, 0, 92, EFFICIENT_CORE_PROC, 92, -1}, {93, 0, 0, 93, EFFICIENT_CORE_PROC, 93, -1}, + {94, 0, 0, 94, EFFICIENT_CORE_PROC, 94, -1}, {95, 0, 0, 95, EFFICIENT_CORE_PROC, 95, -1}, + }, {{96, 0, 96, 0, 0, 0}}, ov::hint::SchedulingCoreType::ANY_CORE, false, @@ -744,9 +1889,60 @@ StreamGenerateionTestCase generation_tput_1sockets_96cores_2_unpinning = { true, true, false, + false, true, ov::hint::PerformanceMode::THROUGHPUT, {}, + { + {0, 0, 0, 0, EFFICIENT_CORE_PROC, 0, -1}, {1, 0, 0, 1, EFFICIENT_CORE_PROC, 1, -1}, + {2, 0, 0, 2, EFFICIENT_CORE_PROC, 2, -1}, {3, 0, 0, 3, EFFICIENT_CORE_PROC, 3, -1}, + {4, 0, 0, 4, EFFICIENT_CORE_PROC, 4, -1}, {5, 0, 0, 5, EFFICIENT_CORE_PROC, 5, -1}, + {6, 0, 0, 6, EFFICIENT_CORE_PROC, 6, -1}, {7, 0, 0, 7, EFFICIENT_CORE_PROC, 7, -1}, + {8, 0, 0, 8, EFFICIENT_CORE_PROC, 8, -1}, {9, 0, 0, 9, EFFICIENT_CORE_PROC, 9, -1}, + {10, 0, 0, 10, EFFICIENT_CORE_PROC, 10, -1}, {11, 0, 0, 11, EFFICIENT_CORE_PROC, 11, -1}, + {12, 0, 0, 12, EFFICIENT_CORE_PROC, 12, -1}, {13, 0, 0, 13, EFFICIENT_CORE_PROC, 13, -1}, + {14, 0, 0, 14, EFFICIENT_CORE_PROC, 14, -1}, {15, 0, 0, 15, EFFICIENT_CORE_PROC, 15, -1}, + {16, 0, 0, 16, EFFICIENT_CORE_PROC, 16, -1}, {17, 0, 0, 17, EFFICIENT_CORE_PROC, 17, -1}, + {18, 0, 0, 18, EFFICIENT_CORE_PROC, 18, -1}, {19, 0, 0, 19, EFFICIENT_CORE_PROC, 19, -1}, + {20, 0, 0, 20, EFFICIENT_CORE_PROC, 20, -1}, {21, 0, 0, 21, EFFICIENT_CORE_PROC, 21, -1}, + {22, 0, 0, 22, EFFICIENT_CORE_PROC, 22, -1}, {23, 0, 0, 23, EFFICIENT_CORE_PROC, 23, -1}, + {24, 0, 0, 24, EFFICIENT_CORE_PROC, 24, -1}, {25, 0, 0, 25, EFFICIENT_CORE_PROC, 25, -1}, + {26, 0, 0, 26, EFFICIENT_CORE_PROC, 26, -1}, {27, 0, 0, 27, EFFICIENT_CORE_PROC, 27, -1}, + {28, 0, 0, 28, EFFICIENT_CORE_PROC, 28, -1}, {29, 0, 0, 29, EFFICIENT_CORE_PROC, 29, -1}, + {30, 0, 0, 30, EFFICIENT_CORE_PROC, 30, -1}, {31, 0, 0, 31, EFFICIENT_CORE_PROC, 31, -1}, + {32, 0, 0, 32, EFFICIENT_CORE_PROC, 32, -1}, {33, 0, 0, 33, EFFICIENT_CORE_PROC, 33, -1}, + {34, 0, 0, 34, EFFICIENT_CORE_PROC, 34, -1}, {35, 0, 0, 35, EFFICIENT_CORE_PROC, 35, -1}, + {36, 0, 0, 36, EFFICIENT_CORE_PROC, 36, -1}, {37, 0, 0, 37, EFFICIENT_CORE_PROC, 37, -1}, + {38, 0, 0, 38, EFFICIENT_CORE_PROC, 38, -1}, {39, 0, 0, 39, EFFICIENT_CORE_PROC, 39, -1}, + {40, 0, 0, 40, EFFICIENT_CORE_PROC, 40, -1}, {41, 0, 0, 41, EFFICIENT_CORE_PROC, 41, -1}, + {42, 0, 0, 42, EFFICIENT_CORE_PROC, 42, -1}, {43, 0, 0, 43, EFFICIENT_CORE_PROC, 43, -1}, + {44, 0, 0, 44, EFFICIENT_CORE_PROC, 44, -1}, {45, 0, 0, 45, EFFICIENT_CORE_PROC, 45, -1}, + {46, 0, 0, 46, EFFICIENT_CORE_PROC, 46, -1}, {47, 0, 0, 47, EFFICIENT_CORE_PROC, 47, -1}, + {48, 0, 0, 48, EFFICIENT_CORE_PROC, 48, -1}, {49, 0, 0, 49, EFFICIENT_CORE_PROC, 49, -1}, + {50, 0, 0, 50, EFFICIENT_CORE_PROC, 50, -1}, {51, 0, 0, 51, EFFICIENT_CORE_PROC, 51, -1}, + {52, 0, 0, 52, EFFICIENT_CORE_PROC, 52, -1}, {53, 0, 0, 53, EFFICIENT_CORE_PROC, 53, -1}, + {54, 0, 0, 54, EFFICIENT_CORE_PROC, 54, -1}, {55, 0, 0, 55, EFFICIENT_CORE_PROC, 55, -1}, + {56, 0, 0, 56, EFFICIENT_CORE_PROC, 56, -1}, {57, 0, 0, 57, EFFICIENT_CORE_PROC, 57, -1}, + {58, 0, 0, 58, EFFICIENT_CORE_PROC, 58, -1}, {59, 0, 0, 59, EFFICIENT_CORE_PROC, 59, -1}, + {60, 0, 0, 60, EFFICIENT_CORE_PROC, 60, -1}, {61, 0, 0, 61, EFFICIENT_CORE_PROC, 61, -1}, + {62, 0, 0, 62, EFFICIENT_CORE_PROC, 62, -1}, {63, 0, 0, 63, EFFICIENT_CORE_PROC, 63, -1}, + {64, 0, 0, 64, EFFICIENT_CORE_PROC, 64, -1}, {65, 0, 0, 65, EFFICIENT_CORE_PROC, 65, -1}, + {66, 0, 0, 66, EFFICIENT_CORE_PROC, 66, -1}, {67, 0, 0, 67, EFFICIENT_CORE_PROC, 67, -1}, + {68, 0, 0, 68, EFFICIENT_CORE_PROC, 68, -1}, {69, 0, 0, 69, EFFICIENT_CORE_PROC, 69, -1}, + {70, 0, 0, 70, EFFICIENT_CORE_PROC, 70, -1}, {71, 0, 0, 71, EFFICIENT_CORE_PROC, 71, -1}, + {72, 0, 0, 72, EFFICIENT_CORE_PROC, 72, -1}, {73, 0, 0, 73, EFFICIENT_CORE_PROC, 73, -1}, + {74, 0, 0, 74, EFFICIENT_CORE_PROC, 74, -1}, {75, 0, 0, 75, EFFICIENT_CORE_PROC, 75, -1}, + {76, 0, 0, 76, EFFICIENT_CORE_PROC, 76, -1}, {77, 0, 0, 77, EFFICIENT_CORE_PROC, 77, -1}, + {78, 0, 0, 78, EFFICIENT_CORE_PROC, 78, -1}, {79, 0, 0, 79, EFFICIENT_CORE_PROC, 79, -1}, + {80, 0, 0, 80, EFFICIENT_CORE_PROC, 80, -1}, {81, 0, 0, 81, EFFICIENT_CORE_PROC, 81, -1}, + {82, 0, 0, 82, EFFICIENT_CORE_PROC, 82, -1}, {83, 0, 0, 83, EFFICIENT_CORE_PROC, 83, -1}, + {84, 0, 0, 84, EFFICIENT_CORE_PROC, 84, -1}, {85, 0, 0, 85, EFFICIENT_CORE_PROC, 85, -1}, + {86, 0, 0, 86, EFFICIENT_CORE_PROC, 86, -1}, {87, 0, 0, 87, EFFICIENT_CORE_PROC, 87, -1}, + {88, 0, 0, 88, EFFICIENT_CORE_PROC, 88, -1}, {89, 0, 0, 89, EFFICIENT_CORE_PROC, 89, -1}, + {90, 0, 0, 90, EFFICIENT_CORE_PROC, 90, -1}, {91, 0, 0, 91, EFFICIENT_CORE_PROC, 91, -1}, + {92, 0, 0, 92, EFFICIENT_CORE_PROC, 92, -1}, {93, 0, 0, 93, EFFICIENT_CORE_PROC, 93, -1}, + {94, 0, 0, 94, EFFICIENT_CORE_PROC, 94, -1}, {95, 0, 0, 95, EFFICIENT_CORE_PROC, 95, -1}, + }, {{96, 0, 96, 0, 0, 0}}, ov::hint::SchedulingCoreType::ANY_CORE, false, @@ -756,13 +1952,65 @@ StreamGenerateionTestCase generation_tput_1sockets_96cores_2_unpinning = { {{24, EFFICIENT_CORE_PROC, 4, 0, 0}}, }; +StreamGenerateionTestCase generation_tput_1sockets_0cores_1 = { + 1, + false, + 0, + 0, + 0, + 0, + ov::hint::SchedulingCoreType::PCORE_ONLY, + true, + true, + false, + false, + true, + ov::hint::PerformanceMode::LATENCY, + {}, + {}, + {{0, 0, 0, 0, 0, 0}}, + ov::hint::SchedulingCoreType::ANY_CORE, + false, + false, + ov::hint::PerformanceMode::LATENCY, + {{96, 0, 96, 0, 0, 0}}, + {{24, EFFICIENT_CORE_PROC, 4, 0, 0}}, +}; + +StreamGenerateionTestCase generation_tput_1sockets_0cores_1_reservation = { + 1, + false, + 0, + 0, + 0, + 0, + ov::hint::SchedulingCoreType::PCORE_ONLY, + true, + true, + true, + false, + true, + ov::hint::PerformanceMode::LATENCY, + {}, + {}, + {{0, 0, 0, 0, 0, 0}}, + ov::hint::SchedulingCoreType::ANY_CORE, + false, + false, + ov::hint::PerformanceMode::LATENCY, + {{96, 0, 96, 0, 0, 0}}, + {{24, EFFICIENT_CORE_PROC, 4, 0, 0}}, +}; + #if defined(__linux__) || defined(_WIN32) INSTANTIATE_TEST_SUITE_P(smoke_StreamsGeneration, StreamGenerationTests, ::testing::Values(generation_latency_1sockets_14cores_3, + generation_latency_1sockets_14cores_3_reservation, generation_latency_1sockets_14cores_4, generation_latency_1sockets_14cores_5, generation_latency_2sockets_48cores_6, + generation_latency_2sockets_48cores_6_reservation, generation_latency_2sockets_48cores_7, generation_latency_2sockets_48cores_8, generation_latency_2sockets_48cores_9, @@ -778,10 +2026,13 @@ INSTANTIATE_TEST_SUITE_P(smoke_StreamsGeneration, generation_tput_2sockets_48cores_6, generation_tput_2sockets_48cores_7, generation_tput_2sockets_48cores_8, + generation_tput_2sockets_48cores_8_reservation, generation_tput_2sockets_48cores_9, generation_latency_1sockets_96cores_pinning, generation_tput_1sockets_96cores_pinning, - generation_tput_1sockets_96cores_2_pinning)); + generation_tput_1sockets_96cores_2_pinning, + generation_tput_1sockets_0cores_1, + generation_tput_1sockets_0cores_1_reservation)); #else INSTANTIATE_TEST_SUITE_P(smoke_StreamsGeneration, StreamGenerationTests, From 4e9d6a13b62b45e614c0e0e008bc32dd2aea4781 Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Fri, 10 Jan 2025 16:34:16 +0800 Subject: [PATCH 19/30] fix ci issue --- .../tests/unit/executor_config_test.cpp | 36 +------------------ 1 file changed, 1 insertion(+), 35 deletions(-) diff --git a/src/inference/tests/unit/executor_config_test.cpp b/src/inference/tests/unit/executor_config_test.cpp index ea117d8fa0c72a..a07ed4e7506575 100644 --- a/src/inference/tests/unit/executor_config_test.cpp +++ b/src/inference/tests/unit/executor_config_test.cpp @@ -1308,39 +1308,6 @@ ExecutorConfigTestCase _pecore_streams_info_table_1 = { }; ExecutorConfigTestCase _pecore_streams_info_table_2 = { - { - {24, 8, 8, 8, 0, 0}, - }, - { - {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, {1, 0, 0, 0, HYPER_THREADING_PROC, 1, -1}, - {2, 0, 0, 1, MAIN_CORE_PROC, 2, -1}, {3, 0, 0, 1, HYPER_THREADING_PROC, 3, -1}, - {4, 0, 0, 2, MAIN_CORE_PROC, 4, -1}, {5, 0, 0, 2, HYPER_THREADING_PROC, 5, -1}, - {6, 0, 0, 3, MAIN_CORE_PROC, 6, -1}, {7, 0, 0, 3, HYPER_THREADING_PROC, 7, -1}, - {8, 0, 0, 4, MAIN_CORE_PROC, 8, -1}, {9, 0, 0, 4, HYPER_THREADING_PROC, 9, -1}, - {10, 0, 0, 5, MAIN_CORE_PROC, 10, -1}, {11, 0, 0, 5, HYPER_THREADING_PROC, 11, -1}, - {12, 0, 0, 6, MAIN_CORE_PROC, 12, -1}, {13, 0, 0, 6, HYPER_THREADING_PROC, 13, -1}, - {14, 0, 0, 7, MAIN_CORE_PROC, 14, -1}, {15, 0, 0, 7, HYPER_THREADING_PROC, 15, -1}, - {16, 0, 0, 8, EFFICIENT_CORE_PROC, 16, -1}, {17, 0, 0, 9, EFFICIENT_CORE_PROC, 17, -1}, - {18, 0, 0, 10, EFFICIENT_CORE_PROC, 18, -1}, {19, 0, 0, 11, EFFICIENT_CORE_PROC, 19, -1}, - {20, 0, 0, 12, EFFICIENT_CORE_PROC, 20, -1}, {21, 0, 0, 13, EFFICIENT_CORE_PROC, 21, -1}, - {22, 0, 0, 14, EFFICIENT_CORE_PROC, 22, -1}, {23, 0, 0, 15, EFFICIENT_CORE_PROC, 23, -1}, - }, - 1, - 8, - ov::hint::SchedulingCoreType::PCORE_ONLY, - false, - false, - { - {5, MAIN_CORE_PROC, 2, 0, 0}, - {2, EFFICIENT_CORE_PROC, 2, 0, 0}, - }, - { - {1, MAIN_CORE_PROC, 8, 0, 0}, - }, - {}, -}; - -ExecutorConfigTestCase _pecore_streams_info_table_3 = { { {24, 8, 8, 8, 0, 0}, }, @@ -1414,7 +1381,6 @@ INSTANTIATE_TEST_SUITE_P(smoke_ExecutorConfig, _pecore_streams_10_threads_1_binding, _pecore_streams_10_threads_2_reservation, _pecore_streams_info_table_1, - _pecore_streams_info_table_2, - _pecore_streams_info_table_3)); + _pecore_streams_info_table_2)); #endif } // namespace From 2e0295f487cbea653766e63985fab5f28a2adf88 Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Sat, 11 Jan 2025 18:01:04 +0800 Subject: [PATCH 20/30] fix ci test issue --- .../intel_cpu/tests/unit/streams_info/streams_e2e_test.cpp | 3 +++ 1 file changed, 3 insertions(+) diff --git a/src/plugins/intel_cpu/tests/unit/streams_info/streams_e2e_test.cpp b/src/plugins/intel_cpu/tests/unit/streams_info/streams_e2e_test.cpp index 6e223f28541a77..26b421a537afae 100644 --- a/src/plugins/intel_cpu/tests/unit/streams_info/streams_e2e_test.cpp +++ b/src/plugins/intel_cpu/tests/unit/streams_info/streams_e2e_test.cpp @@ -68,6 +68,9 @@ class StreamGenerationTests : public ov::test::TestsCommon, CPU& cpu = cpu_info(); cpu._cpu_mapping_table = test_data.cpu_mapping_table; cpu._proc_type_table = test_data.input_proc_type_table; + cpu._org_proc_type_table = test_data.input_proc_type_table; + cpu._numa_nodes = cpu._proc_type_table.size() > 1 ? static_cast(cpu._proc_type_table.size()) - 1 : 1; + cpu._sockets = cpu._numa_nodes; std::vector> res_proc_type_table = test_data.input_proc_type_table; if (cpu._cpu_mapping_table.empty()) { From 76bb972e2786248fbc1eb227b433c1fbb9c849fc Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Mon, 13 Jan 2025 11:22:43 +0800 Subject: [PATCH 21/30] add test case of reservation --- .../ov_executable_network/properties.cpp | 16 ++++++++++++++++ .../behavior/ov_plugin/properties_tests.cpp | 1 + 2 files changed, 17 insertions(+) diff --git a/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_executable_network/properties.cpp b/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_executable_network/properties.cpp index b2e7db2a74d9d7..15e5e9ced7d4e3 100644 --- a/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_executable_network/properties.cpp +++ b/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_executable_network/properties.cpp @@ -155,6 +155,22 @@ TEST_F(OVClassConfigTestCPU, smoke_CpuExecNetworkCheckModelZeroStreams) { ASSERT_EQ(streams, value); } +TEST_F(OVClassConfigTestCPU, smoke_CpuExecNetworkCheckCpuReservation) { + ov::Core core; + bool reservation = false; + int32_t threads = 0, input_threads = 2; + + OV_ASSERT_NO_THROW(core.set_property(deviceName, ov::hint::performance_mode(ov::hint::PerformanceMode::LATENCY))); + + ov::AnyMap config = {{ov::hint::enable_cpu_reservation.name(), true}, {ov::inference_num_threads.name(), input_threads}}; + ov::CompiledModel compiledModel = core.compile_model(model, deviceName, config); + + OV_ASSERT_NO_THROW(reservation = compiledModel.get_property(ov::hint::enable_cpu_reservation)); + OV_ASSERT_NO_THROW(threads = compiledModel.get_property(ov::inference_num_threads)); + ASSERT_EQ(reservation, true); + ASSERT_EQ(threads, input_threads); +} + TEST_F(OVClassConfigTestCPU, smoke_CpuExecNetworkCheckSparseWeigthsDecompressionRate) { ov::Core core; diff --git a/src/plugins/intel_cpu/tests/functional/shared_tests_instances/behavior/ov_plugin/properties_tests.cpp b/src/plugins/intel_cpu/tests/functional/shared_tests_instances/behavior/ov_plugin/properties_tests.cpp index 7dcc98a2c63446..4de615d617e933 100644 --- a/src/plugins/intel_cpu/tests/functional/shared_tests_instances/behavior/ov_plugin/properties_tests.cpp +++ b/src/plugins/intel_cpu/tests/functional/shared_tests_instances/behavior/ov_plugin/properties_tests.cpp @@ -30,6 +30,7 @@ auto cpu_properties = []() -> std::vector { // check that hints doesn't override customer value (now for streams and later for other config opts) {{ov::hint::performance_mode(ov::hint::PerformanceMode::THROUGHPUT)}, {ov::hint::num_requests(3)}}, {{ov::hint::performance_mode(ov::hint::PerformanceMode::LATENCY)}, {ov::hint::num_requests(3)}}, + {{ov::hint::enable_cpu_reservation(true)}, {ov::num_streams(1)}, {ov::inference_num_threads(2)}}, }; auto numa_nodes = ov::get_available_numa_nodes(); From a0c87933fbff828c7c1b7c3f3627ce6dd3df624b Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Mon, 13 Jan 2025 17:45:46 +0800 Subject: [PATCH 22/30] add parallel running multiple compiled model test case --- .../behavior/ov_plugin/core_threading.hpp | 22 +++++++++++++++++++ 1 file changed, 22 insertions(+) diff --git a/src/tests/functional/plugin/shared/include/behavior/ov_plugin/core_threading.hpp b/src/tests/functional/plugin/shared/include/behavior/ov_plugin/core_threading.hpp index d39dad1779191a..ddddf6c7c475b5 100644 --- a/src/tests/functional/plugin/shared/include/behavior/ov_plugin/core_threading.hpp +++ b/src/tests/functional/plugin/shared/include/behavior/ov_plugin/core_threading.hpp @@ -613,3 +613,25 @@ TEST_P(CoreThreadingTestsWithIter, nightly_AsyncInfer_ShareInput) { numIterations, numThreads); } + +TEST_P(CoreThreadingTestsWithIter, smoke_CompileModel_MutipleModel_Reservation) { + auto core = ov::test::utils::create_core(); + std::atomic counter{0u}; + SetupNetworks(); + core.set_property(target_device, config); + ov::AnyMap property_config_reserve = {{ov::num_streams.name(), 1}, + {ov::inference_num_threads.name(), 1}, + {ov::hint::enable_cpu_reservation.name(), true}}; + ov::AnyMap property_config = {{ov::num_streams.name(), 1}, {ov::inference_num_threads.name(), 1}}; + + runParallel( + [&]() { + auto value = counter++; + std::cout << "value: " << value << "\n"; + (void)core.compile_model(models[value % models.size()], + target_device, + value == 1 ? property_config : property_config_reserve); + }, + 1, + 3); +} From 9a36e8de9c93a1b24cb66b9d0f8cb6951a5adf91 Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Mon, 13 Jan 2025 20:11:40 +0800 Subject: [PATCH 23/30] rm invalid log --- .../shared/include/behavior/ov_plugin/core_threading.hpp | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/src/tests/functional/plugin/shared/include/behavior/ov_plugin/core_threading.hpp b/src/tests/functional/plugin/shared/include/behavior/ov_plugin/core_threading.hpp index ddddf6c7c475b5..3f15cd8cfd85c0 100644 --- a/src/tests/functional/plugin/shared/include/behavior/ov_plugin/core_threading.hpp +++ b/src/tests/functional/plugin/shared/include/behavior/ov_plugin/core_threading.hpp @@ -627,11 +627,10 @@ TEST_P(CoreThreadingTestsWithIter, smoke_CompileModel_MutipleModel_Reservation) runParallel( [&]() { auto value = counter++; - std::cout << "value: " << value << "\n"; (void)core.compile_model(models[value % models.size()], target_device, value == 1 ? property_config : property_config_reserve); }, 1, - 3); + 2); } From ab7484d6cca6dd3cb1ce81adc1bf93abdbbe86fb Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Tue, 14 Jan 2025 11:28:26 +0800 Subject: [PATCH 24/30] add test case --- .../streams_info/cpu_reservation_test.cpp | 50 +++++++++++++++++++ .../unit/streams_info/streams_e2e_test.cpp | 41 +++++++++++++++ .../behavior/ov_plugin/core_threading.hpp | 21 -------- 3 files changed, 91 insertions(+), 21 deletions(-) create mode 100644 src/plugins/intel_cpu/tests/unit/streams_info/cpu_reservation_test.cpp diff --git a/src/plugins/intel_cpu/tests/unit/streams_info/cpu_reservation_test.cpp b/src/plugins/intel_cpu/tests/unit/streams_info/cpu_reservation_test.cpp new file mode 100644 index 00000000000000..a8823bc8a6dab0 --- /dev/null +++ b/src/plugins/intel_cpu/tests/unit/streams_info/cpu_reservation_test.cpp @@ -0,0 +1,50 @@ + +// Copyright (C) 2018-2024 Intel Corporation +// SPDX-License-Identifier: Apache-2.0 +// + +#include +#include +#include + +#include "common_test_utils/subgraph_builders/2_input_subtract.hpp" +#include "common_test_utils/subgraph_builders/multi_single_conv.hpp" +#include "openvino/runtime/properties.hpp" +// #include "openvino/util/file_util.hpp" +#include "openvino/openvino.hpp" + +using Device = std::string; +using Config = ov::AnyMap; +using CpuReservationTest = ::testing::Test; + +TEST_F(CpuReservationTest, Mutiple_CompiledModel_Reservation) { + std::vector> models; + Config config = {ov::enable_profiling(true)}; + Device target_device("CPU"); + std::atomic counter{0u}; + + models.emplace_back(ov::test::utils::make_2_input_subtract()); + models.emplace_back(ov::test::utils::make_multi_single_conv()); + + ov::Core core; + core.set_property(target_device, config); + ov::AnyMap property_config_reserve = {{ov::num_streams.name(), 1}, + {ov::inference_num_threads.name(), 1}, + {ov::hint::enable_cpu_reservation.name(), true}}; + ov::AnyMap property_config = {{ov::num_streams.name(), 1}, {ov::inference_num_threads.name(), 1}}; + + std::vector threads(2); + for (auto& thread : threads) { + thread = std::thread([&]() { + auto value = counter++; + (void)core.compile_model(models[value % models.size()], + target_device, + value == 1 ? property_config : property_config_reserve); + }); + } + + for (auto& thread : threads) { + if (thread.joinable()) + thread.join(); + } +} \ No newline at end of file diff --git a/src/plugins/intel_cpu/tests/unit/streams_info/streams_e2e_test.cpp b/src/plugins/intel_cpu/tests/unit/streams_info/streams_e2e_test.cpp index 26b421a537afae..dd19a28d74c712 100644 --- a/src/plugins/intel_cpu/tests/unit/streams_info/streams_e2e_test.cpp +++ b/src/plugins/intel_cpu/tests/unit/streams_info/streams_e2e_test.cpp @@ -444,6 +444,46 @@ StreamGenerateionTestCase generation_latency_1sockets_14cores_3_reservation = { {{1, MAIN_CORE_PROC, 6, 0, 0}}, }; +StreamGenerateionTestCase generation_latency_1sockets_14cores_4_reservation = { + 1, + false, + 0, + 0, + 0, + 0, + ov::hint::SchedulingCoreType::PCORE_ONLY, + true, + true, + true, + false, + false, + ov::hint::PerformanceMode::LATENCY, + {}, + { + {0, 0, 0, 0, MAIN_CORE_PROC, 0, -1}, + {1, 0, 0, 1, MAIN_CORE_PROC, 1, -1}, + {2, 0, 0, 2, MAIN_CORE_PROC, 2, -1}, + {3, 0, 0, 3, MAIN_CORE_PROC, 3, -1}, + {4, 0, 0, 4, MAIN_CORE_PROC, 4, -1}, + {5, 0, 0, 5, MAIN_CORE_PROC, 5, -1}, + {6, 0, 0, 6, EFFICIENT_CORE_PROC, 6, -1}, + {7, 0, 0, 7, EFFICIENT_CORE_PROC, 7, -1}, + {8, 0, 0, 8, EFFICIENT_CORE_PROC, 8, -1}, + {9, 0, 0, 9, EFFICIENT_CORE_PROC, 9, -1}, + {10, 0, 0, 10, EFFICIENT_CORE_PROC, 10, -1}, + {11, 0, 0, 11, EFFICIENT_CORE_PROC, 11, -1}, + {12, 0, 0, 12, EFFICIENT_CORE_PROC, 12, -1}, + {13, 0, 0, 13, EFFICIENT_CORE_PROC, 13, -1}, + }, + {{14, 6, 8, 0, 0, 0}}, + ov::hint::SchedulingCoreType::PCORE_ONLY, + false, + true, + ov::hint::PerformanceMode::LATENCY, + {{6, 6, 0, 0, 0, 0}}, + {{1, MAIN_CORE_PROC, 6, 0, 0}}, +}; + StreamGenerateionTestCase generation_latency_1sockets_14cores_4 = { 1, false, @@ -2010,6 +2050,7 @@ INSTANTIATE_TEST_SUITE_P(smoke_StreamsGeneration, StreamGenerationTests, ::testing::Values(generation_latency_1sockets_14cores_3, generation_latency_1sockets_14cores_3_reservation, + generation_latency_1sockets_14cores_4_reservation, generation_latency_1sockets_14cores_4, generation_latency_1sockets_14cores_5, generation_latency_2sockets_48cores_6, diff --git a/src/tests/functional/plugin/shared/include/behavior/ov_plugin/core_threading.hpp b/src/tests/functional/plugin/shared/include/behavior/ov_plugin/core_threading.hpp index 3f15cd8cfd85c0..d39dad1779191a 100644 --- a/src/tests/functional/plugin/shared/include/behavior/ov_plugin/core_threading.hpp +++ b/src/tests/functional/plugin/shared/include/behavior/ov_plugin/core_threading.hpp @@ -613,24 +613,3 @@ TEST_P(CoreThreadingTestsWithIter, nightly_AsyncInfer_ShareInput) { numIterations, numThreads); } - -TEST_P(CoreThreadingTestsWithIter, smoke_CompileModel_MutipleModel_Reservation) { - auto core = ov::test::utils::create_core(); - std::atomic counter{0u}; - SetupNetworks(); - core.set_property(target_device, config); - ov::AnyMap property_config_reserve = {{ov::num_streams.name(), 1}, - {ov::inference_num_threads.name(), 1}, - {ov::hint::enable_cpu_reservation.name(), true}}; - ov::AnyMap property_config = {{ov::num_streams.name(), 1}, {ov::inference_num_threads.name(), 1}}; - - runParallel( - [&]() { - auto value = counter++; - (void)core.compile_model(models[value % models.size()], - target_device, - value == 1 ? property_config : property_config_reserve); - }, - 1, - 2); -} From f46103cf1c9870c4dca8690dc17eb30d00e804cc Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Tue, 14 Jan 2025 13:16:57 +0800 Subject: [PATCH 25/30] fix ci test issue --- .../compiled_model}/cpu_reservation_test.cpp | 18 ++++--- .../concurrency/gpu_reservation_test.cpp | 51 +++++++++++++++++++ 2 files changed, 61 insertions(+), 8 deletions(-) rename src/plugins/intel_cpu/tests/{unit/streams_info => functional/shared_tests_instances/behavior/compiled_model}/cpu_reservation_test.cpp (80%) create mode 100644 src/plugins/intel_gpu/tests/functional/concurrency/gpu_reservation_test.cpp diff --git a/src/plugins/intel_cpu/tests/unit/streams_info/cpu_reservation_test.cpp b/src/plugins/intel_cpu/tests/functional/shared_tests_instances/behavior/compiled_model/cpu_reservation_test.cpp similarity index 80% rename from src/plugins/intel_cpu/tests/unit/streams_info/cpu_reservation_test.cpp rename to src/plugins/intel_cpu/tests/functional/shared_tests_instances/behavior/compiled_model/cpu_reservation_test.cpp index a8823bc8a6dab0..c8f95c34f2a2d1 100644 --- a/src/plugins/intel_cpu/tests/unit/streams_info/cpu_reservation_test.cpp +++ b/src/plugins/intel_cpu/tests/functional/shared_tests_instances/behavior/compiled_model/cpu_reservation_test.cpp @@ -1,17 +1,19 @@ - // Copyright (C) 2018-2024 Intel Corporation // SPDX-License-Identifier: Apache-2.0 // #include -#include + #include +#include +#include "common_test_utils/test_constants.hpp" #include "common_test_utils/subgraph_builders/2_input_subtract.hpp" #include "common_test_utils/subgraph_builders/multi_single_conv.hpp" -#include "openvino/runtime/properties.hpp" -// #include "openvino/util/file_util.hpp" #include "openvino/openvino.hpp" +#include "common_test_utils/ov_plugin_cache.hpp" +#include "openvino/runtime/properties.hpp" +#include "openvino/util/file_util.hpp" using Device = std::string; using Config = ov::AnyMap; @@ -20,14 +22,14 @@ using CpuReservationTest = ::testing::Test; TEST_F(CpuReservationTest, Mutiple_CompiledModel_Reservation) { std::vector> models; Config config = {ov::enable_profiling(true)}; - Device target_device("CPU"); + Device target_device(ov::test::utils::DEVICE_CPU); std::atomic counter{0u}; models.emplace_back(ov::test::utils::make_2_input_subtract()); models.emplace_back(ov::test::utils::make_multi_single_conv()); - ov::Core core; - core.set_property(target_device, config); + std::shared_ptr core = ov::test::utils::PluginCache::get().core(); + core->set_property(target_device, config); ov::AnyMap property_config_reserve = {{ov::num_streams.name(), 1}, {ov::inference_num_threads.name(), 1}, {ov::hint::enable_cpu_reservation.name(), true}}; @@ -37,7 +39,7 @@ TEST_F(CpuReservationTest, Mutiple_CompiledModel_Reservation) { for (auto& thread : threads) { thread = std::thread([&]() { auto value = counter++; - (void)core.compile_model(models[value % models.size()], + (void)core->compile_model(models[value % models.size()], target_device, value == 1 ? property_config : property_config_reserve); }); diff --git a/src/plugins/intel_gpu/tests/functional/concurrency/gpu_reservation_test.cpp b/src/plugins/intel_gpu/tests/functional/concurrency/gpu_reservation_test.cpp new file mode 100644 index 00000000000000..35cb94cf647dc9 --- /dev/null +++ b/src/plugins/intel_gpu/tests/functional/concurrency/gpu_reservation_test.cpp @@ -0,0 +1,51 @@ +// Copyright (C) 2018-2024 Intel Corporation +// SPDX-License-Identifier: Apache-2.0 +// + +#include + +#include +#include + +#include "common_test_utils/file_utils.hpp" +#include "common_test_utils/subgraph_builders/2_input_subtract.hpp" +#include "common_test_utils/subgraph_builders/multi_single_conv.hpp" +#include "common_test_utils/ov_plugin_cache.hpp" +#include "openvino/openvino.hpp" +#include "openvino/runtime/intel_gpu/properties.hpp" + +using Device = std::string; +using Config = ov::AnyMap; +using GpuReservationTest = ::testing::Test; + +TEST_F(GpuReservationTest, Mutiple_CompiledModel_Reservation) { + std::vector> models; + Config config = {ov::enable_profiling(true)}; + std::vector target_devices = {ov::test::utils::DEVICE_CPU, ov::test::utils::DEVICE_GPU}; + std::atomic counter{0u}; + + models.emplace_back(ov::test::utils::make_2_input_subtract()); + models.emplace_back(ov::test::utils::make_multi_single_conv()); + + auto core = ov::test::utils::PluginCache::get().core(); + core->set_property(target_devices[1], config); + + ov::AnyMap property_config = {{ov::num_streams.name(), 1}, + {ov::inference_num_threads.name(), 1}, + {ov::hint::enable_cpu_reservation.name(), true}}; + + std::vector threads(2); + for (auto& thread : threads) { + thread = std::thread([&]() { + auto value = counter++; + (void)core->compile_model(models[value % models.size()], + target_devices[value % target_devices.size()], + property_config); + }); + } + + for (auto& thread : threads) { + if (thread.joinable()) + thread.join(); + } +} \ No newline at end of file From 85b03f611b78df2217a893ea73a4b048cb0dff53 Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Wed, 15 Jan 2025 21:34:55 +0800 Subject: [PATCH 26/30] change test case --- .../threading/cpu_streams_executor.hpp | 2 ++ .../runtime/threading/istreams_executor.hpp | 5 +++ .../dev/threading/cpu_streams_executor.cpp | 25 ++++++++----- .../src/dev/threading/istreams_executor.cpp | 8 +++-- src/plugins/intel_cpu/src/compiled_model.h | 2 ++ .../intel_cpu/src/cpu_streams_calculation.cpp | 10 +++++- .../compiled_model/cpu_reservation_test.cpp | 36 ++++++++++++++++++- src/plugins/intel_gpu/src/graph/program.cpp | 3 +- .../concurrency/gpu_reservation_test.cpp | 6 ++-- 9 files changed, 81 insertions(+), 16 deletions(-) diff --git a/src/inference/dev_api/openvino/runtime/threading/cpu_streams_executor.hpp b/src/inference/dev_api/openvino/runtime/threading/cpu_streams_executor.hpp index 26b0592c94ce10..2ee4aa6fe05871 100644 --- a/src/inference/dev_api/openvino/runtime/threading/cpu_streams_executor.hpp +++ b/src/inference/dev_api/openvino/runtime/threading/cpu_streams_executor.hpp @@ -57,6 +57,8 @@ class OPENVINO_RUNTIME_API CPUStreamsExecutor : public IStreamsExecutor { std::vector get_rank() override; + void cpu_reset() override; + private: struct Impl; std::unique_ptr _impl; diff --git a/src/inference/dev_api/openvino/runtime/threading/istreams_executor.hpp b/src/inference/dev_api/openvino/runtime/threading/istreams_executor.hpp index 13d35cce568fdf..b66cc3537614ed 100644 --- a/src/inference/dev_api/openvino/runtime/threading/istreams_executor.hpp +++ b/src/inference/dev_api/openvino/runtime/threading/istreams_executor.hpp @@ -269,6 +269,11 @@ class OPENVINO_RUNTIME_API IStreamsExecutor : virtual public ITaskExecutor { */ virtual std::vector get_rank() = 0; + /** + * @brief Reset cpu map table when user set enable_cpu_reservation = true + */ + virtual void cpu_reset() = 0; + /** * @brief Execute the task in the current thread using streams executor configuration and constraints * @param task A task to start diff --git a/src/inference/src/dev/threading/cpu_streams_executor.cpp b/src/inference/src/dev/threading/cpu_streams_executor.cpp index b51289dabc2735..9f8362d4dbb39c 100644 --- a/src/inference/src/dev/threading/cpu_streams_executor.cpp +++ b/src/inference/src/dev/threading/cpu_streams_executor.cpp @@ -92,14 +92,6 @@ struct CPUStreamsExecutor::Impl { _impl->_streamIdQueue.push(_streamId); } #if OV_THREAD == OV_THREAD_TBB || OV_THREAD == OV_THREAD_TBB_AUTO - if (_impl->_config.get_name().find("StreamsExecutor") == std::string::npos) { - try { - set_cpu_used(_cpu_ids, NOT_USED); - } catch (const ov::Exception&) { - // Destructor should not throw - catch needed for static analysis. - // CPU::CPU() won't throw here as cpu_info() is called from Stream constructor. - } - } if (nullptr != _observer) { _observer->observe(false); } @@ -153,6 +145,10 @@ struct CPUStreamsExecutor::Impl { _cpu_ids = stream_id < static_cast(stream_processors.size()) ? stream_processors[stream_id] : _cpu_ids; if (_cpu_ids.size() > 0) { + if (_impl->_config.get_cpu_reservation()) { + std::lock_guard lock(_impl->_cpu_ids_mutex); + _impl->_cpu_ids_all.insert(_impl->_cpu_ids_all.end(), _cpu_ids.begin(), _cpu_ids.end()); + } CpuSet processMask; int ncpus = 0; std::tie(processMask, ncpus) = get_process_mask(); @@ -457,6 +453,8 @@ struct CPUStreamsExecutor::Impl { CustomThreadLocal _streams; std::shared_ptr _exectorMgr; bool _isExit = false; + std::vector _cpu_ids_all; + std::mutex _cpu_ids_mutex; }; int CPUStreamsExecutor::get_stream_id() { @@ -492,9 +490,20 @@ std::vector CPUStreamsExecutor::get_rank() { return stream->_rank; } +void CPUStreamsExecutor::cpu_reset() { + if (!_impl->_cpu_ids_all.empty()) { + set_cpu_used(_impl->_cpu_ids_all, NOT_USED); + { + std::lock_guard lock(_impl->_cpu_ids_mutex); + _impl->_cpu_ids_all.clear(); + } + } +} + CPUStreamsExecutor::CPUStreamsExecutor(const IStreamsExecutor::Config& config) : _impl{new Impl{config}} {} CPUStreamsExecutor::~CPUStreamsExecutor() { + cpu_reset(); { std::lock_guard lock(_impl->_mutex); _impl->_isStopped = true; diff --git a/src/inference/src/dev/threading/istreams_executor.cpp b/src/inference/src/dev/threading/istreams_executor.cpp index bfbb49a256d8dc..d9b66cdbd0a22e 100644 --- a/src/inference/src/dev/threading/istreams_executor.cpp +++ b/src/inference/src/dev/threading/istreams_executor.cpp @@ -159,8 +159,12 @@ void IStreamsExecutor::Config::update_executor_config() { const auto proc_type_table = get_proc_type_table(); bool streams_info_available = false; - if (_cpu_reservation && (proc_type_table.empty() || proc_type_table[0][ALL_PROC] == 0)) { - OPENVINO_THROW("proc_type_table is empty. No CPU resources available!"); + if (proc_type_table.empty() || proc_type_table[0][ALL_PROC] == 0) { + if (_cpu_reservation) { + OPENVINO_THROW("[ Config ] proc_type_table is empty. No CPU resources available!"); + } else { + return; + } } if (!_streams_info_table.empty()) { diff --git a/src/plugins/intel_cpu/src/compiled_model.h b/src/plugins/intel_cpu/src/compiled_model.h index ee55002dbb3eb9..68e82bee77ae38 100644 --- a/src/plugins/intel_cpu/src/compiled_model.h +++ b/src/plugins/intel_cpu/src/compiled_model.h @@ -43,6 +43,8 @@ class CompiledModel : public ov::ICompiledModel { m_sub_compiled_models.clear(); m_sub_memory_manager->_memorys_table.clear(); } + auto streamsExecutor = std::dynamic_pointer_cast(m_task_executor); + streamsExecutor->cpu_reset(); } std::shared_ptr create_infer_request() const override; diff --git a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp index 362733b30a40d6..c75c60206b4d55 100644 --- a/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp +++ b/src/plugins/intel_cpu/src/cpu_streams_calculation.cpp @@ -695,6 +695,9 @@ std::vector> generate_stream_info(const int streams, Config& config, std::vector>& proc_type_table, int preferred_nthreads_per_stream) { + if (proc_type_table.empty() || proc_type_table[0][ALL_PROC] == 0) { + OPENVINO_THROW("proc_type_table is empty. No CPU resources available!"); + } int model_prefer_threads = preferred_nthreads_per_stream; proc_type_table = apply_scheduling_core_type(config.schedulingCoreType, proc_type_table); @@ -710,7 +713,9 @@ std::vector> generate_stream_info(const int streams, const auto cur_numa_node_id = input_numa_node_id < 0 ? get_current_numa_node_id() : input_numa_node_id; sort_table_by_numa_node_id(cur_numa_node_id, proc_type_table); } - + if (proc_type_table.empty() || proc_type_table[0][ALL_PROC] == 0) { + OPENVINO_THROW("proc_type_table is empty. No valid CPU resources available!"); + } auto streams_info_table = get_streams_info_table(config.streams, config.streamsChanged, config.threads, @@ -719,6 +724,9 @@ std::vector> generate_stream_info(const int streams, ov::util::to_string(config.hintPerfMode), config.modelDistributionPolicy, proc_type_table); + if (streams_info_table.empty()) { + OPENVINO_THROW("streams_info_table is empty!"); + } if (config.modelDistributionPolicy.find(ov::hint::ModelDistributionPolicy::TENSOR_PARALLEL) != config.modelDistributionPolicy.end()) { config.streamsRankTable = diff --git a/src/plugins/intel_cpu/tests/functional/shared_tests_instances/behavior/compiled_model/cpu_reservation_test.cpp b/src/plugins/intel_cpu/tests/functional/shared_tests_instances/behavior/compiled_model/cpu_reservation_test.cpp index c8f95c34f2a2d1..81212434393903 100644 --- a/src/plugins/intel_cpu/tests/functional/shared_tests_instances/behavior/compiled_model/cpu_reservation_test.cpp +++ b/src/plugins/intel_cpu/tests/functional/shared_tests_instances/behavior/compiled_model/cpu_reservation_test.cpp @@ -15,6 +15,7 @@ #include "openvino/runtime/properties.hpp" #include "openvino/util/file_util.hpp" +using namespace testing; using Device = std::string; using Config = ov::AnyMap; using CpuReservationTest = ::testing::Test; @@ -49,4 +50,37 @@ TEST_F(CpuReservationTest, Mutiple_CompiledModel_Reservation) { if (thread.joinable()) thread.join(); } -} \ No newline at end of file +} + +TEST_F(CpuReservationTest, Cpu_Reservation_NoAvailableCores) { + std::vector> models; + Config config = {ov::enable_profiling(true)}; + Device target_device(ov::test::utils::DEVICE_CPU); + models.emplace_back(ov::test::utils::make_2_input_subtract()); + + std::shared_ptr core = ov::test::utils::PluginCache::get().core(); + core->set_property(target_device, config); + ov::AnyMap property_config = {{ov::num_streams.name(), 1}, + {ov::inference_num_threads.name(), 2000}, + {ov::hint::enable_hyper_threading.name(), true}, + {ov::hint::enable_cpu_reservation.name(), true}}; + auto compiled_model = core->compile_model(models[0], target_device, property_config); + EXPECT_THROW(core->compile_model(models[0], target_device, property_config), ov::Exception); +} + +#if defined(__linux__) +TEST_F(CpuReservationTest, Cpu_Reservation_CpuPinning) { + std::vector> models; + Config config = {ov::enable_profiling(true)}; + Device target_device(ov::test::utils::DEVICE_CPU); + models.emplace_back(ov::test::utils::make_2_input_subtract()); + + std::shared_ptr core = ov::test::utils::PluginCache::get().core(); + core->set_property(target_device, config); + ov::AnyMap property_config = {{ov::inference_num_threads.name(), 1}, + {ov::hint::enable_cpu_reservation.name(), true}}; + auto compiled_model = core->compile_model(models[0], target_device, property_config); + auto cpu_pinning = compiled_model.get_property(ov::hint::enable_cpu_pinning.name()); + ASSERT_EQ(cpu_pinning, true); +} +#endif diff --git a/src/plugins/intel_gpu/src/graph/program.cpp b/src/plugins/intel_gpu/src/graph/program.cpp index ce2eda97e4ce5a..5072740240e2a5 100644 --- a/src/plugins/intel_gpu/src/graph/program.cpp +++ b/src/plugins/intel_gpu/src/graph/program.cpp @@ -117,13 +117,12 @@ static ov::threading::IStreamsExecutor::Config make_task_executor_config(const E default: OPENVINO_ASSERT(false, "[GPU] Can't create task executor: invalid host task priority value: ", priority); } bool enable_cpu_pinning = config.get_property(ov::hint::enable_cpu_pinning); - bool enable_cpu_reservation = config.get_property(ov::hint::enable_cpu_reservation); ov::threading::IStreamsExecutor::Config task_executor_config(tags, streams, 1, core_type, - enable_cpu_reservation, + false, enable_cpu_pinning); return task_executor_config; diff --git a/src/plugins/intel_gpu/tests/functional/concurrency/gpu_reservation_test.cpp b/src/plugins/intel_gpu/tests/functional/concurrency/gpu_reservation_test.cpp index 35cb94cf647dc9..9b389f3ccb785d 100644 --- a/src/plugins/intel_gpu/tests/functional/concurrency/gpu_reservation_test.cpp +++ b/src/plugins/intel_gpu/tests/functional/concurrency/gpu_reservation_test.cpp @@ -33,14 +33,16 @@ TEST_F(GpuReservationTest, Mutiple_CompiledModel_Reservation) { ov::AnyMap property_config = {{ov::num_streams.name(), 1}, {ov::inference_num_threads.name(), 1}, {ov::hint::enable_cpu_reservation.name(), true}}; + ov::AnyMap property_config_gpu = {{ov::num_streams.name(), ov::streams::Num(1)}, + {ov::hint::enable_cpu_reservation.name(), true}}; std::vector threads(2); for (auto& thread : threads) { thread = std::thread([&]() { auto value = counter++; (void)core->compile_model(models[value % models.size()], - target_devices[value % target_devices.size()], - property_config); + target_devices[value % target_devices.size()], + value == 0 ? property_config : property_config_gpu); }); } From bb622bb2723cb7e3cda9145802a244c98be87c1f Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Thu, 16 Jan 2025 16:00:00 +0800 Subject: [PATCH 27/30] change test case --- .../compiled_model/cpu_reservation_test.cpp | 14 +++++++++----- .../concurrency/gpu_reservation_test.cpp | 10 +++++++--- 2 files changed, 16 insertions(+), 8 deletions(-) diff --git a/src/plugins/intel_cpu/tests/functional/shared_tests_instances/behavior/compiled_model/cpu_reservation_test.cpp b/src/plugins/intel_cpu/tests/functional/shared_tests_instances/behavior/compiled_model/cpu_reservation_test.cpp index 81212434393903..78ee401d169cbb 100644 --- a/src/plugins/intel_cpu/tests/functional/shared_tests_instances/behavior/compiled_model/cpu_reservation_test.cpp +++ b/src/plugins/intel_cpu/tests/functional/shared_tests_instances/behavior/compiled_model/cpu_reservation_test.cpp @@ -31,18 +31,22 @@ TEST_F(CpuReservationTest, Mutiple_CompiledModel_Reservation) { std::shared_ptr core = ov::test::utils::PluginCache::get().core(); core->set_property(target_device, config); - ov::AnyMap property_config_reserve = {{ov::num_streams.name(), 1}, + ov::AnyMap property_config_reserve = {{ov::num_streams.name(), ov::streams::Num(1)}, {ov::inference_num_threads.name(), 1}, {ov::hint::enable_cpu_reservation.name(), true}}; - ov::AnyMap property_config = {{ov::num_streams.name(), 1}, {ov::inference_num_threads.name(), 1}}; + ov::AnyMap property_config = {{ov::num_streams.name(), ov::streams::Num(1)}, {ov::inference_num_threads.name(), 1}}; std::vector threads(2); for (auto& thread : threads) { thread = std::thread([&]() { auto value = counter++; - (void)core->compile_model(models[value % models.size()], - target_device, - value == 1 ? property_config : property_config_reserve); + auto compiled_model = core->compile_model(models[value % models.size()], + target_device, + value == 1 ? property_config : property_config_reserve); + auto cpu_reservation = compiled_model.get_property(ov::hint::enable_cpu_reservation.name()); + auto num_streams = compiled_model.get_property(ov::num_streams.name()); + ASSERT_EQ(cpu_reservation, value == 1 ? false : true); + ASSERT_EQ(num_streams, ov::streams::Num(1)); }); } diff --git a/src/plugins/intel_gpu/tests/functional/concurrency/gpu_reservation_test.cpp b/src/plugins/intel_gpu/tests/functional/concurrency/gpu_reservation_test.cpp index 9b389f3ccb785d..07d4879257185c 100644 --- a/src/plugins/intel_gpu/tests/functional/concurrency/gpu_reservation_test.cpp +++ b/src/plugins/intel_gpu/tests/functional/concurrency/gpu_reservation_test.cpp @@ -40,9 +40,13 @@ TEST_F(GpuReservationTest, Mutiple_CompiledModel_Reservation) { for (auto& thread : threads) { thread = std::thread([&]() { auto value = counter++; - (void)core->compile_model(models[value % models.size()], - target_devices[value % target_devices.size()], - value == 0 ? property_config : property_config_gpu); + auto compiled_model = core->compile_model(models[value % models.size()], + target_devices[value % target_devices.size()], + value == 0 ? property_config : property_config_gpu); + auto num_streams = compiled_model.get_property(ov::num_streams.name()); + auto cpu_reservation = compiled_model.get_property(ov::hint::enable_cpu_reservation.name()); + ASSERT_EQ(num_streams, ov::streams::Num(1)); + ASSERT_EQ(cpu_reservation, true); }); } From d0e19e1694d54ef8e66c3b279ea2d1b4c689f0a9 Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Thu, 16 Jan 2025 16:38:24 +0800 Subject: [PATCH 28/30] change _cpu_ids_all to Impl() --- src/inference/src/dev/threading/cpu_streams_executor.cpp | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/src/inference/src/dev/threading/cpu_streams_executor.cpp b/src/inference/src/dev/threading/cpu_streams_executor.cpp index 9f8362d4dbb39c..a10709aa6db3df 100644 --- a/src/inference/src/dev/threading/cpu_streams_executor.cpp +++ b/src/inference/src/dev/threading/cpu_streams_executor.cpp @@ -145,10 +145,6 @@ struct CPUStreamsExecutor::Impl { _cpu_ids = stream_id < static_cast(stream_processors.size()) ? stream_processors[stream_id] : _cpu_ids; if (_cpu_ids.size() > 0) { - if (_impl->_config.get_cpu_reservation()) { - std::lock_guard lock(_impl->_cpu_ids_mutex); - _impl->_cpu_ids_all.insert(_impl->_cpu_ids_all.end(), _cpu_ids.begin(), _cpu_ids.end()); - } CpuSet processMask; int ncpus = 0; std::tie(processMask, ncpus) = get_process_mask(); @@ -341,6 +337,7 @@ struct CPUStreamsExecutor::Impl { _exectorMgr = executor_manager(); auto numaNodes = get_available_numa_nodes(); int streams_num = _config.get_streams(); + auto processor_ids = _config.get_stream_processor_ids(); if (streams_num != 0) { std::copy_n(std::begin(numaNodes), std::min(streams_num, numaNodes.size()), @@ -349,6 +346,10 @@ struct CPUStreamsExecutor::Impl { _usedNumaNodes = std::move(numaNodes); } for (auto streamId = 0; streamId < streams_num; ++streamId) { + if (_config.get_cpu_reservation()) { + std::lock_guard lock(_cpu_ids_mutex); + _cpu_ids_all.insert(_cpu_ids_all.end(), processor_ids[streamId].begin(), processor_ids[streamId].end()); + } _threads.emplace_back([this, streamId] { openvino::itt::threadName(_config.get_name() + "_" + std::to_string(streamId)); for (bool stopped = false; !stopped;) { From c0f2e693070ab934e20e2eb48734594a6aed00ad Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Thu, 16 Jan 2025 17:57:37 +0800 Subject: [PATCH 29/30] fix ci test --- .../custom/behavior/ov_executable_network/properties.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_executable_network/properties.cpp b/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_executable_network/properties.cpp index 8174c932ca63e6..6d62385c01dc04 100644 --- a/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_executable_network/properties.cpp +++ b/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_executable_network/properties.cpp @@ -162,7 +162,7 @@ TEST_F(OVClassConfigTestCPU, smoke_CpuExecNetworkCheckModelZeroStreams) { TEST_F(OVClassConfigTestCPU, smoke_CpuExecNetworkCheckCpuReservation) { ov::Core core; bool reservation = false; - int32_t threads = 0, input_threads = 2; + int32_t threads = 0, input_threads = 1; OV_ASSERT_NO_THROW(core.set_property(deviceName, ov::hint::performance_mode(ov::hint::PerformanceMode::LATENCY))); From e06fbdd2c05e58094b9fbb16c2dc683010988603 Mon Sep 17 00:00:00 2001 From: sunxiaoxia2022 Date: Thu, 16 Jan 2025 18:47:21 +0800 Subject: [PATCH 30/30] remove smoke_CpuExecNetworkCheckCpuReservation --- .../ov_executable_network/properties.cpp | 16 ---------------- 1 file changed, 16 deletions(-) diff --git a/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_executable_network/properties.cpp b/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_executable_network/properties.cpp index 6d62385c01dc04..fd9b5084a0c768 100644 --- a/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_executable_network/properties.cpp +++ b/src/plugins/intel_cpu/tests/functional/custom/behavior/ov_executable_network/properties.cpp @@ -159,22 +159,6 @@ TEST_F(OVClassConfigTestCPU, smoke_CpuExecNetworkCheckModelZeroStreams) { ASSERT_EQ(streams, value); } -TEST_F(OVClassConfigTestCPU, smoke_CpuExecNetworkCheckCpuReservation) { - ov::Core core; - bool reservation = false; - int32_t threads = 0, input_threads = 1; - - OV_ASSERT_NO_THROW(core.set_property(deviceName, ov::hint::performance_mode(ov::hint::PerformanceMode::LATENCY))); - - ov::AnyMap config = {{ov::hint::enable_cpu_reservation.name(), true}, {ov::inference_num_threads.name(), input_threads}}; - ov::CompiledModel compiledModel = core.compile_model(model, deviceName, config); - - OV_ASSERT_NO_THROW(reservation = compiledModel.get_property(ov::hint::enable_cpu_reservation)); - OV_ASSERT_NO_THROW(threads = compiledModel.get_property(ov::inference_num_threads)); - ASSERT_EQ(reservation, true); - ASSERT_EQ(threads, input_threads); -} - TEST_F(OVClassConfigTestCPU, smoke_CpuExecNetworkCheckSparseWeigthsDecompressionRate) { ov::Core core;