
Commit 2b477c1

[CPU] extend bf16 fp16 cpu functional tests on LNL+ systems (#29168)
### Details:
- *extend bf16 fp16 cpu functional tests on LNL+ systems*

### Tickets:
- *CVS-161636*
1 parent 8c7c31a commit 2b477c1
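In short, the commit treats AVX2_VNNI_2-capable CPUs (Lunar Lake and newer) as platforms with native bf16/f16 support, both in the ScaledDotProductAttention node and across the functional-test utilities. A minimal standalone sketch of the expectation the tests now encode is shown below; the helper name `expected_runtime_precision` and its boolean parameters are illustrative only and not part of the plugin API.

#include "openvino/core/type/element_type.hpp"

// Hypothetical helper mirroring the precision deduction the tests expect:
// bf16 survives when either AVX512-BF16 or AVX2_VNNI_2 (LNL+) is available,
// otherwise the plugin is expected to fall back to f32.
inline ov::element::Type expected_runtime_precision(ov::element::Type requested,
                                                    bool has_avx512_core,
                                                    bool has_avx2_vnni_2) {
    if (requested == ov::element::bf16) {
        return (has_avx512_core || has_avx2_vnni_2) ? ov::element::bf16 : ov::element::f32;
    }
    return requested;
}

The same rule appears twice in CPUTestsBase::deduce_expected_precision in the cpu_test_utils.cpp diff below, once for the enforced inference precision and once after the transformation pipeline stage.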

File tree

16 files changed: +112 / -26 lines changed

src/plugins/intel_cpu/src/nodes/scaled_attn.cpp

+12-5
@@ -1238,10 +1238,17 @@ void ScaledDotProductAttention::createPrimitive() {
     std::shared_ptr<Executor> executor = nullptr;
 #ifdef OPENVINO_ARCH_X86_64
     if (rtPrecision == ov::element::bf16) {
-        executor = std::make_shared<AttentionExecutor<KT_ONEDNN, ov::bfloat16>>(context,
-                                                                                m_key_quant_param.groupSize,
-                                                                                m_value_quant_param.groupSize,
-                                                                                m_key_quant_param.isByChannel);
+        if (ov::with_cpu_x86_bfloat16()) {
+            executor = std::make_shared<AttentionExecutor<KT_ONEDNN, ov::bfloat16>>(context,
+                                                                                    m_key_quant_param.groupSize,
+                                                                                    m_value_quant_param.groupSize,
+                                                                                    m_key_quant_param.isByChannel);
+        } else {
+            executor = std::make_shared<AttentionExecutor<KT_REF, ov::bfloat16>>(context,
+                                                                                 m_key_quant_param.groupSize,
+                                                                                 m_value_quant_param.groupSize,
+                                                                                 m_key_quant_param.isByChannel);
+        }
     } else if (rtPrecision == ov::element::f16) {
         if (with_cpu_x86_avx512_core_fp16()) {
             executor = std::make_shared<AttentionExecutor<KT_ONEDNN, ov::float16>>(context,

@@ -2075,7 +2082,7 @@ const ScaledDotProductAttention::SDPAQuantParam& ScaledDotProductAttention::getV
 ov::element::Type ScaledDotProductAttention::getRuntimePrecision() const {
     auto rtPrecision = getOriginalInputPrecisionAtPort(0);
     // bf16 should be enabled only when platform supports
-    if (rtPrecision == ov::element::bf16 && ov::with_cpu_x86_bfloat16()) {
+    if (rtPrecision == ov::element::bf16 && (ov::with_cpu_x86_bfloat16() || mayiuse(cpu_isa_t::avx2_vnni_2))) {
         rtPrecision = ov::element::bf16;
     } else if (rtPrecision == ov::element::f16 && ov::intel_cpu::hasHardwareSupport(ov::element::f16)) {
         rtPrecision = ov::element::f16;
src/plugins/intel_cpu/src/nodes/topk.cpp

+2-3
@@ -18,6 +18,7 @@
 #include "onednn/dnnl.h"
 #include "openvino/core/parallel.hpp"
 #include "openvino/op/topk.hpp"
+#include "utils/cpu_utils.hpp"
 #include "utils/ngraph_utils.hpp"

 using namespace dnnl;

@@ -1985,11 +1986,9 @@ void TopK::initSupportedPrimitiveDescriptors() {
                                                  ov::element::u8};

     ov::element::Type dataPrecision = getOriginalOutputPrecisionAtPort(TOPK_DATA);
-    if (dataPrecision == ov::element::bf16 && !mayiuse(avx512_core)) {
-        THROW_CPU_NODE_ERR("gets incorrect isa for BF16! AVX512 must be supported!");
-    }
     bool precisionSupported = std::find(std::begin(supportedPrecision), std::end(supportedPrecision), dataPrecision) !=
                               std::end(supportedPrecision);
+    precisionSupported = (dataPrecision == ov::element::bf16 && !mayiuse(avx512_core)) ? false : precisionSupported;
     if (!precisionSupported) {
         if (dataPrecision.is_real()) {
             dataPrecision = ov::element::f32;
src/plugins/intel_cpu/tests/functional/custom/single_layer_tests/classes/conversion.cpp

+6
@@ -145,6 +145,12 @@ void ConvertCPULayerTest::SetUp() {
     auto conversion = std::make_shared<ov::op::v0::Convert>(params.front(), outPrc);

     function = makeNgraphFunction(inPrc, params, conversion, "ConversionCPU");
+
+    // issue 161636
+    if (special_value == ov::test::SpecialValue::none && outPrc == ov::element::f8e4m3) {
+        abs_threshold = 0.0078125f;
+        rel_threshold = 1e-2f;
+    }
 }

 void ConvertCPULayerTest::generate_inputs(const std::vector<ov::Shape>& targetInputStaticShapes) {
src/plugins/intel_cpu/tests/functional/custom/single_layer_tests/classes/eltwise.cpp

+9
@@ -158,6 +158,15 @@ void EltwiseLayerCPUTest::SetUp() {
     std::tie(inFmts, outFmts, priority, selectedType) = cpuParams;
     std::tie(postOpMgrPtr, fusedOps) = fusingParams;

+    // issue 163147
+    if (ElementType::f16 == netType && enforceSnippets) {
+        auto fusedOpsNames = postOpMgrPtr ? postOpMgrPtr->getFusedOpsNames() : "";
+        if (fusedOpsNames.find("PerChannel") != std::string::npos) {
+            rel_threshold = 0.01f;
+            abs_threshold = 0.0078125f;
+        }
+    }
+
     shapes.resize(2);
     switch (opType) {
         case ov::test::utils::OpType::SCALAR: {
src/plugins/intel_cpu/tests/functional/custom/single_layer_tests/classes/scaled_attn.cpp

+7-2
@@ -59,7 +59,12 @@ void ScaledAttnLayerCPUTest::SetUp() {
     }

     if (inType == ElementType::bf16) {
-        rel_threshold = 2e-2f;
+        // Issue: 163144
+        if (with_cpu_x86_avx2_vnni_2()) {
+            rel_threshold = 0.2f;
+        } else {
+            rel_threshold = 2e-2f;
+        }
     }
     selectedType = makeSelectedTypeStr(selectedType, inType);
     init_input_shapes(inputShapes);

@@ -133,7 +138,7 @@ TEST_P(ScaledAttnLayerCPUTest, CompareWithRefs) {
     bool has_scale;
     std::string targetDevice;
     std::tie(inType, inputShapes, is_causal, has_attn, has_scale, targetDevice, cpuParams) = this->GetParam();
-    if (inType == ElementType::bf16 && !ov::with_cpu_x86_bfloat16())
+    if (inType == ElementType::bf16 && !ov::with_cpu_x86_bfloat16() && !with_cpu_x86_avx2_vnni_2())
         GTEST_SKIP();
     run();
     CheckPluginRelatedResults(compiledModel, "ScaledAttn");
src/plugins/intel_cpu/tests/functional/custom/single_layer_tests/instances/x64/matmul.cpp

+1-1
@@ -157,7 +157,7 @@ std::vector<ov::AnyMap> filterAdditionalConfig_Brgemm() {
 #else
     std::vector<ov::AnyMap> additionalConfig = {{}};
 #endif
-    if (with_cpu_x86_bfloat16()) {
+    if (with_cpu_x86_bfloat16() || with_cpu_x86_avx2_vnni_2()) {
         additionalConfig.push_back({ov::hint::inference_precision(ov::element::bf16)});
     }
src/plugins/intel_cpu/tests/functional/custom/single_layer_tests/normalize.cpp

+7-1
@@ -64,7 +64,13 @@ class NormalizeL2LayerCPUTest : public testing::WithParamInterface<NormalizeL2La
         if (selectedType.empty()) {
             selectedType = getPrimitiveType();
         }
-        selectedType = makeSelectedTypeStr("unknown", inType);
+
+        if (!with_cpu_x86_avx512_core() && inType == ElementType::bf16) {
+            selectedType = makeSelectedTypeStr("unknown", ElementType::f32);
+        } else {
+            selectedType = makeSelectedTypeStr("unknown", inType);
+        }
+
         targetDevice = ov::test::utils::DEVICE_CPU;
         init_input_shapes({shapes});
src/plugins/intel_cpu/tests/functional/custom/single_layer_tests/roi_pooling.cpp

+6-1
@@ -194,7 +194,12 @@ class ROIPoolingCPULayerTest : public testing::WithParamInterface<ROIPoolingCPUT
             selectedType = getPrimitiveType();
         }
         selectedType.push_back('_');
-        selectedType += netPrecision.to_string();
+
+        if (!with_cpu_x86_avx512_core() && netPrecision == ElementType::bf16) {
+            selectedType += ov::element::f32.to_string();
+        } else {
+            selectedType += netPrecision.to_string();
+        }

         if (netPrecision == ov::element::bf16) {
             rel_threshold = 1e-2;
src/plugins/intel_cpu/tests/functional/custom/single_layer_tests/topk.cpp

+5-1
@@ -102,7 +102,11 @@ class TopKLayerCPUTest : public testing::WithParamInterface<TopKLayerCPUTestPara
         inPrc = outPrc = netPrecision;
         configuration.insert(additionalConfig.begin(), additionalConfig.end());

-        selectedType = getPrimitiveType() + "_" + ov::element::Type(netPrecision).get_type_name();
+        if (!ov::with_cpu_x86_avx512_core() && netPrecision == ElementType::bf16) {
+            selectedType = makeSelectedTypeStr(getPrimitiveType(), ElementType::f32);
+        } else {
+            selectedType = makeSelectedTypeStr(getPrimitiveType(), netPrecision);
+        }

         staticShape = inputShape.first.rank() == 0;
         if (staticShape) {
src/plugins/intel_cpu/tests/functional/custom/subgraph_tests/src/x64/interaction.cpp

+3-1
@@ -149,7 +149,7 @@ class IntertactionCPUTest : public testing::WithParamInterface<InteractionLayerC
         ElementType inType;
         InputShape inputShape;
         std::tie(inType, inputShape) = this->GetParam();
-        bool with_bf16 = ov::with_cpu_x86_bfloat16();
+        bool with_bf16 = ov::with_cpu_x86_bfloat16() || with_cpu_x86_avx2_vnni_2();
         if (with_bf16 && (inType == ov::element::bf16 || inType == ov::element::i32)) {
             selectedType = makeSelectedTypeStr("ref_any", ov::element::bf16);
         } else {

@@ -177,6 +177,8 @@ TEST_P(IntertactionCPUTest_FP16, CompareWithRefs) {
         GTEST_SKIP() << "Skipping test, platform don't support precision f16";
     }
     configuration.insert({ov::hint::inference_precision.name(), ov::element::f16});
+    rel_threshold = 0.01;
+    abs_threshold = 0.0078125;

     run();
     CheckNumberOfNodesWithType(compiledModel, "Interaction", 1);
src/plugins/intel_cpu/tests/functional/shared_tests_instances/skip_tests_config.cpp

+13-4
@@ -9,10 +9,11 @@
 #if defined(OPENVINO_ARCH_RISCV64)
 # include "nodes/kernels/riscv64/cpu_isa_traits.hpp"
 #endif
-
 #include <string>
 #include <vector>

+#include "utils/cpu_test_utils.hpp"
+
 std::vector<std::string> disabledTestPatterns() {
     std::vector<std::string> retVector{
         // TODO: Issue 31841

@@ -491,7 +492,7 @@ std::vector<std::string> disabledTestPatterns() {
     retVector.emplace_back(R"(.*smoke_RDFT_CPU_1D/RDFTTestCPU.CompareWithRefs/prec=f32_IS0=\[\]_TS0=\(\(126\)\)_constAxes=true_axes=\(\(0\)\)_isInverse=false.*)");
     retVector.emplace_back(R"(.*smoke_RDFT_CPU_2D/RDFTTestCPU.CompareWithRefs/prec=f32_IS0=\[\]_TS0=\(\(16.38\)\)_constAxes=true_axes=\(\(0.1\)\)_isInverse=false.*)");
 #endif
-    if (!ov::with_cpu_x86_avx512_core()) {
+    if (!ov::intel_cpu::hasHardwareSupport(ov::element::bf16)) {
         // on platforms which do not support bfloat16, we are disabling bf16 tests since there are no bf16 primitives,
         // tests are useless on such platforms
         retVector.emplace_back(R"(.*(BF|bf)16.*)");

@@ -504,7 +505,7 @@ std::vector<std::string> disabledTestPatterns() {
         retVector.emplace_back(R"(.*Snippets.*MHA.*)");
         retVector.emplace_back(R"(.*Snippets.*(MatMul|Matmul).*)");
     }
-    if (!ov::with_cpu_x86_avx512_core_fp16()) {
+    if (!ov::intel_cpu::hasHardwareSupport(ov::element::f16)) {
         // Skip fp16 tests for paltforms that don't support fp16 precision
         retVector.emplace_back(R"(.*INFERENCE_PRECISION_HINT=(F|f)16.*)");
         retVector.emplace_back(R"(.*ConcatMultiQuerySDPTest.*f16.*)");

@@ -638,7 +639,7 @@ std::vector<std::string> disabledTestPatterns() {
         retVector.emplace_back(R"(.*smoke_Deconv_(2|3)D_NSPC_INT8_AMX/DeconvolutionLayerCPUTest.*)");
     }

-    if (ov::with_cpu_x86_avx512_core_fp16()) {
+    if (ov::with_cpu_x86_avx512_core_fp16() || CPUTestUtils::with_cpu_x86_avx2_vnni_2()) {
         // Issue: 143852
         retVector.emplace_back(R"(smoke_ConvertRangeSubgraphCPUTest/ConvertRangeSubgraphCPUTest\.CompareWithRefs.*Prc=f16.*)");
         retVector.emplace_back(R"((smoke|nightly)_FC_3D_FP16/.*_Fused=Multiply\(PerChannel\).*)");

@@ -649,5 +650,13 @@ std::vector<std::string> disabledTestPatterns() {
         retVector.emplace_back(R"(smoke_Conv_Sum_Broadcast_FP16/ConvSumInPlaceTest.*Relu\.Multiply\(PerChannel\)\.Add\(PerChannel\).*)");
     }

+    if (CPUTestUtils::with_cpu_x86_avx2_vnni_2()) {
+        // jit_gemm_BF16 kernels are not supported for conv,inner_product,matmul on avx2_vnni_2 platforms
+        retVector.emplace_back(R"(smoke_Conv_.*D_GEMM_BF16.*)");
+        retVector.emplace_back(
+            R"(smoke_GroupConv_.*D_Gemm_BF16/GroupConvolutionLayerCPUTest.CompareWithRefs.*primitive=jit_gemm.*)");
+        retVector.emplace_back(R"(smoke_.*MatMulLayerCPUTest.*INFERENCE_PRECISION_HINT=bf16.*_primitive=jit_gemm.*)");
+    }
+
     return retVector;
 }
src/plugins/intel_cpu/tests/functional/utils/cpu_test_utils.cpp

+27-5
@@ -12,6 +12,9 @@
 #include "transformations/rt_info/primitives_priority_attribute.hpp"
 #include "utils/general_utils.h"
 #include "utils/rt_info/memory_formats_attribute.hpp"
+#if defined(OPENVINO_ARCH_X86) || defined(OPENVINO_ARCH_X86_64)
+# include <xbyak/xbyak_util.h>
+#endif

 namespace CPUTestUtils {
 const char* CPUTestsBase::any_type = "any_type";

@@ -45,6 +48,22 @@ const char* CPUTestsBase::cpu_fmt2str(cpu_memory_format_t v) {
     return "undef";
 }

+#if defined(OPENVINO_ARCH_X86) || defined(OPENVINO_ARCH_X86_64)
+static Xbyak::util::Cpu& get_cpu_info() {
+    static Xbyak::util::Cpu cpu;
+    return cpu;
+}
+bool with_cpu_x86_avx2_vnni_2() {
+    return get_cpu_info().has(Xbyak::util::Cpu::tAVX2 | Xbyak::util::Cpu::tAVX_VNNI) &&
+           get_cpu_info().has(Xbyak::util::Cpu::tAVX_VNNI_INT8) &&
+           get_cpu_info().has(Xbyak::util::Cpu::tAVX_NE_CONVERT);
+}
+#else // OPENVINO_ARCH_X86 || OPENVINO_ARCH_X86_64
+bool with_cpu_x86_avx2_vnni_2() {
+    return false;
+}
+#endif // OPENVINO_ARCH_X86 || OPENVINO_ARCH_X86_64
+
 cpu_memory_format_t CPUTestsBase::cpu_str2fmt(const char* str) {
 #define CASE(_fmt) \
     do { \

@@ -472,9 +491,10 @@ CPUTestsBase::deduce_expected_precision(const ov::element::Type& opPrecision,
     if (it != configuration.end()) {
         auto inferencePrecisionConfig = it->second.as<ov::element::Type>();
         inferencePrecisionSetExplicitly = true;
-        // TODO also need to check (dnnl::impl::cpu::x64::avx2_vnni_2)
-        if ((inferencePrecisionConfig == ov::element::bf16 && ov::with_cpu_x86_avx512_core()) ||
-            (inferencePrecisionConfig == ov::element::f16 && ov::with_cpu_x86_avx512_core_fp16()) ||
+        if ((inferencePrecisionConfig == ov::element::bf16 &&
+             (ov::with_cpu_x86_avx512_core() || with_cpu_x86_avx2_vnni_2())) ||
+            (inferencePrecisionConfig == ov::element::f16 &&
+             (ov::with_cpu_x86_avx512_core_fp16() || with_cpu_x86_avx2_vnni_2())) ||
             (inferencePrecisionConfig == ov::element::f32) || (inferencePrecisionConfig == ov::element::dynamic)) {
             inferencePrecision = inferencePrecisionConfig;
         }

@@ -495,7 +515,8 @@ CPUTestsBase::deduce_expected_precision(const ov::element::Type& opPrecision,
     ov::element::Type deducedType = opPrecision;
     // enforceInferPrecision stage
     if (inferencePrecision == ov::element::bf16) {
-        deducedType = ov::with_cpu_x86_avx512_core() ? ov::element::bf16 : ov::element::f32;
+        deducedType =
+            (ov::with_cpu_x86_avx512_core() || with_cpu_x86_avx2_vnni_2()) ? ov::element::bf16 : ov::element::f32;
     }

     // ngraph transform pipeline stage

@@ -505,7 +526,8 @@ CPUTestsBase::deduce_expected_precision(const ov::element::Type& opPrecision,
         }
     }
     if (deducedType == ov::element::bf16) {
-        deducedType = ov::with_cpu_x86_avx512_core() ? ov::element::bf16 : ov::element::f32;
+        deducedType =
+            (ov::with_cpu_x86_avx512_core() || with_cpu_x86_avx2_vnni_2()) ? ov::element::bf16 : ov::element::f32;
     } else if (deducedType == ov::element::f16) {
         if (inferencePrecision != ov::element::f16 && inferencePrecision != ov::element::dynamic) {
             deducedType = ov::element::f32;

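For context, a minimal sketch of how a functional test could consume the new CPUTestUtils::with_cpu_x86_avx2_vnni_2() helper, in the same spirit as the guards added in scaled_attn.cpp and interaction.cpp above; the test suite and test name here are hypothetical:

#include <gtest/gtest.h>

#include "openvino/runtime/system_conf.hpp"  // declares ov::with_cpu_x86_bfloat16()
#include "utils/cpu_test_utils.hpp"          // declares CPUTestUtils::with_cpu_x86_avx2_vnni_2()

// Hypothetical guard: run bf16 coverage only when the platform reports either
// AVX512-BF16 or the AVX2_VNNI_2 feature set (LNL+), otherwise skip.
TEST(HypotheticalBF16Smoke, SkipsWithoutNativeBF16Support) {
    if (!ov::with_cpu_x86_bfloat16() && !CPUTestUtils::with_cpu_x86_avx2_vnni_2()) {
        GTEST_SKIP() << "bf16 is not natively supported on this platform";
    }
    // ... build the bf16 model, infer, and compare against the f32 reference ...
}

This mirrors the skip condition added to ScaledAttnLayerCPUTest::CompareWithRefs earlier in this commit.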
src/plugins/intel_cpu/tests/functional/utils/cpu_test_utils.hpp

+1-1
@@ -113,7 +113,7 @@ inline std::string nodeType2str(nodeType nt) {
         return "GroupConvolutionBackpropData";
     throw std::runtime_error("Undefined node type to convert to string!");
 }
-
+bool with_cpu_x86_avx2_vnni_2();
 class CPUTestsBase {
 public:
     typedef std::map<std::string, ov::Any> CPUInfo;
src/tests/functional/plugin/shared/include/snippets/mha.hpp

+1
@@ -58,6 +58,7 @@ class MHA : public testing::WithParamInterface<ov::test::snippets::MHAParams>,
 protected:
     std::shared_ptr<SnippetsFunctionBase> get_subgraph() const override;
     void init_params(std::vector<InputShape>& input_shapes, ov::element::Type& prc, ov::AnyMap& additional_config) override;
+    void init_thresholds() override;

     bool m_with_mul = false;
 };
src/tests/functional/plugin/shared/src/snippets/mha.cpp

+11
@@ -153,6 +153,17 @@ std::shared_ptr<SnippetsFunctionBase> MHA::get_subgraph() const {
     return std::make_shared<ov::test::snippets::MHAFunction>(inputDynamicShapes, m_input_types, m_with_mul, is_with_reshape);
 }

+void MHA::init_thresholds() {
+    MHABase::init_thresholds();
+    auto precision_hint = configuration.count(ov::hint::inference_precision.name())
+                              ? configuration.at(ov::hint::inference_precision.name())
+                              : ov::element::f32;
+    if (m_input_types.size() > 1 && m_input_types[0] == ov::element::bf16 && precision_hint == ov::element::f32) {
+        rel_threshold = 0.01f;
+        abs_threshold = 0.0078125f;
+    }
+}
+
 void MHASelect::generate_inputs(const std::vector<ov::Shape>& targetInputStaticShapes) {
     inputs.clear();
     auto model_inputs = function->inputs();
src/tests/functional/shared_test_classes/src/base/ov_subgraph.cpp

+1-1
@@ -306,7 +306,7 @@ void SubgraphBaseTest::compile_model() {
         std::cout << "[ PLUGIN ] `SubgraphBaseTest::compile_model()` is finished successfully. Duration is " << duration.count() << "s" << std::endl;
     }
     try {
-        inference_precision = core->get_property(targetDevice, ov::hint::inference_precision);
+        inference_precision = compiledModel.get_property(ov::hint::inference_precision);
     } catch (std::exception& e) {
         std::cout << "[ WARNING ] Impossible to get Inference Precision with exception: " << e.what() << std::endl;
     }