From 6ba3e18d6ef5e0843d540f6d0908a2b9f77100bb Mon Sep 17 00:00:00 2001 From: ZheWang Date: Tue, 24 Oct 2023 01:06:46 -0700 Subject: [PATCH 1/5] update KBlocks --- .../graph/core/layers/inner_product.cpp | 38 +++++++++++++++++++ .../graph/core/layers/jblas_common.hpp | 3 +- 2 files changed, 40 insertions(+), 1 deletion(-) diff --git a/intel_extension_for_transformers/llm/runtime/graph/core/layers/inner_product.cpp b/intel_extension_for_transformers/llm/runtime/graph/core/layers/inner_product.cpp index 065ad048df4..3937861d1d9 100644 --- a/intel_extension_for_transformers/llm/runtime/graph/core/layers/inner_product.cpp +++ b/intel_extension_for_transformers/llm/runtime/graph/core/layers/inner_product.cpp @@ -92,6 +92,32 @@ using PerNFp32Fp32 = jblas::wrapper::gemm_pack_weight::GemmInterfaceParallelAB< jblas::utils::parallel::Parallel2DGemm>; } // namespace avx512_vnni +namespace avx_vnni { +JBLAS_ISA constexpr DefaultISA = JblasAVX_VNNI; + +template