From 309c2da5e18ce75b3ecc3ff3f2d71d51477ad4d1 Mon Sep 17 00:00:00 2001
From: lvliang-intel
Date: Fri, 21 Jun 2024 10:25:29 +0800
Subject: [PATCH] Add preload env in run.sh to fix xft-vllm perf issue (#204)

* add preload env in run.sh

Signed-off-by: lvliang-intel

* update comments

Signed-off-by: lvliang-intel

---------

Signed-off-by: lvliang-intel
---
 comps/llms/text-generation/vllm-xft/run.sh | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/comps/llms/text-generation/vllm-xft/run.sh b/comps/llms/text-generation/vllm-xft/run.sh
index 85fbb41a2..cd06458fc 100644
--- a/comps/llms/text-generation/vllm-xft/run.sh
+++ b/comps/llms/text-generation/vllm-xft/run.sh
@@ -3,7 +3,9 @@
 # Copyright (C) 2024 Intel Corporation
 # SPDX-License-Identifier: Apache-2.0
 
-# Preload libiomp5.so by following cmd or LD_PRELOAD=libiomp5.so manually
+# Preloading libiomp5.so is essential for optimal performance.
+# libiomp5.so is the Intel OpenMP runtime library, providing parallel computation support,
+# thread management, task scheduling, and performance optimization on Intel X86 platforms.
 export $(python -c 'import xfastertransformer as xft; print(xft.get_env())')
 
 # convert the model to fastertransformer format