Skip to content
This repository was archived by the owner on Oct 25, 2024. It is now read-only.

Commit 59ab036

Browse files
Remove OneDNN env setting for BF16 inference (#509)
Signed-off-by: lvliang-intel <liang1.lv@intel.com> Co-authored-by: VincyZhang <wenxin.zhang@intel.com>
1 parent d65bd8b commit 59ab036

File tree

3 files changed

+0
-15
lines changed

3 files changed

+0
-15
lines changed

intel_extension_for_transformers/neural_chat/models/model_utils.py

Lines changed: 0 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -254,11 +254,6 @@ def init_deepspeed_inference(model, model_name_or_path, use_hpu_graphs, is_meta)
254254
model = deepspeed.init_inference(model, **ds_inference_kwargs)
255255
return model.module
256256

257-
258-
def set_cpu_running_env():
259-
os.environ["ONEDNN_MAX_CPU_ISA"] = "AVX512_CORE_BF16"
260-
261-
262257
def load_model(
263258
model_name,
264259
tokenizer_name,
@@ -298,8 +293,6 @@ def load_model(
298293
)
299294

300295
adapt_transformers_to_gaudi()
301-
elif device == "cpu" and not ipex_int8:
302-
set_cpu_running_env()
303296

304297
if isinstance(optimization_config, AMPConfig):
305298
dtype = optimization_config.dtype

intel_extension_for_transformers/neural_chat/pipeline/plugins/ner/ner.py

Lines changed: 0 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -28,7 +28,6 @@
2828
)
2929
import intel_extension_for_pytorch as intel_ipex
3030
from .utils.utils import (
31-
set_cpu_running_env,
3231
enforce_stop_tokens,
3332
get_current_time
3433
)
@@ -43,9 +42,6 @@ class NamedEntityRecognition():
4342
"""
4443

4544
def __init__(self, model_path="./Llama-2-7b-chat-hf/", spacy_model="en_core_web_lg", bf16: bool=False) -> None:
46-
# set up cpu running environment
47-
if bf16:
48-
set_cpu_running_env()
4945
# initialize tokenizer and models
5046
self.nlp = spacy.load(spacy_model)
5147
config = AutoConfig.from_pretrained(model_path, trust_remote_code=True)

intel_extension_for_transformers/neural_chat/pipeline/plugins/ner/utils/utils.py

Lines changed: 0 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -35,7 +35,3 @@ def get_current_time() -> str:
3535
utc_now = datetime.datetime.utcnow().replace(tzinfo=timezone.utc)
3636
cur_time = utc_now.astimezone(SHA_TZ).strftime("%Y/%m/%d")
3737
return cur_time
38-
39-
40-
def set_cpu_running_env():
41-
os.environ["ONEDNN_MAX_CPU_ISA"] = "AVX512_CORE_BF16"

0 commit comments

Comments
 (0)