diff --git a/python/llm/src/ipex_llm/transformers/npu_pipeline_model/qwen.py b/python/llm/src/ipex_llm/transformers/npu_pipeline_model/qwen.py index 38c86a63101..bb8003f06a7 100644 --- a/python/llm/src/ipex_llm/transformers/npu_pipeline_model/qwen.py +++ b/python/llm/src/ipex_llm/transformers/npu_pipeline_model/qwen.py @@ -42,7 +42,6 @@ def convert_lm_head_and_embedding(model, temp_dir, weight_dir, else: lm_heads = lm_head.lm_heads asym = lm_heads[0].qtype == "asym_int4_rtn" - print("asym is ", asym, lm_heads[0].qtype) lm_head_weights = [] scales = [] zeros = []