
bugfix: remove duplicate load_peft_model

hongbo.mo · 1 year ago
commit fcc817e923
1 file changed, 1 insertion and 5 deletions

inference/inference.py: +1, -5

@@ -99,11 +99,7 @@ def main(
         print("Skipping the inference as the prompt is not safe.")
         sys.exit(1)  # Exit the program with an error status
         
-    if peft_model:
-        model = load_peft_model(model, peft_model)
-
-    model.eval()
-    batch = tokenizer(user_prompt, padding='max_length', truncation=True,max_length=max_padding_length,return_tensors="pt")
+    batch = tokenizer(user_prompt, padding='max_length', truncation=True, max_length=max_padding_length, return_tensors="pt")
 
     batch = {k: v.to("cuda") for k, v in batch.items()}
     start = time.perf_counter()
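
For context, the removed block is presumably redundant because main() already attaches the PEFT adapter and switches the model to eval mode earlier, before the safety check, which is why the commit message calls it a duplicate. The sketch below is a minimal illustration of the intended single load path, written directly against the Hugging Face transformers and peft APIs; the repo's own helper (load_peft_model) and the function/argument names here are assumptions, not the file's exact code.

```python
# Hypothetical sketch of the single (non-duplicated) load path assumed by this fix.
# The real inference.py wraps these steps in its own helpers (e.g. load_peft_model);
# model names and arguments here are placeholders.
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer
from peft import PeftModel


def load_model_for_inference(model_name: str, peft_model: str = None):
    """Load the base model once, optionally attach a PEFT adapter, and set eval mode."""
    model = AutoModelForCausalLM.from_pretrained(
        model_name, torch_dtype=torch.float16, device_map="auto"
    )
    if peft_model:
        # Attach the fine-tuned adapter exactly once, before any inference code runs.
        model = PeftModel.from_pretrained(model, peft_model)
    model.eval()
    tokenizer = AutoTokenizer.from_pretrained(model_name)
    return model, tokenizer
```

With the model prepared once up front, the hunk above only needs to tokenize the prompt, which is all the post-fix code does.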