mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-12-16 11:50:35 +08:00
fix checkpoint loading
This commit is contained in:
@@ -21,8 +21,14 @@ def main():
|
||||
model = model.cuda()
|
||||
model.eval()
|
||||
|
||||
def format_example(query):
    """Wrap *query* in the Alpaca-style instruction prompt template.

    Returns the prompt string ending with "Assistant: " so the model's
    generation continues as the assistant's reply.
    """
    return (
        "Below is an instruction that describes a task. "
        "Write a response that appropriately completes the request.\n"
        f"Instruction:\nHuman: {query}\nAssistant: "
    )
|
||||
|
||||
def predict(query, history: list):
|
||||
inputs = tokenizer([query], return_tensors="pt")
|
||||
inputs = tokenizer([format_example(query)], return_tensors="pt")
|
||||
inputs = inputs.to(model.device)
|
||||
gen_kwargs = {
|
||||
"do_sample": True,
|
||||
|
||||
Reference in New Issue
Block a user