fix: batch 推理示例添加 chat template 和 system prompt

- 新增 prompts 列表，对每个输入应用 apply_chat_template
- 添加 system message 到对话模板
2026-05-14 20:59:01 +08:00 · 2026-05-14 20:59:01 +08:00 · f0339022c1
parent d8da2cf17c
commit f0339022c1
1 changed file with 12 additions and 1 deletion
--- a/scripts/demo/generate_batch.py
+++ b/scripts/demo/generate_batch.py
@@ -24,12 +24,23 @@ def batch_generate():
        "请问什么是显卡",
    ]
    prompts = [
        tokenizer.apply_chat_template(
            [
                {"role": "system", "content": "You are a helpful assistant."},
                {"role": "user", "content": q},
            ],
            tokenize=False,
        )
        for q in inputs
    ]
    engine = InferenceEngine(
        model=model,
        tokenizer=tokenizer,
    )
    responses = engine.generate(
-        prompt=inputs,
+        prompt=prompts,
        stream=False,
        max_tokens=2048,
        temperature=0.8,