From a58fab8d6e5856a5e9b3c91f3d7092f23b11f2db Mon Sep 17 00:00:00 2001 From: ViperEkura <3081035982@qq.com> Date: Sun, 10 May 2026 20:17:47 +0800 Subject: [PATCH] =?UTF-8?q?fix:=20max=5Fseq=5Flen=20=E6=A3=80=E6=9F=A5?= =?UTF-8?q?=E6=94=B9=E4=B8=BA=E4=BB=85=20prompt=20=E8=B6=85=E9=99=90?= =?UTF-8?q?=E5=8F=91=20STOP=EF=BC=8Cmax=5Ftokens=20=E8=B6=85=E5=87=BA?= =?UTF-8?q?=E9=83=A8=E5=88=86=20clamp?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- astrai/inference/scheduler.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/astrai/inference/scheduler.py b/astrai/inference/scheduler.py index d83e2ed..23a1fce 100644 --- a/astrai/inference/scheduler.py +++ b/astrai/inference/scheduler.py @@ -147,11 +147,13 @@ class InferenceScheduler: if len(prompt_ids) > self.max_prompt_len: prompt_ids = prompt_ids[-self.max_prompt_len :] - if len(prompt_ids) + max_tokens > self.max_seq_len: + if len(prompt_ids) >= self.max_seq_len: if stream_callback: stream_callback(STOP) return task_id + max_tokens = min(max_tokens, self.max_seq_len - len(prompt_ids)) + task = Task( task_id=task_id, prompt_ids=prompt_ids,