From 11b8483b63c8ffe9fbe76d78c3db43a87e567874 Mon Sep 17 00:00:00 2001 From: Andreew Gregory Date: Sun, 29 Mar 2026 14:13:20 +0300 Subject: [PATCH] Fixed dumb shit 2 --- dedicated_ai_server/server.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/dedicated_ai_server/server.py b/dedicated_ai_server/server.py index 84a9a9b..c4bd2f2 100644 --- a/dedicated_ai_server/server.py +++ b/dedicated_ai_server/server.py @@ -141,7 +141,7 @@ def generate_llm_pieces(bundle: ModelBundle, messages: list) -> Iterable[str]: token_text = bundle.tokenizer.decode([token_id], skip_special_tokens=True) if token_text: yield token_text -- + past_key_values = outputs.past_key_values input_ids = next_token_id.unsqueeze(1) if attention_mask is not None: