From 0733d178d0c23cc392969c0c79e4ac410b17ff7b Mon Sep 17 00:00:00 2001 From: Dejvino Date: Sun, 28 Jun 2026 14:07:41 +0200 Subject: [PATCH] Add all messages into context, limit output token count --- tools/engine.py | 15 ++++++++++----- 1 file changed, 10 insertions(+), 5 deletions(-) diff --git a/tools/engine.py b/tools/engine.py index 49f9d7f..828c33a 100644 --- a/tools/engine.py +++ b/tools/engine.py @@ -237,6 +237,7 @@ class GameEngine: "api_key": None, "api_base": None, "temperature": 0.8, + "max_tokens": 300, } } self._save_config() @@ -268,6 +269,10 @@ class GameEngine: def temperature(self) -> float: return self.config.get("llm", {}).get("temperature", 0.8) + @property + def max_tokens(self) -> int: + return self.config.get("llm", {}).get("max_tokens", 512) + def _set_llm_env(self) -> None: """Set provider-specific env vars for litellm.""" prefix = self.model.split("/")[0].upper() @@ -812,7 +817,7 @@ class GameEngine: temperature=self.temperature, stream=False, timeout=60, - max_tokens=512, + max_tokens=self.max_tokens, ) text = response.choices[0].message.content or "" self._append_llm_log( @@ -888,7 +893,7 @@ class GameEngine: on_debug("tool_result", {"round": attempt, "tool": name, "result": result}) round_log.append(" finalize_turn ignored (mixed with get tools)") debug_entries.append("\n".join(round_log)) - messages = messages[:2] + # messages = messages[:2] # keep full history across rounds so LLM can learn from prior attempts messages.append({"role": "assistant", "content": text}) messages.append({ "role": "user", @@ -928,7 +933,7 @@ class GameEngine: ) round_log.append(f" finalize_turn validation errors: {', '.join(errs)}") debug_entries.append("\n".join(round_log)) - messages = messages[:2] + # messages = messages[:2] # keep full history across rounds so LLM can learn from prior attempts messages.append({"role": "assistant", "content": text}) messages.append({ "role": "user", @@ -990,7 +995,7 @@ class GameEngine: round_log.append(f" {name}: OK") if on_debug: on_debug("tool_result", {"round": attempt, "tool": name, "result": result}) - messages = messages[:2] + # messages = messages[:2] # keep full history across rounds so LLM can learn from prior attempts messages.append({"role": "assistant", "content": text}) messages.append({ "role": "user", @@ -1018,7 +1023,7 @@ class GameEngine: on_debug("thought", {"round": attempt, "text": text.strip()}) debug_entries.append("\n".join(round_log)) - messages = messages[:2] + # messages = messages[:2] # keep full history across rounds so LLM can learn from prior attempts messages.append({"role": "assistant", "content": text}) reminder_count += 1 if reminder_count % 3 == 0: