diff --git a/navi/llm/fallback.py b/navi/llm/fallback.py index 32e6ab0..3c2862a 100644 --- a/navi/llm/fallback.py +++ b/navi/llm/fallback.py @@ -74,6 +74,8 @@ model: "list[str] | str | None" = None, think: bool | None = None, max_tokens: int | None = None, + top_k: int | None = None, + top_p: float | None = None, ) -> LLMResponse: models = self._model_list(model) last_err: Exception = LLMBackendError("No backends configured") @@ -88,6 +90,7 @@ return await self._get_client(server).complete( messages, tools=tools, temperature=temperature, model=m, think=think, max_tokens=max_tokens, + top_k=top_k, top_p=top_p, ) except LLMConnectionError as e: log.warning("fallback.server_dead", host=server.host, error=str(e)) @@ -107,6 +110,8 @@ messages: list[Message], temperature: float = 0.7, model: "list[str] | str | None" = None, + top_k: int | None = None, + top_p: float | None = None, ) -> AsyncGenerator[LLMChunk, None]: models = self._model_list(model) last_err: Exception = LLMBackendError("No backends configured") @@ -118,7 +123,9 @@ if (server.host, m) in _dead_models: continue try: - gen = self._get_client(server).stream(messages, temperature=temperature, model=m) + gen = self._get_client(server).stream( + messages, temperature=temperature, model=m, top_k=top_k, top_p=top_p + ) first = await gen.__anext__() except StopAsyncIteration: return @@ -147,6 +154,8 @@ temperature: float = 0.7, model: "list[str] | str | None" = None, think: bool | None = None, + top_k: int | None = None, + top_p: float | None = None, ) -> AsyncGenerator[LLMChunk, None]: models = self._model_list(model) last_err: Exception = LLMBackendError("No backends configured") @@ -160,6 +169,7 @@ try: gen = self._get_client(server).stream_complete( messages, tools=tools, temperature=temperature, model=m, think=think, + top_k=top_k, top_p=top_p, ) first = await gen.__anext__() except StopAsyncIteration: diff --git a/navi/profiles/developer/config.json b/navi/profiles/developer/config.json index 99ce158..b7e9963 100644 --- a/navi/profiles/developer/config.json +++ b/navi/profiles/developer/config.json @@ -13,7 +13,7 @@ "gemma4:31b-cloud", "gemma4:26b-a4b-it-q4_K_M" ], - "temperature": 0.7, + "temperature": 0.45, "max_iterations": 45, "planning_enabled": true, "subagent_planning_enabled": true, @@ -56,12 +56,12 @@ "list_tools", "spawn_agent", "share_file", - "email_manager" + "gmail" ], "planning_mandatory": false, "planning_phase1_enabled": true, "planning_phase2_enabled": false, "planning_phase3_enabled": true, - "top_k": 64, - "top_p": 0.95 + "top_k": 40, + "top_p": 0.88 } diff --git a/navi/profiles/discuss/config.json b/navi/profiles/discuss/config.json index 02aa430..91f862c 100644 --- a/navi/profiles/discuss/config.json +++ b/navi/profiles/discuss/config.json @@ -7,7 +7,7 @@ "gemma4:31b-cloud", "gemma4:26b-a4b-it-q4_K_M" ], - "temperature": 0.9, + "temperature": 0.85, "max_iterations": 12, "enabled_tools": [ "web_search", @@ -37,6 +37,6 @@ "step_validation_enabled": false, "adaptive_replan_enabled": false, "subagent_planning_enabled": false, - "top_k": 64, + "top_k": 80, "top_p": 0.95 } diff --git a/navi/profiles/secretary/config.json b/navi/profiles/secretary/config.json index cf1c39a..e6bf32e 100644 --- a/navi/profiles/secretary/config.json +++ b/navi/profiles/secretary/config.json @@ -13,7 +13,7 @@ "gemma4:31b-cloud", "gemma4:26b-a4b-it-q4_K_M" ], - "temperature": 0.7, + "temperature": 0.65, "max_iterations": 35, "planning_enabled": true, "subagent_planning_enabled": true, @@ -35,7 +35,7 @@ "code_exec", "image_view", "memory", - "share_file", + "share_file" ], "enabled_tools": [ "todo", @@ -54,12 +54,12 @@ "spawn_agent", "share_file", "weather", - "email_manager" + "gmail" ], "planning_mandatory": false, "planning_phase1_enabled": true, "planning_phase2_enabled": false, "planning_phase3_enabled": true, - "top_k": 64, - "top_p": 0.95 + "top_k": 50, + "top_p": 0.90 } diff --git a/navi/profiles/server_admin/config.json b/navi/profiles/server_admin/config.json index 1ab6f36..863a422 100644 --- a/navi/profiles/server_admin/config.json +++ b/navi/profiles/server_admin/config.json @@ -13,7 +13,7 @@ "gemma4:31b-cloud", "gemma4:26b-a4b-it-q4_K_M" ], - "temperature": 0.7, + "temperature": 0.30, "max_iterations": 40, "planning_enabled": true, "subagent_planning_enabled": true, @@ -56,12 +56,12 @@ "tool_manual", "spawn_agent", "share_file", - "email_manager" + "gmail" ], "planning_mandatory": false, "planning_phase1_enabled": true, "planning_phase2_enabled": false, "planning_phase3_enabled": true, - "top_k": 64, - "top_p": 0.95 + "top_k": 30, + "top_p": 0.80 } diff --git a/navi/profiles/tool_developer/config.json b/navi/profiles/tool_developer/config.json index 605f82e..3cfa3ca 100644 --- a/navi/profiles/tool_developer/config.json +++ b/navi/profiles/tool_developer/config.json @@ -13,7 +13,7 @@ "gemma4:31b-cloud", "gemma4:26b-a4b-it-q4_K_M" ], - "temperature": 0.7, + "temperature": 0.35, "max_iterations": 35, "planning_enabled": true, "subagent_planning_enabled": true, @@ -65,12 +65,12 @@ "test_tool", "spawn_agent", "share_file", - "email_manager" + "gmail" ], "planning_mandatory": false, "planning_phase1_enabled": true, "planning_phase2_enabled": false, "planning_phase3_enabled": true, - "top_k": 64, - "top_p": 0.95 + "top_k": 40, + "top_p": 0.85 }