From 3da44dbda7cc127bc803fe9212acd53b567c4683 Mon Sep 17 00:00:00 2001
From: teknium1 <127238744+teknium1@users.noreply.github.com>
Date: Fri, 5 Jun 2026 02:36:20 -0700
Subject: [PATCH] fix(models): use deepseek-v4-flash as Nous silent default

Follow-up on the salvaged fix: point the Nous silent-default override at
deepseek/deepseek-v4-flash (a cheap chat model) instead of the nvidia
nemotron entry. Keeps the no-model-configured fallback off the priciest
flagship while landing on a low-cost, broadly-capable default.
---
 hermes_cli/models.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/hermes_cli/models.py b/hermes_cli/models.py
index 8d5c610aeef..b9b3c819c16 100644
--- a/hermes_cli/models.py
+++ b/hermes_cli/models.py
@@ -1158,7 +1158,7 @@ _PROVIDER_ALIASES = {
 # non-interactive fallback when a profile sets ``provider: nous`` with no model
 # silently bills the most expensive model for traffic the user never opted into
 # (a missing default escalated to Opus and billed 863 requests before the user
-# noticed). Pin the silent default to the cheapest curated tier instead so a
+# noticed). Pin the silent default to a low-cost curated model instead so a
 # missing model can never escalate to the flagship.
 #
 # This is deliberately a fixed, side-effect-free default for the hot resolution
@@ -1167,7 +1167,7 @@ _PROVIDER_ALIASES = {
 # in hermes_cli/web_server.py and ``partition_nous_models_by_tier`` — which can
 # hit the Portal; this fallback must stay cheap and network-free.
 _PROVIDER_SILENT_DEFAULT_OVERRIDES: dict[str, str] = {
-    "nous": "nvidia/nemotron-3-super-120b-a12b",
+    "nous": "deepseek/deepseek-v4-flash",
 }
 
 