# Patch summary: changes the default value of the compression "summary_model"
# setting from "google/gemini-3-flash-preview" to "" (empty string) in two places:
#   - cli.py, hunk at line 180 (hunk-header context: load_cli_config)
#   - hermes_cli/config.py, hunk at line 159 (hunk-header context: DEFAULT_CONFIG)
# It also updates the hunk at hermes_cli/config.py line 1659 (hunk-header context:
# show_config) so the "Model:" line prints "(main model)" when summary_model is
# missing or falsy, instead of falling back to the old hard-coded model name.
# NOTE(review): the inline comments state that an empty value means the main
# configured model is used; the code that performs that fallback is not part of
# this patch -- confirm it treats "" that way.
diff --git a/cli.py b/cli.py index ac9231b089..931610bf6f 100644 --- a/cli.py +++ b/cli.py @@ -180,7 +180,7 @@ def load_cli_config() -> Dict[str, Any]: "compression": { "enabled": True, # Auto-compress when approaching context limit "threshold": 0.50, # Compress at 50% of model's context limit - "summary_model": "google/gemini-3-flash-preview", # Fast/cheap model for summaries + "summary_model": "", # Model for summaries (empty = use main model) }, "smart_model_routing": { "enabled": False, diff --git a/hermes_cli/config.py b/hermes_cli/config.py index b2fd27c15e..b0e14f2a0d 100644 --- a/hermes_cli/config.py +++ b/hermes_cli/config.py @@ -159,7 +159,7 @@ DEFAULT_CONFIG = { "compression": { "enabled": True, "threshold": 0.50, - "summary_model": "google/gemini-3-flash-preview", + "summary_model": "", # empty = use main configured model "summary_provider": "auto", "summary_base_url": None, }, @@ -1659,7 +1659,8 @@ def show_config(): print(f" Enabled: {'yes' if enabled else 'no'}") if enabled: print(f" Threshold: {compression.get('threshold', 0.50) * 100:.0f}%") - print(f" Model: {compression.get('summary_model', 'google/gemini-3-flash-preview')}") + _sm = compression.get('summary_model', '') or '(main model)' + print(f" Model: {_sm}") comp_provider = compression.get('summary_provider', 'auto') if comp_provider != 'auto': print(f" Provider: {comp_provider}")