diff --git a/agent/context_compressor.py b/agent/context_compressor.py index d81de94794..5f4ea4a3ce 100644 --- a/agent/context_compressor.py +++ b/agent/context_compressor.py @@ -93,6 +93,14 @@ class ContextCompressor: ) self.threshold_tokens = int(self.context_length * threshold_percent) self.compression_count = 0 + + if not quiet_mode: + logger.info( + "Context compressor initialized: model=%s context_length=%d " + "threshold=%d (%.0f%%) provider=%s base_url=%s", + model, self.context_length, self.threshold_tokens, + threshold_percent * 100, provider or "none", base_url or "none", + ) self._context_probed = False # True after a step-down from context error self.last_prompt_tokens = 0 diff --git a/agent/model_metadata.py b/agent/model_metadata.py index e3636b6fe4..ca651fce25 100644 --- a/agent/model_metadata.py +++ b/agent/model_metadata.py @@ -855,10 +855,11 @@ def get_model_context_length( # Only check `default_model in model` (is the key a substring of the input). # The reverse (`model in default_model`) causes shorter names like # "claude-sonnet-4" to incorrectly match "claude-sonnet-4-6" and return 1M. + model_lower = model.lower() for default_model, length in sorted( DEFAULT_CONTEXT_LENGTHS.items(), key=lambda x: len(x[0]), reverse=True ): - if default_model in model: + if default_model in model_lower: return length # 9. Query local server as last resort