feat: Enhance configuration management and embedding capabilities

- Added JSON-based settings management in Config class for embedding and LLM configurations. - Introduced methods to save and load settings from a JSON file. - Updated BaseEmbedder and its subclasses to include max_tokens property for better token management. - Enhanced chunking strategy to support recursive splitting of large symbols with improved overlap handling. - Implemented comprehensive tests for recursive splitting and chunking behavior. - Added CLI tools configuration management for better integration with external tools. - Introduced a new command for compacting session memory into structured text for recovery.
2026-02-14 02:42:04 +08:00 · 2025-12-24 16:32:27 +08:00
parent b00113d212
commit e671b45948
25 changed files with 2889 additions and 153 deletions
--- a/ccw-litellm/src/ccw_litellm/clients/litellm_embedder.py
+++ b/ccw-litellm/src/ccw_litellm/clients/litellm_embedder.py
@@ -81,7 +81,7 @@ class LiteLLMEmbedder(AbstractEmbedder):
        """Format model name for LiteLLM.

        Returns:
-            Formatted model name (e.g., "text-embedding-3-small")
+            Formatted model name (e.g., "openai/text-embedding-3-small")
        """
        provider = self._model_config.provider
        model = self._model_config.model
@@ -90,6 +90,11 @@ class LiteLLMEmbedder(AbstractEmbedder):
        if provider in ["azure", "vertex_ai", "bedrock"]:
            return f"{provider}/{model}"

+        # For providers with custom api_base (OpenAI-compatible endpoints),
+        # use openai/ prefix to tell LiteLLM to use OpenAI API format
+        if self._provider_config.api_base and provider not in ["openai", "anthropic"]:
+            return f"openai/{model}"
+
        return model

    @property
@@ -133,6 +138,10 @@ class LiteLLMEmbedder(AbstractEmbedder):
        embedding_kwargs = {**self._litellm_kwargs, **kwargs}

        try:
+            # For OpenAI-compatible endpoints, ensure encoding_format is set
+            if self._provider_config.api_base and "encoding_format" not in embedding_kwargs:
+                embedding_kwargs["encoding_format"] = "float"
+
            # Call LiteLLM embedding
            response = litellm.embedding(
                model=self._format_model_name(),