Skip to content

Commit 2bd81bf

Browse files
author
drajnic
committed
feat: Add support for litellm as a provider
- Allow users to configure a litellm API base and key to use a litellm instance as a model provider.
- Implement model discovery from the /models and /model_group/info endpoints of the litellm instance.
- Use the discovered model information, including pricing, to enable cost calculation for litellm models.
- Improve the cost display to show token usage even when the cost is zero.
1 parent e4fc2f5 commit 2bd81bf

File tree

8 files changed

+236
-12
lines changed

8 files changed

+236
-12
lines changed

aider/args.py

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -77,6 +77,14 @@ def get_parser(default_config_files, git_root):
7777
"--openai-api-base",
7878
help="Specify the api base url",
7979
)
80+
group.add_argument(
81+
"--litellm-api-base",
82+
help="Specify the litellm api base url",
83+
)
84+
group.add_argument(
85+
"--litellm-api-key",
86+
help="Specify the litellm api key",
87+
)
8088
group.add_argument(
8189
"--openai-api-type",
8290
help="(deprecated, use --set-env OPENAI_API_TYPE=<value>)",

aider/coders/base_coder.py

Lines changed: 12 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -2055,17 +2055,20 @@ def format_cost(value):
20552055
else:
20562056
return f"{value:.{max(2, 2 - int(math.log10(magnitude)))}f}"
20572057

2058-
cost_report = (
2059-
f"Cost: ${format_cost(self.message_cost)} message,"
2060-
f" ${format_cost(self.total_cost)} session."
2061-
)
2058+
if cost:
2059+
cost_report = (
2060+
f"Cost: ${format_cost(self.message_cost)} message,"
2061+
f" ${format_cost(self.total_cost)} session."
2062+
)
20622063

2063-
if cache_hit_tokens and cache_write_tokens:
2064-
sep = "\n"
2065-
else:
2066-
sep = " "
2064+
if cache_hit_tokens and cache_write_tokens:
2065+
sep = "\n"
2066+
else:
2067+
sep = " "
20672068

2068-
self.usage_report = tokens_report + sep + cost_report
2069+
self.usage_report = tokens_report + sep + cost_report
2070+
else:
2071+
self.usage_report = tokens_report
20692072

20702073
def compute_costs_from_tokens(
20712074
self, prompt_tokens, completion_tokens, cache_write_tokens, cache_hit_tokens

aider/main.py

Lines changed: 59 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -409,6 +409,60 @@ def register_litellm_models(git_root, model_metadata_fname, io, verbose=False):
409409
return 1
410410

411411

412+
def discover_litellm_models(io, verbose=False):
    """Discover models served by a litellm proxy and register their metadata.

    Reads LITELLM_API_BASE (and optionally LITELLM_API_KEY) from the
    environment, queries the proxy's /models endpoint for model ids and
    their owners, then /model_group/info for pricing and token limits, and
    stores the combined metadata under ``litellm/<model_group>`` names in
    models.model_info_manager.local_model_metadata.

    Best-effort: any failure is reported via io.tool_warning and discovery
    is skipped, so a misbehaving proxy never breaks startup.
    """
    litellm_api_base = os.environ.get("LITELLM_API_BASE")
    if not litellm_api_base:
        return

    try:
        import requests

        headers = {}
        api_key = os.environ.get("LITELLM_API_KEY")
        if api_key:
            headers["Authorization"] = f"Bearer {api_key}"

        # Normalize the base url once; both endpoints share it.
        base = litellm_api_base.rstrip("/")

        def fetch(path):
            # Shared GET with the auth headers and the manager's SSL setting.
            return requests.get(
                base + path,
                headers=headers,
                timeout=5,
                verify=models.model_info_manager.verify_ssl,
            )

        # First, get the models and their owners.
        response = fetch("/models")
        if response.status_code != 200:
            io.tool_warning(
                f"Error fetching models from {base}/models: {response.status_code}"
            )
            return

        models_data = response.json()
        model_owners = {
            model_info.get("id"): model_info.get("owned_by")
            for model_info in models_data.get("data", [])
        }

        # Now, get the per-group pricing and token-limit info.
        response = fetch("/model_group/info")
        if response.status_code == 200:
            model_group_data = response.json()
            for model_info in model_group_data.get("data", []):
                model_group = model_info.get("model_group")
                if not model_group:
                    continue
                models.model_info_manager.local_model_metadata[f"litellm/{model_group}"] = {
                    "litellm_provider": "litellm",
                    "mode": "chat",
                    "owned_by": model_owners.get(model_group),
                    "input_cost_per_token": model_info.get("input_cost_per_token"),
                    "output_cost_per_token": model_info.get("output_cost_per_token"),
                    "max_input_tokens": model_info.get("max_input_tokens"),
                    "max_output_tokens": model_info.get("max_output_tokens"),
                }
            if verbose:
                io.tool_output(f"Discovered model info from {base}/model_group/info")
    except Exception as e:
        # Best-effort discovery: warn and continue without litellm metadata.
        io.tool_warning(f"Error fetching model info from litellm: {e}")
464+
465+
412466
def sanity_check_repo(repo, io):
413467
if not repo:
414468
return True
@@ -619,6 +673,10 @@ def get_io(pretty):
619673
handle_deprecated_model_args(args, io)
620674
if args.openai_api_base:
621675
os.environ["OPENAI_API_BASE"] = args.openai_api_base
676+
if args.litellm_api_base:
677+
os.environ["LITELLM_API_BASE"] = args.litellm_api_base
678+
if args.litellm_api_key:
679+
os.environ["LITELLM_API_KEY"] = args.litellm_api_key
622680
if args.openai_api_version:
623681
io.tool_warning(
624682
"--openai-api-version is deprecated, use --set-env OPENAI_API_VERSION=<value>"
@@ -755,6 +813,7 @@ def get_io(pretty):
755813

756814
register_models(git_root, args.model_settings_file, io, verbose=args.verbose)
757815
register_litellm_models(git_root, args.model_metadata_file, io, verbose=args.verbose)
816+
discover_litellm_models(io, verbose=args.verbose)
758817

759818
if args.list_models:
760819
models.print_matching_models(io, args.list_models)

aider/models.py

Lines changed: 18 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -953,8 +953,17 @@ def send_completion(self, messages, functions, stream, temperature=None):
953953
if self.is_deepseek_r1():
954954
messages = ensure_alternating_roles(messages)
955955

956+
model_name = self.name
957+
if self.info.get("litellm_provider") == "litellm":
958+
owned_by = self.info.get("owned_by")
959+
model_id = model_name[len("litellm/") :]
960+
if owned_by:
961+
model_name = f"{owned_by}/{model_id}"
962+
else:
963+
model_name = model_id
964+
956965
kwargs = dict(
957-
model=self.name,
966+
model=model_name,
958967
stream=stream,
959968
)
960969

@@ -997,6 +1006,14 @@ def send_completion(self, messages, functions, stream, temperature=None):
9971006

9981007
self.github_copilot_token_to_open_ai_key(kwargs["extra_headers"])
9991008

1009+
if self.info.get("litellm_provider") == "litellm":
1010+
litellm_api_base = os.environ.get("LITELLM_API_BASE")
1011+
if litellm_api_base:
1012+
kwargs["api_base"] = litellm_api_base
1013+
litellm_api_key = os.environ.get("LITELLM_API_KEY")
1014+
if litellm_api_key:
1015+
kwargs["api_key"] = litellm_api_key
1016+
10001017
res = litellm.completion(**kwargs)
10011018
return hash_object, res
10021019

aider/onboarding.py

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@
1111

1212
import requests
1313

14-
from aider import urls
14+
from aider import models, urls
1515
from aider.io import InputOutput
1616

1717

@@ -73,6 +73,11 @@ def try_to_select_default_model():
7373
if api_key_value:
7474
return model_name
7575

76+
if os.environ.get("LITELLM_API_BASE") and os.environ.get("LITELLM_API_KEY"):
77+
for model_name, model_info in models.model_info_manager.local_model_metadata.items():
78+
if model_info.get("litellm_provider") == "litellm":
79+
return model_name
80+
7681
return None
7782

7883

pyproject.toml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -3,6 +3,7 @@
33
name = "aider-chat"
44
description = "Aider is AI pair programming in your terminal"
55
readme = "README.md"
6+
version = "1.0.0-dev"
67
classifiers = [
78
"Development Status :: 4 - Beta",
89
"Environment :: Console",

tests/basic/test_main.py

Lines changed: 69 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,10 +14,25 @@
1414
from aider.coders import Coder
1515
from aider.dump import dump # noqa: F401
1616
from aider.io import InputOutput
17-
from aider.main import check_gitignore, load_dotenv_files, main, setup_git
17+
from aider.main import (
18+
check_gitignore,
19+
discover_litellm_models,
20+
load_dotenv_files,
21+
main,
22+
setup_git,
23+
)
1824
from aider.utils import GitTemporaryDirectory, IgnorantTemporaryDirectory, make_repo
1925

2026

27+
class DummyResponse:
    """Minimal stand-in for a requests.Response.

    Exposes just the two pieces of the interface the litellm discovery
    code touches: a ``status_code`` attribute and a ``json()`` method
    returning a pre-canned payload.
    """

    def __init__(self, json_data, status_code=200):
        self.json_data = json_data
        self.status_code = status_code

    def json(self):
        """Return the canned payload given at construction time."""
        return self.json_data
34+
35+
2136
class TestMain(TestCase):
2237
def setUp(self):
2338
self.original_env = os.environ.copy()
@@ -45,6 +60,59 @@ def tearDown(self):
4560
self.input_patcher.stop()
4661
self.webbrowser_patcher.stop()
4762

63+
def test_litellm_discover_models(self):
    """
    discover_litellm_models should register metadata assembled from the
    /models and /model_group/info responses of the litellm proxy.
    """
    models_payload = {
        "data": [
            {
                "id": "bedrock-claude-opus-4.1",
                "object": "model",
                "created": 1677610602,
                "owned_by": "openai",
            }
        ]
    }

    model_group_payload = {
        "data": [
            {
                "model_group": "bedrock-claude-opus-4.1",
                "providers": ["bedrock"],
                "max_input_tokens": 200000,
                "max_output_tokens": 32000,
                "input_cost_per_token": 0.000015,
                "output_cost_per_token": 0.000075,
            }
        ]
    }

    def fake_get(url, **kwargs):
        # Route each discovery endpoint to its canned payload.
        if "/models" in url:
            return DummyResponse(models_payload)
        if "/model_group/info" in url:
            return DummyResponse(model_group_payload)
        return DummyResponse({}, 404)

    with patch("requests.get", fake_get):
        os.environ["LITELLM_API_BASE"] = "http://localhost:4000"
        os.environ["LITELLM_API_KEY"] = "test-key"

        io = MagicMock()
        discover_litellm_models(io)

        from aider import models

        info = models.model_info_manager.get_model_info("litellm/bedrock-claude-opus-4.1")

        assert info["max_input_tokens"] == 200000
        assert info["input_cost_per_token"] == 0.000015
        assert info["output_cost_per_token"] == 0.000075
        assert info["litellm_provider"] == "litellm"
        assert info["owned_by"] == "openai"
115+
48116
def test_main_with_empty_dir_no_files_on_command(self):
49117
main(["--no-git", "--exit", "--yes"], input=DummyInput(), output=DummyOutput())
50118

tests/basic/test_models.py

Lines changed: 63 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,8 @@
1+
import os
12
import unittest
23
from unittest.mock import ANY, MagicMock, patch
34

5+
from aider.coders.base_coder import Coder
46
from aider.models import (
57
ANTHROPIC_BETA_HEADER,
68
Model,
@@ -17,13 +19,16 @@ def setUp(self):
1719
from aider.models import MODEL_SETTINGS
1820

1921
self._original_settings = MODEL_SETTINGS.copy()
22+
self.original_env = os.environ.copy()
2023

2124
def tearDown(self):
2225
"""Restore original MODEL_SETTINGS after each test"""
2326
from aider.models import MODEL_SETTINGS
2427

2528
MODEL_SETTINGS.clear()
2629
MODEL_SETTINGS.extend(self._original_settings)
30+
os.environ.clear()
31+
os.environ.update(self.original_env)
2732

2833
def test_get_model_info_nonexistent(self):
2934
manager = ModelInfoManager()
@@ -558,6 +563,64 @@ def test_use_temperature_in_send_completion(self, mock_completion):
558563
timeout=600,
559564
)
560565

566+
@patch("aider.models.litellm.completion")
def test_litellm_send_completion(self, mock_completion):
    """
    send_completion should rewrite a litellm-provider model name using its
    owner and pass the configured litellm api base and key through to
    litellm.completion.
    """
    os.environ["LITELLM_API_BASE"] = "http://localhost:4000"
    os.environ["LITELLM_API_KEY"] = "test-key"

    model = Model("litellm/my-model")
    model.info["litellm_provider"] = "litellm"
    model.info["owned_by"] = "my-provider"

    msgs = [{"role": "user", "content": "Hello"}]
    model.send_completion(msgs, None, True)

    mock_completion.assert_called_once_with(
        model="my-provider/my-model",
        messages=msgs,
        stream=True,
        temperature=0,
        api_base="http://localhost:4000",
        api_key="test-key",
        timeout=600,
    )
590+
591+
@patch("aider.coders.base_coder.litellm.completion_cost")
def test_litellm_cost_calculation(self, mock_completion_cost):
    """
    A litellm model with per-token prices should produce a non-empty usage
    report containing the computed dollar cost.
    """
    os.environ["LITELLM_API_BASE"] = "http://localhost:4000"
    os.environ["LITELLM_API_KEY"] = "test-key"

    model = Model("litellm/my-model")
    model.info["litellm_provider"] = "litellm"
    model.info["input_cost_per_token"] = 0.00001
    model.info["output_cost_per_token"] = 0.00002

    msgs = [{"role": "user", "content": "Hello"}]

    # Fake a completion with 10 prompt / 20 completion tokens and no caching.
    completion = MagicMock()
    completion.usage.prompt_tokens = 10
    completion.usage.completion_tokens = 20
    completion.usage.prompt_cache_hit_tokens = 0
    completion.usage.cache_read_input_tokens = 0
    completion.usage.cache_creation_input_tokens = 0

    # 10 * $0.00001 + 20 * $0.00002 = $0.0005
    mock_completion_cost.return_value = (10 * 0.00001) + (20 * 0.00002)

    coder = Coder.create(main_model=model, io=MagicMock())
    coder.message_tokens_sent = 0
    coder.message_tokens_received = 0
    coder.total_cost = 0
    coder.message_cost = 0
    coder.calculate_and_show_tokens_and_cost(msgs, completion)

    self.assertIsNotNone(coder.usage_report)
    self.assertIn("Cost: $0.0005", coder.usage_report)
623+
561624

562625
if __name__ == "__main__":
563626
unittest.main()

0 commit comments

Comments
 (0)