fix(models): query v1 models for llama-server endpoints (#3380)

* fix(models): query v1 models for llama-server endpoints
* test(models): accept owner kwargs in llama-server regression
2026-06-27 23:25:22 -04:00 · 2026-06-08 19:09:02 -04:00
parent f7ae85590b
commit e7c1d75884
5 changed files with 66 additions and 4 deletions
@@ -1042,7 +1042,9 @@ def list_model_ids(
        if provider == "ollama":
            models_url = _ollama_api_root(base_chat_url) + "/tags"
        else:
-            models_url = base_chat_url.replace("/chat/completions", "/models")
+            from src.endpoint_resolver import build_models_url
+
+            models_url = build_models_url(base_chat_url)
        r = httpx.get(models_url, headers=h, timeout=timeout)
        r.raise_for_status()
        data = r.json()