fix(models): query v1 models for llama-server endpoints (#3380)

* fix(models): query v1 models for llama-server endpoints

* test(models): accept owner kwargs in llama-server regression
This commit is contained in:
Ocean Bennett
2026-06-08 19:09:02 -04:00
committed by GitHub
parent f7ae85590b
commit e7c1d75884
5 changed files with 66 additions and 4 deletions
+1 -1
View File
@@ -857,7 +857,7 @@ def _ping_endpoint(base_url: str, api_key: str = None, timeout: float = 1.5) ->
and 400 <= result["status_code"] < 500
and result["status_code"] not in (401, 403)
):
- models_url = base.rstrip("/") + "/models"
+ models_url = build_models_url(base)
try:
r2 = httpx.get(models_url, headers=headers, timeout=timeout, verify=llm_verify())
result2 = _result_from_response(r2)