Skip to content

Commit 42787c7

Browse files
alisonshao authored and eternally-z committed
[Bug fix] Add /model_info endpoint to mini_lb (sgl-project#14535)
1 parent 469d4c6 commit 42787c7

File tree

1 file changed

+12
-3
lines changed
  • sgl-model-gateway/bindings/python/sglang_router

1 file changed

+12
-3
lines changed

sgl-model-gateway/bindings/python/sglang_router/mini_lb.py

Lines changed: 12 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -341,16 +341,15 @@ async def get_server_info():
341341
}
342342

343343

344-
@app.get("/get_model_info")
345-
async def get_model_info():
344+
async def _get_model_info_impl():
346345
if not lb or not lb.prefill_urls:
347346
raise HTTPException(
348347
status_code=HTTPStatus.SERVICE_UNAVAILABLE,
349348
detail="There is no server registered",
350349
)
351350

352351
target_server_url = lb.prefill_urls[0]
353-
endpoint_url = f"{target_server_url}/get_model_info"
352+
endpoint_url = f"{target_server_url}/model_info"
354353

355354
async with aiohttp.ClientSession() as session:
356355
try:
@@ -375,6 +374,16 @@ async def get_model_info():
375374
)
376375

377376

377+
@app.get("/model_info")
378+
async def model_info():
379+
return await _get_model_info_impl()
380+
381+
382+
@app.get("/get_model_info")
383+
async def get_model_info():
384+
return await _get_model_info_impl()
385+
386+
378387
@app.post("/generate")
379388
async def handle_generate_request(request_data: dict):
380389
prefill_server, bootstrap_port, decode_server = lb.select_pair()

0 commit comments

Comments
 (0)