feat(cluster,api,models,cli): add cluster-aware model catalog deployments and request routing

This commit is contained in:
2026-04-20 23:00:50 +00:00
parent 83cacd0cf1
commit 4f2266e1b7
55 changed files with 3970 additions and 1630 deletions
+3 -2
View File
@@ -1,14 +1,15 @@
{
"name": "@modelgrid.com/modelgrid",
"version": "1.0.1",
"description": "ModelGrid - GPU infrastructure management daemon for AI model containers with OpenAI-compatible API",
"description": "ModelGrid - vLLM deployment manager with an OpenAI-compatible API and OSS model catalog",
"keywords": [
"gpu",
"docker",
"ai",
"llm",
"ollama",
"vllm",
"model-catalog",
"cluster",
"openai",
"api",
"nvidia",