{"slug":"mgm-falcon/quelllm-mcp","name":"quelllm-mcp","description":"Query a catalog of 250+ open-weights LLMs — list, compare, estimate VRAM and API-vs-self-hosted cost — directly from Claude Code, Cursor or any MCP client.","category":"development","tags":[],"official":false,"stars":0,"transport":null,"install":[{"cmd":"uvx --from","imports":[]}],"tools":[{"name":"list_models","description":"List models with filters (origin code, family, max params in B)"},{"name":"get_model","description":"Full record for one model (params, vram per quant, context window, family, tags, license, URLs)"},{"name":"compare","description":"Side-by-side comparison with verdict"},{"name":"estimate_vram","description":"VRAM in GB at chosen quant + recommended GPU/Mac tiers"},{"name":"estimate_cost","description":"Cost in EUR — full table API providers vs self-hosted hardware OR a specific id"},{"name":"search_models","description":"Fuzzy search by name, family, tag, author"}],"env_vars":[],"auth_type":"none","github":"https://github.com/MGM-FALCON/quelllm-mcp","homepage":"","server_url":"","status":"active","source":"mcpservers.org","updated_at":"Thu May 28"}