{"slug":"woling-dev/promptthrift-mcp","name":"PromptThrift MCP","description":"Smart token compression for LLM apps. Save 70-90% on API costs with Gemma 4 local compression, multi-model cost tracking, and intelligent model routing.","category":"development","tags":[],"official":false,"stars":1,"transport":"http","install":[{"cmd":"pip install (recommended)","imports":[]}],"tools":[{"name":"promptthrift_compress_history","description":"Compress old turns into a smart summary to reduce input tokens by 50-90%"},{"name":"promptthrift_count_tokens","description":"Track token usage and costs across 14 models"},{"name":"promptthrift_suggest_model","description":"Recommend the cheapest model for a given task to save 60-80% on simple tasks"},{"name":"promptthrift_pin_facts","description":"Pin critical facts that survive compression to never lose key context"}],"env_vars":["PROMPTTHRIFT_OLLAMA_URL"],"auth_type":"none","github":"https://github.com/woling-dev/promptthrift-mcp","homepage":"","server_url":"","status":"active","source":"mcpservers.org","updated_at":"Mon May 25"}