{"slug":"grok-vision-beta","title":"Grok Vision Beta","description":"Beta multimodal model from xAI capable of understanding and analyzing images alongside text.","provider":"xai","model_type":"multimodal","status":"active","context_window":8192,"max_output_tokens":8192,"pricing":{"currency":"USD","input_per_mtok":5,"output_per_mtok":15},"modalities":["text","image"],"capabilities":["vision","streaming","function-calling","tool-use"],"knowledge_cutoff":null,"release_date":null,"deprecation_date":null,"retirement_date":null,"aliases":[],"homepage":null,"docs":null,"categories":["ai-ml"],"tags":[],"last_verified":"2026-06-09T00:00:00.000Z","next_check":"2026-09-07T00:00:00.000Z","created_at":"2026-06-09T18:06:11.109Z","updated_at":"2026-06-09T18:06:11.109Z"}