{"slug":"llama-3.1-8b-instant","title":"Llama 3.1 8B Instant","description":"A fast, lightweight instruction-tuned language model from Meta optimized for low-latency text generation and chat applications.","provider":"meta","model_type":"llm","status":"active","context_window":128000,"max_output_tokens":8192,"pricing":{"currency":"USD","input_per_mtok":0.05,"output_per_mtok":0.08},"modalities":["text"],"capabilities":["streaming","code-generation","function-calling","tool-use","json-mode"],"knowledge_cutoff":"2023-12-01T00:00:00.000Z","release_date":"2024-07-01T00:00:00.000Z","deprecation_date":null,"retirement_date":null,"aliases":[],"homepage":"https://llama.meta.com/","docs":"https://ai.meta.com/llama/","categories":["ai-ml"],"tags":[],"last_verified":"2026-06-09T00:00:00.000Z","next_check":"2026-09-07T00:00:00.000Z","created_at":"2026-06-09T18:07:15.850Z","updated_at":"2026-06-09T18:07:15.850Z"}