{"slug":"facebook/wav2vec2-xlsr-53-espeak-cv-ft","title":"Wav2Vec2 XLSR-53 eSpeak CV FT","description":"A Wav2Vec2 XLSR-53 model fine-tuned on multilingual Common Voice data for cross-lingual phoneme recognition; it outputs eSpeak phonetic labels rather than words.","provider":"meta","model_type":"audio","status":"active","context_window":null,"max_output_tokens":null,"pricing":null,"modalities":["audio","text"],"capabilities":[],"knowledge_cutoff":null,"release_date":"2021-08-01T00:00:00.000Z","deprecation_date":null,"retirement_date":null,"aliases":[],"homepage":"https://huggingface.co/facebook/wav2vec2-xlsr-53-espeak-cv-ft","docs":null,"categories":["ai-ml"],"tags":[],"last_verified":"2026-06-10T00:00:00.000Z","next_check":"2026-09-08T00:00:00.000Z","created_at":"2026-06-09T19:23:24.405Z","updated_at":"2026-06-09T19:23:24.405Z"}