In [2]:
import torch
from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
import librosa
import numpy as np

class AudioTranscriber:
    """Transcribe audio files to text with a pretrained Wav2Vec2 CTC model."""

    def __init__(self, model_name: str = "facebook/wav2vec2-base-960h", device=None):
        """
        Load the processor and the CTC model for the given checkpoint.

        Args:
            model_name (str): Name or path of the Wav2Vec2 checkpoint.
            device: Optional device (e.g. ``"cuda"`` or a ``torch.device``) to
                move the model to. When ``None`` the model stays wherever
                ``from_pretrained`` placed it.
        """
        # Load the processor (feature extractor + tokenizer) and the model.
        self.processor = Wav2Vec2Processor.from_pretrained(model_name)
        self.model = Wav2Vec2ForCTC.from_pretrained(model_name)
        if device is not None:
            self.model.to(device)

        # Take the sampling rate from the checkpoint's own feature extractor so
        # audio loading and preprocessing always agree with the loaded model
        # instead of relying on a hard-coded constant.
        self.sampling_rate = self.processor.feature_extractor.sampling_rate

    def transcribe_audio(self, audio_path: str) -> str:
        """
        Transcribe an audio file to text.

        Args:
            audio_path (str): Path to the audio file, passed to ``librosa.load``.

        Returns:
            str: The decoded transcription; an empty string when the file
            contains no audio samples.
        """
        # Load the audio, resampled to the rate the model expects.
        waveform, _ = librosa.load(audio_path, sr=self.sampling_rate)

        # Nothing to feed the model: an empty waveform has an empty transcript.
        if waveform.size == 0:
            return ""

        # Turn the raw waveform into model input tensors.
        features = self.processor(
            waveform,
            sampling_rate=self.sampling_rate,
            return_tensors="pt",
        )
        # Inputs must live on the same device as the model weights.
        input_values = features.input_values.to(self.model.device)

        # Inference only: no gradients are needed.
        with torch.no_grad():
            logits = self.model(input_values).logits
            # Greedy CTC decoding: most likely token at every frame.
            predicted_ids = torch.argmax(logits, dim=-1)

        # Bring the ids back to the CPU before decoding them to text; the
        # batch holds a single item, so return its first entry.
        return self.processor.batch_decode(predicted_ids.cpu())[0]

def main(audio_path: str = "Audio/Download1.mp3") -> None:
    """
    Transcribe one audio file with the default model and print the result.

    Args:
        audio_path (str): Path of the audio file to transcribe. Defaults to
            the sample file used by this script.
    """
    transcriber = AudioTranscriber()
    transcription = transcriber.transcribe_audio(audio_path)
    print("Transcription:", transcription)


if __name__ == "__main__":
    main()

Some weights of Wav2Vec2ForCTC were not initialized from the model checkpoint at facebook/wav2vec2-base-960h and are newly initialized: ['wav2vec2.masked_spec_embed']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Transcription: PEH DO YOU WANT TO SPEAK ENGLISH FLUENTLY NOW GO TO POWER ENGLISH DATNETTE AND DOWNLOAD OUR IMPY THREE AUDIALE LESSONS LISTEN TO OUR EASY STORIES AND CONVERSATION LESSONS EVERY DAY YOU WILL LEARN ENGLISH VOCABULARY EASILY AND IMPROVE YOUR ENGLISH LISTENING AND SPEAKING SKILLS FAST
