File size: 679 Bytes
4537507
5eb65f4
4d6764a
4537507
 
4d6764a
 
4537507
 
 
 
 
 
 
 
4d6764a
 
4537507
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
import torchaudio
from transformers import pipeline

# Build the speech-recognition pipeline once at import time so that each call
# to inference() reuses the same loaded model instead of reloading it.
asr_pipeline = pipeline(
    task="automatic-speech-recognition",
    model="facebook/wav2vec2-base-960h",
)

def inference(audio, sentiment_option):
    """Transcribe an audio file and run sentiment analysis on the transcript.

    Args:
        audio: Audio source handed directly to ``torchaudio.load``
            (presumably a file path supplied by the UI layer; confirm
            against the caller).
        sentiment_option: Passed through unchanged to
            ``display_sentiment_results``.

    Returns:
        A 3-tuple ``("N/A", transcript, sentiment_output)``. The first
        element is a constant placeholder string.
    """
    # torchaudio.load returns (waveform, sample_rate). The waveform tensor has
    # no sampling-rate attribute, so the rate must be kept from the return
    # value rather than read off the tensor.
    waveform, sample_rate = torchaudio.load(audio)

    # The pipeline expects single-channel audio; keep the first channel only.
    samples = waveform[0].numpy()

    # Raw audio is passed as a dict carrying its sampling rate, which lets the
    # pipeline resample to the rate the model's feature extractor expects.
    result = asr_pipeline({"raw": samples, "sampling_rate": sample_rate})

    # For a single input the pipeline returns a dict whose transcript lives
    # under the "text" key.
    transcript = result["text"]

    # Perform sentiment analysis on the recognised text.
    sentiment_results = analyze_sentiment(transcript)
    sentiment_output = display_sentiment_results(sentiment_results, sentiment_option)

    return "N/A", transcript, sentiment_output