whisper_simple / src /utils.py
nunenuh's picture
feat: fix with original whisper
70c05b8
raw
history blame
552 Bytes
import librosa
import torch
from pathlib import Path
import whisper
# Presumably the audio sampling rate in Hz (16 kHz is what Whisper models
# consume) -- TODO confirm against call sites outside this file.
sample_rate: int = 16000

# 2**15. The previous value, 32678.0, had two digits transposed.
# Presumably the divisor used to scale signed 16-bit PCM samples into
# [-1.0, 1.0) -- TODO confirm against call sites outside this file.
float_factor: float = 32768.0
def preprocess_audio(filepath: str):
    """Load an audio file and fit it to Whisper's fixed input length.

    The file is decoded with ``whisper.load_audio`` and the result is
    passed through ``whisper.pad_or_trim`` with its default length
    (30 seconds, per the original comment on this function).

    Args:
        filepath: Path of the audio file to load.

    Returns:
        Whatever ``whisper.pad_or_trim`` returns for the decoded audio.
    """
    # Decode first, then pad/trim; both steps use Whisper's defaults.
    return whisper.pad_or_trim(whisper.load_audio(filepath))
def parsing_text(filepath: str, encoding: str = "utf-8") -> str:
    """Return the full contents of a ``.txt`` or ``.md`` file.

    The extension is checked case-insensitively *before* the file is
    opened, so an unsupported path is rejected even if it does not exist.

    Args:
        filepath: Path of the text file to read.
        encoding: Text encoding used to decode the file. Defaults to
            UTF-8 so the result does not depend on the platform locale.

    Returns:
        The decoded file contents as a single string.

    Raises:
        ValueError: If the file extension is not ``.txt`` or ``.md``.
        OSError: If the file cannot be opened or read.
        UnicodeDecodeError: If the bytes are not valid for ``encoding``.
    """
    path = Path(filepath)
    if path.suffix.lower() not in ('.txt', '.md'):
        raise ValueError("Invalid file type. Only '.txt' and '.md' files are supported.")
    # An explicit encoding avoids locale-dependent decoding (e.g. cp1252
    # on Windows) silently corrupting or rejecting UTF-8 text.
    return path.read_text(encoding=encoding)