File size: 434 Bytes
4fceee3
6e5b840
 
 
4fceee3
 
 
 
 
 
 
6e5b840
 
4fceee3
 
 
6e5b840
 
 
4fceee3
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
# Python dependencies for this project, installed with `pip install -r <this file>`.
# Every pinned entry uses a lower bound (>=) only; no upper bounds are set.

# Core dependencies: model runtime, model library, and web UI
torch>=2.0.0
transformers>=4.34.0
gradio>=4.13.0

# Dataset loading (with the `audio` extra) and evaluation metrics
datasets[audio]>=2.14.0
evaluate>=0.4.0
# NOTE(review): jiwer is presumably here for word-error-rate scoring — confirm usage.
jiwer>=3.0.0

# Optimization and acceleration
bitsandbytes>=0.41.1
accelerate>=0.24.1
# NOTE(review): xformers releases are built against specific torch versions, so the
# resolver may select a torch well above the 2.0.0 floor declared above — confirm
# that the torch lower bound still reflects what is actually tested.
xformers>=0.0.27

# Hugging Face integration
huggingface_hub>=0.19.3
# NOTE(review): peft and spaces carry no version constraint; consider adding lower
# bounds so that installs are reproducible.
peft
spaces

# Image processing
Pillow>=9.0.0

# Additional packages required for audio handling with the Whisper model
# NOTE(review): none of the three packages below is version-constrained.
librosa
soundfile
# NOTE(review): ffmpeg-python is a Python wrapper only; it presumably needs the
# ffmpeg executable to be provided by the system — confirm the deployment installs it.
ffmpeg-python