Feature Extraction
Transformers
Safetensors
English
custom_model
multi-modal
speech-language
custom_code
Eval Results
shangeth committed on
Commit
6a10328
1 Parent(s): 4d00091

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +1 -1
README.md CHANGED
@@ -122,7 +122,7 @@ model = AutoModel.from_pretrained("skit-ai/speechllm-2B", trust_remote_code=True
122
 
123
  model.generate_meta(
124
  audio_path="path-to-audio.wav", #16k Hz, mono
125
- audio_tensor=torchaudio.load("path-to-audio.wav")[2], # [Optional] either audio_path or audio_tensor directly
126
  instruction="Give me the following information about the audio [SpeechActivity, Transcript, Gender, Emotion, Age, Accent]",
127
  max_new_tokens=500,
128
  return_special_tokens=False
 
122
 
123
  model.generate_meta(
124
  audio_path="path-to-audio.wav", #16k Hz, mono
125
+ audio_tensor=torchaudio.load("path-to-audio.wav")[1], # [Optional] either audio_path or audio_tensor directly
126
  instruction="Give me the following information about the audio [SpeechActivity, Transcript, Gender, Emotion, Age, Accent]",
127
  max_new_tokens=500,
128
  return_special_tokens=False