Update README.md
Browse files
README.md
CHANGED
@@ -122,7 +122,7 @@ model = AutoModel.from_pretrained("skit-ai/speechllm-2B", trust_remote_code=True
|
|
122 |
|
123 |
model.generate_meta(
|
124 |
audio_path="path-to-audio.wav", #16k Hz, mono
|
125 |
-
audio_tensor=torchaudio.load("path-to-audio.wav")[
|
126 |
instruction="Give me the following information about the audio [SpeechActivity, Transcript, Gender, Emotion, Age, Accent]",
|
127 |
max_new_tokens=500,
|
128 |
return_special_tokens=False
|
|
|
122 |
|
123 |
model.generate_meta(
|
124 |
audio_path="path-to-audio.wav", #16k Hz, mono
|
125 |
+
audio_tensor=torchaudio.load("path-to-audio.wav")[0], # [Optional] waveform tensor (torchaudio.load returns (waveform, sample_rate)); pass either audio_path or audio_tensor
|
126 |
instruction="Give me the following information about the audio [SpeechActivity, Transcript, Gender, Emotion, Age, Accent]",
|
127 |
max_new_tokens=500,
|
128 |
return_special_tokens=False
|