Update README.md
Browse files
README.md
CHANGED
@@ -48,7 +48,7 @@ model = SpeechT5ForSpeechToText.from_pretrained("mbzuai/artst_asr").to(device)
|
|
48 |
audio, sr = sf.read("audio.wav")
|
49 |
|
50 |
inputs = processor(audio=audio, sampling_rate=sr, return_tensors="pt")
|
51 |
- predicted_ids = model.generate(**inputs.to(device), max_length=150)
|
52 |
|
53 |
transcription = processor.batch_decode(predicted_ids, skip_special_tokens=True)
|
54 |
print(transcription[0])
|
|
|
48 |
audio, sr = sf.read("audio.wav")
|
49 |
|
50 |
inputs = processor(audio=audio, sampling_rate=sr, return_tensors="pt")
|
51 |
+ predicted_ids = model.generate(**inputs.to(device), max_length=150, num_beams=10)
|
52 |
|
53 |
transcription = processor.batch_decode(predicted_ids, skip_special_tokens=True)
|
54 |
print(transcription[0])
|