Spaces:

legusxyz
/

whisper

Sleeping

legusxyz committed on Sep 28, 2024

Commit

d520218

verified ·

1 Parent(s): 43ab7a4

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -14,7 +14,7 @@ app = FastAPI()
 device = 0 if torch.cuda.is_available() else -1
 # Load Whisper model and processor
-model_name = "openai/whisper-small"  # Model name can be changed to other variants
 model = WhisperForConditionalGeneration.from_pretrained(model_name)
 processor = WhisperProcessor.from_pretrained(model_name)
@@ -22,11 +22,12 @@ processor = WhisperProcessor.from_pretrained(model_name)
 forced_decoder_ids = processor.get_decoder_prompt_ids(language="portuguese", task="transcribe")
 model.config.forced_decoder_ids = forced_decoder_ids
-# Initialize the ASR pipeline with the modified model
 asr_pipeline = pipeline(
     "automatic-speech-recognition",
     model=model,
-    processor=processor,
     device=device
 )

 device = 0 if torch.cuda.is_available() else -1
 # Load Whisper model and processor
+model_name = "openai/whisper-large-v2"  # You can change to other variants like "openai/whisper-small"
 model = WhisperForConditionalGeneration.from_pretrained(model_name)
 processor = WhisperProcessor.from_pretrained(model_name)
 forced_decoder_ids = processor.get_decoder_prompt_ids(language="portuguese", task="transcribe")
 model.config.forced_decoder_ids = forced_decoder_ids
+# Initialize the ASR pipeline with the modified model and processor
 asr_pipeline = pipeline(
     "automatic-speech-recognition",
     model=model,
+    tokenizer=processor.tokenizer,  # Explicitly set the tokenizer from the processor
+    feature_extractor=processor.feature_extractor,  # Also set the feature extractor
     device=device
 )