JabriA committed on
Commit
fcf4167
·
1 Parent(s): 3f47ed7

Add Darija transcription and topic extraction app6

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -13,8 +13,9 @@ transcription_model = Wav2Vec2ForCTC.from_pretrained("boumehdi/wav2vec2-large-xl
13
  summarizer = pipeline("summarization", model="facebook/bart-large-cnn")
14
 
15
  # Topic Classification Model (BERT for example)
16
- topic_model = BertForSequenceClassification.from_pretrained("your-finetuned-topic-model")
17
- topic_tokenizer = BertTokenizer.from_pretrained("your-finetuned-topic-model")
 
18
 
19
  # Function to resample audio to 16kHz if necessary
20
  def resample_audio(audio_path, target_sr=16000):
 
13
  summarizer = pipeline("summarization", model="facebook/bart-large-cnn")
14
 
15
  # Topic Classification Model (BERT for example)
16
+ topic_model = BertForSequenceClassification.from_pretrained("bert-base-uncased") # Example model
17
+ topic_tokenizer = BertTokenizer.from_pretrained("bert-base-uncased")
18
+
19
 
20
  # Function to resample audio to 16kHz if necessary
21
  def resample_audio(audio_path, target_sr=16000):