Update app.py
Browse files
app.py
CHANGED
@@ -16,14 +16,6 @@ model = Wav2Vec2ForCTC.from_pretrained(MODEL_NAME).to(device)
|
|
16 |
processor = Wav2Vec2Processor.from_pretrained(MODEL_NAME) # do i need this? can't remember
|
17 |
|
18 |
|
19 |
-
|
20 |
-
#def greet(name):
|
21 |
-
# return "Hello " + name + "!!"
|
22 |
-
#iface = gr.Interface(fn=greet, inputs="text", outputs="text")
|
23 |
-
#iface.launch()
|
24 |
-
#api = gr.Interface.load("models/carlosdanielhernandezmena/wav2vec2-large-xlsr-53-icelandic-ep10-1000h")
|
25 |
-
#iface.launch()
|
26 |
-
|
27 |
#ds = load_dataset("language-and-voice-lab/samromur_asr",split='train',streaming=True)
|
28 |
#ds = load_dataset("language-and-voice-lab/samromur_asr",split='test')
|
29 |
#ds = ds.cast_column("audio", Audio(sampling_rate=16_000))
|
@@ -42,9 +34,9 @@ def recc(a_f):
|
|
42 |
wav = signal.resample(wav, wlen)
|
43 |
|
44 |
with torch.inference_mode():
|
45 |
-
wav = torch.from_numpy(wav).unsqueeze(0)
|
46 |
-
if torch.cuda.is_available():
|
47 |
-
|
48 |
input_values = processor(wav,sampling_rate=16000).input_values[0]
|
49 |
input_values = torch.tensor(input_values, device=device).unsqueeze(0)
|
50 |
logits = model(input_values).logits
|
|
|
16 |
processor = Wav2Vec2Processor.from_pretrained(MODEL_NAME) # do i need this? can't remember
|
17 |
|
18 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
19 |
#ds = load_dataset("language-and-voice-lab/samromur_asr",split='train',streaming=True)
|
20 |
#ds = load_dataset("language-and-voice-lab/samromur_asr",split='test')
|
21 |
#ds = ds.cast_column("audio", Audio(sampling_rate=16_000))
|
|
|
34 |
wav = signal.resample(wav, wlen)
|
35 |
|
36 |
with torch.inference_mode():
|
37 |
+
#wav = torch.from_numpy(wav).unsqueeze(0)
|
38 |
+
#if torch.cuda.is_available():
|
39 |
+
# wav = wav.cuda()
|
40 |
input_values = processor(wav,sampling_rate=16000).input_values[0]
|
41 |
input_values = torch.tensor(input_values, device=device).unsqueeze(0)
|
42 |
logits = model(input_values).logits
|