Update README.md
Browse files
README.md
CHANGED
|
@@ -148,7 +148,7 @@ from datasets import load_dataset
|
|
| 148 |
device = "cuda:0" if torch.cuda.is_available() else "cpu"
|
| 149 |
torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
|
| 150 |
|
| 151 |
-
model_id = "openai/whisper-large-v3-turbo"
|
| 152 |
|
| 153 |
model = AutoModelForSpeechSeq2Seq.from_pretrained(
|
| 154 |
model_id, torch_dtype=torch_dtype, low_cpu_mem_usage=True, use_safetensors=True
|
|
@@ -252,7 +252,7 @@ from datasets import Audio, load_dataset
|
|
| 252 |
device = "cuda:0" if torch.cuda.is_available() else "cpu"
|
| 253 |
torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
|
| 254 |
|
| 255 |
-
model_id = "openai/whisper-large-v3-turbo"
|
| 256 |
|
| 257 |
model = AutoModelForSpeechSeq2Seq.from_pretrained(
|
| 258 |
model_id, torch_dtype=torch_dtype, low_cpu_mem_usage=True
|
|
@@ -327,7 +327,7 @@ from datasets import load_dataset
|
|
| 327 |
device = "cuda:0" if torch.cuda.is_available() else "cpu"
|
| 328 |
torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
|
| 329 |
|
| 330 |
-
model_id = "openai/whisper-large-v3-turbo"
|
| 331 |
|
| 332 |
model = AutoModelForSpeechSeq2Seq.from_pretrained(
|
| 333 |
model_id, torch_dtype=torch_dtype, low_cpu_mem_usage=True
|
|
@@ -373,7 +373,7 @@ torch.set_float32_matmul_precision("high")
|
|
| 373 |
device = "cuda:0" if torch.cuda.is_available() else "cpu"
|
| 374 |
torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
|
| 375 |
|
| 376 |
-
model_id = "openai/whisper-large-v3-turbo"
|
| 377 |
|
| 378 |
model = AutoModelForSpeechSeq2Seq.from_pretrained(
|
| 379 |
model_id, torch_dtype=torch_dtype, low_cpu_mem_usage=True
|
|
@@ -472,7 +472,7 @@ checkpoints are summarised in the following table with links to the models on th
|
|
| 472 |
| large | 1550 M | x | [✓](https://huggingface.co/openai/whisper-large) |
|
| 473 |
| large-v2 | 1550 M | x | [✓](https://huggingface.co/openai/whisper-large-v2) |
|
| 474 |
| large-v3 | 1550 M | x | [✓](https://huggingface.co/openai/whisper-large-v3) |
|
| 475 |
-
| large-v3-turbo | 809 M | x | [✓](https://huggingface.co/openai/whisper-large-v3-turbo) |
|
| 476 |
|
| 477 |
|
| 478 |
## Fine-Tuning
|
|
|
|
| 148 |
device = "cuda:0" if torch.cuda.is_available() else "cpu"
|
| 149 |
torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
|
| 150 |
|
| 151 |
+
model_id = "ylacombe/whisper-large-v3-turbo"
|
| 152 |
|
| 153 |
model = AutoModelForSpeechSeq2Seq.from_pretrained(
|
| 154 |
model_id, torch_dtype=torch_dtype, low_cpu_mem_usage=True, use_safetensors=True
|
|
|
|
| 252 |
device = "cuda:0" if torch.cuda.is_available() else "cpu"
|
| 253 |
torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
|
| 254 |
|
| 255 |
+
model_id = "ylacombe/whisper-large-v3-turbo"
|
| 256 |
|
| 257 |
model = AutoModelForSpeechSeq2Seq.from_pretrained(
|
| 258 |
model_id, torch_dtype=torch_dtype, low_cpu_mem_usage=True
|
|
|
|
| 327 |
device = "cuda:0" if torch.cuda.is_available() else "cpu"
|
| 328 |
torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
|
| 329 |
|
| 330 |
+
model_id = "ylacombe/whisper-large-v3-turbo"
|
| 331 |
|
| 332 |
model = AutoModelForSpeechSeq2Seq.from_pretrained(
|
| 333 |
model_id, torch_dtype=torch_dtype, low_cpu_mem_usage=True
|
|
|
|
| 373 |
device = "cuda:0" if torch.cuda.is_available() else "cpu"
|
| 374 |
torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
|
| 375 |
|
| 376 |
+
model_id = "ylacombe/whisper-large-v3-turbo"
|
| 377 |
|
| 378 |
model = AutoModelForSpeechSeq2Seq.from_pretrained(
|
| 379 |
model_id, torch_dtype=torch_dtype, low_cpu_mem_usage=True
|
|
|
|
| 472 |
| large | 1550 M | x | [✓](https://huggingface.co/openai/whisper-large) |
|
| 473 |
| large-v2 | 1550 M | x | [✓](https://huggingface.co/openai/whisper-large-v2) |
|
| 474 |
| large-v3 | 1550 M | x | [✓](https://huggingface.co/openai/whisper-large-v3) |
|
| 475 |
+
| large-v3-turbo | 809 M | x | [✓](https://huggingface.co/ylacombe/whisper-large-v3-turbo) |
|
| 476 |
|
| 477 |
|
| 478 |
## Fine-Tuning
|