Spaces:
Running
on
Zero
Running
on
Zero
liuyang
committed on
Commit
·
5dddf57
1
Parent(s):
4417549
Add job_id and task_id handling in WhisperTranscriber to improve metadata management during audio processing. Update file key generation for intermediate uploads.
Browse files
app.py
CHANGED
@@ -279,6 +279,7 @@ def prepare_and_save_audio_for_model(task: dict, out_dir: str) -> dict:
|
|
279 |
"abs_start_ms": int(ck["global_offset_ms"]) + eff_start_ms,
|
280 |
"chunk_idx": idx,
|
281 |
"channel": ch,
|
|
|
282 |
"skip": False if (trim_applied or len(pcm) > 0) else True,
|
283 |
}
|
284 |
|
@@ -724,8 +725,8 @@ class WhisperTranscriber:
|
|
724 |
"batch_size": batch_size,
|
725 |
"speaker_embeddings": speaker_embeddings,
|
726 |
}
|
727 |
-
job_id =
|
728 |
-
task_id =
|
729 |
filekey = f"ai-transcribe/split/{job_id}-{task_id}.json"
|
730 |
ret = upload_to_r2(json.dumps(result), "intermediate", filekey)
|
731 |
if ret:
|
|
|
279 |
"abs_start_ms": int(ck["global_offset_ms"]) + eff_start_ms,
|
280 |
"chunk_idx": idx,
|
281 |
"channel": ch,
|
282 |
+
"job_id": job,
|
283 |
"skip": False if (trim_applied or len(pcm) > 0) else True,
|
284 |
}
|
285 |
|
|
|
725 |
"batch_size": batch_size,
|
726 |
"speaker_embeddings": speaker_embeddings,
|
727 |
}
|
728 |
+
job_id = pre_meta["job_id"]
|
729 |
+
task_id = pre_meta["chunk_idx"]
|
730 |
filekey = f"ai-transcribe/split/{job_id}-{task_id}.json"
|
731 |
ret = upload_to_r2(json.dumps(result), "intermediate", filekey)
|
732 |
if ret:
|