liuyang committed on
Commit
5dddf57
·
1 Parent(s): 4417549

Add job_id and task_id handling in WhisperTranscriber to improve metadata management during audio processing. Update file key generation for intermediate uploads.

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -279,6 +279,7 @@ def prepare_and_save_audio_for_model(task: dict, out_dir: str) -> dict:
279
  "abs_start_ms": int(ck["global_offset_ms"]) + eff_start_ms,
280
  "chunk_idx": idx,
281
  "channel": ch,
 
282
  "skip": False if (trim_applied or len(pcm) > 0) else True,
283
  }
284
 
@@ -724,8 +725,8 @@ class WhisperTranscriber:
724
  "batch_size": batch_size,
725
  "speaker_embeddings": speaker_embeddings,
726
  }
727
- job_id = task_json["job_id"]
728
- task_id = task_json["task_id"]["chunk"]["idx"]
729
  filekey = f"ai-transcribe/split/{job_id}-{task_id}.json"
730
  ret = upload_to_r2(json.dumps(result), "intermediate", filekey)
731
  if ret:
 
279
  "abs_start_ms": int(ck["global_offset_ms"]) + eff_start_ms,
280
  "chunk_idx": idx,
281
  "channel": ch,
282
+ "job_id": job,
283
  "skip": False if (trim_applied or len(pcm) > 0) else True,
284
  }
285
 
 
725
  "batch_size": batch_size,
726
  "speaker_embeddings": speaker_embeddings,
727
  }
728
+ job_id = pre_meta["job_id"]
729
+ task_id = pre_meta["chunk_idx"]
730
  filekey = f"ai-transcribe/split/{job_id}-{task_id}.json"
731
  ret = upload_to_r2(json.dumps(result), "intermediate", filekey)
732
  if ret: