Spaces:

SkalskiP
/

florence-2-video

Running on Zero

SkalskiP committed on Jun 30, 2024

Commit

1f28a9c

1 Parent(s): 4e14a56

generate caption only once

Files changed (1) hide show

app.py CHANGED Viewed

@@ -89,16 +89,20 @@ def process_video(
     )
     result_file_name = generate_file_name(extension="mp4")
     result_file_path = os.path.join(RESULTS, result_file_name)
     TRACKER.reset()
     with sv.VideoSink(result_file_path, video_info=video_info) as sink:
         for _ in tqdm(range(total // OUTPUT_LENGTH), desc="Processing video..."):
             frame = next(frame_generator)
-            caption = run_captioning(
-                model=MODEL,
-                processor=PROCESSOR,
-                image=frame,
-                device=DEVICE
-            )[CAPTIONING_TASK]
             detections = run_caption_to_phrase_grounding(
                 model=MODEL,
                 processor=PROCESSOR,

     )
     result_file_name = generate_file_name(extension="mp4")
     result_file_path = os.path.join(RESULTS, result_file_name)
     TRACKER.reset()
+    caption = None
     with sv.VideoSink(result_file_path, video_info=video_info) as sink:
         for _ in tqdm(range(total // OUTPUT_LENGTH), desc="Processing video..."):
             frame = next(frame_generator)
+            if caption is None:
+                caption = run_captioning(
+                    model=MODEL,
+                    processor=PROCESSOR,
+                    image=frame,
+                    device=DEVICE
+                )[CAPTIONING_TASK]
             detections = run_caption_to_phrase_grounding(
                 model=MODEL,
                 processor=PROCESSOR,