Spaces:

GF-John
/

video-caption

Sleeping

John Ho committed on Jul 23

Commit

2a9891d

1 Parent(s): 7c03996

trying to set device outside of spaces.GPU decorator

Files changed (1) hide show

app.py CHANGED Viewed

@@ -22,6 +22,10 @@ subprocess.run(
 # The model is trained on 8.0 FPS which we recommend for optimal inference
 def get_fps_ffmpeg(video_path: str):
     probe = ffmpeg.probe(video_path)
@@ -37,7 +41,6 @@ def get_fps_ffmpeg(video_path: str):
     return num / denom
-@spaces.GPU(duration=30)
 def load_model(
     model_name: str = "chancharikm/qwen2.5-vl-7b-cam-motion-preview",
     use_flash_attention: bool = True,
@@ -54,7 +57,7 @@ def load_model(
         else Qwen2_5_VLForConditionalGeneration.from_pretrained(
             model_name,
             torch_dtype=torch.bfloat16,  # "auto",
-            device_map="auto",
         )
     )
     return model
@@ -98,7 +101,7 @@ def inference(
         return_tensors="pt",
         **video_kwargs,
     )
-    inputs = inputs.to("cuda" if torch.cuda.is_available() else "cpu")
     # Inference
     generated_ids = model.generate(**inputs, max_new_tokens=128)

 # The model is trained on 8.0 FPS which we recommend for optimal inference
+# Module-level dtype/device selection, resolved once at import time.
+DTYPE = torch.bfloat16
+DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
+# Log the constants defined above (the lowercase names `device`/`dtype` are not defined here).
+logger.info(f"Device: {DEVICE}, dtype: {DTYPE}")
 def get_fps_ffmpeg(video_path: str):
     probe = ffmpeg.probe(video_path)
     return num / denom
 def load_model(
     model_name: str = "chancharikm/qwen2.5-vl-7b-cam-motion-preview",
     use_flash_attention: bool = True,
         else Qwen2_5_VLForConditionalGeneration.from_pretrained(
             model_name,
             torch_dtype=torch.bfloat16,  # "auto",
+            device_map=DEVICE,
         )
     )
     return model
         return_tensors="pt",
         **video_kwargs,
     )
+    # inputs = inputs.to("cuda" if torch.cuda.is_available() else "cpu")
     # Inference
     generated_ids = model.generate(**inputs, max_new_tokens=128)