John Ho committed on
Commit
c697b34
·
1 Parent(s): 8edc124

Added low_cpu_mem_usage and also moved inputs to the device

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -128,7 +128,7 @@ def inference(
128
  return_tensors="pt",
129
  **video_kwargs,
130
  )
131
- inputs = inputs.to(DEVICE)
132
 
133
  # Inference
134
  generated_ids = model.generate(**inputs, max_new_tokens=128)
 
128
  return_tensors="pt",
129
  **video_kwargs,
130
  )
131
+ inputs = inputs.to("cuda")
132
 
133
  # Inference
134
  generated_ids = model.generate(**inputs, max_new_tokens=128)