Spaces:

ariG23498
/

phi4-multimodal

Running on Zero

ariG23498 HF staff committed 2 days ago

Commit

2b310a5

1 Parent(s): f9923d4

flash-attn

Files changed (2) hide show

app.py CHANGED Viewed

@@ -11,11 +11,11 @@ model_path = "microsoft/Phi-4-multimodal-instruct"
 processor = AutoProcessor.from_pretrained(model_path, trust_remote_code=True)
 model = AutoModelForCausalLM.from_pretrained(
     model_path,
-    device_map="auto",
     torch_dtype="auto",
     trust_remote_code=True,
-    attn_implementation='eager',
-)
 generation_config = GenerationConfig.from_pretrained(model_path)

 processor = AutoProcessor.from_pretrained(model_path, trust_remote_code=True)
 model = AutoModelForCausalLM.from_pretrained(
     model_path,
+    device_map="cuda",
     torch_dtype="auto",
     trust_remote_code=True,
+    attn_implementation='flash_attention_2',
+).cuda()
 generation_config = GenerationConfig.from_pretrained(model_path)

requirements.txt CHANGED Viewed

@@ -7,5 +7,6 @@ scipy
 soundfile
 pillow
 accelerate
 transformers
 backoff

 soundfile
 pillow
 accelerate
+flash-attn
 transformers
 backoff