thankfulcarp committed
Commit e500465 · 1 Parent(s): 1d1a8c3

added flash-attn to requirements.txt

Files changed (2)
  1. app.py +7 -1
  2. requirements.txt +4 -1
app.py CHANGED
@@ -209,7 +209,13 @@ def enhance_prompt_with_llm(prompt: str):
     print("\n🤖 Loading LLM for Prompt Enhancement (first run)...")
     try:
         # This happens inside the GPU session, so device_map="auto" is correct.
-        ENHANCER_PIPE_CACHE = pipeline("text-generation", model=ENHANCER_MODEL_ID, torch_dtype=torch.bfloat16, device_map="auto")
+        ENHANCER_PIPE_CACHE = pipeline(
+            "text-generation",
+            model=ENHANCER_MODEL_ID,
+            torch_dtype=torch.bfloat16,
+            device_map="auto",
+            model_kwargs={"attn_implementation": "flash_attention_2"}
+        )
         print("✅ LLM Prompt Enhancer loaded successfully.")
     except Exception as e:
         print(f"❌ Error loading LLM enhancer: {e}")
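Not part of the commit, but worth noting: with `attn_implementation="flash_attention_2"` hard-coded, the load raises if the flash-attn package is missing or built against a mismatched torch/CUDA combination, and the existing `except` block then leaves the pipeline unloaded. A minimal sketch of a graceful fallback, assuming `ENHANCER_MODEL_ID` is defined earlier in app.py as in the original code:

```python
# Sketch only (not in this commit): use FlashAttention-2 when the flash_attn
# package is importable, otherwise fall back to PyTorch's built-in SDPA backend.
import importlib.util

import torch
from transformers import pipeline

attn_impl = (
    "flash_attention_2"
    if importlib.util.find_spec("flash_attn") is not None
    else "sdpa"  # scaled-dot-product attention, available in recent PyTorch
)

ENHANCER_PIPE_CACHE = pipeline(
    "text-generation",
    model=ENHANCER_MODEL_ID,  # assumed defined earlier in app.py
    torch_dtype=torch.bfloat16,
    device_map="auto",
    model_kwargs={"attn_implementation": attn_impl},
)
```

With the fallback, prompt enhancement still works at SDPA speed on machines where flash-attn cannot be installed.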
requirements.txt CHANGED
@@ -17,4 +17,7 @@ sentencepiece
 ftfy
 imageio
 imageio-ffmpeg
-opencv-python
+opencv-python
+
+# Performance
+flash-attn
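One caveat with listing flash-attn in requirements.txt (an observation, not from the commit): the package compiles CUDA extensions at install time, and its upstream instructions assume torch is already present, typically via `pip install flash-attn --no-build-isolation`. If pip resolves the requirements in an order that builds flash-attn before torch is installed, the build can fail; a prebuilt wheel matching the torch and CUDA versions avoids the compile entirely.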