disable flash_attention
app_dialogue.py +6 -6
app_dialogue.py CHANGED
@@ -2,11 +2,11 @@ import os
 import subprocess
 
 # Install flash attention
-subprocess.run(
-    "pip install flash-attn --no-build-isolation",
-    env={"FLASH_ATTENTION_SKIP_CUDA_BUILD": "TRUE"},
-    shell=True,
-)
+# subprocess.run(
+#     "pip install flash-attn --no-build-isolation",
+#     env={"FLASH_ATTENTION_SKIP_CUDA_BUILD": "TRUE"},
+#     shell=True,
+# )
 
 
 import copy
@@ -31,7 +31,7 @@ MODELS = {
     "xgen-mm-phi3-mini-instruct-interleave-r-v1.5": AutoModelForVision2Seq.from_pretrained(
         "Salesforce/xgen-mm-phi3-mini-instruct-interleave-r-v1.5",
         torch_dtype=torch.bfloat16,
-        _attn_implementation="flash_attention_2",
+        # _attn_implementation="flash_attention_2",
         trust_remote_code=True
     ).to(DEVICE),
 }
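For reference, a minimal sketch of the load path after this change, assuming the same model id and a DEVICE constant as in the surrounding file: with flash-attn no longer installed, from_pretrained falls back to transformers' default attention implementation. The try/except guard is a hypothetical alternative, not part of this commit; it requests flash_attention_2 only when the flash_attn package is actually importable.

import torch
from transformers import AutoModelForVision2Seq

DEVICE = "cuda" if torch.cuda.is_available() else "cpu"

# Hypothetical guard (not in this commit): only request flash-attn
# when the package is importable, otherwise use the default attention.
try:
    import flash_attn  # noqa: F401
    extra_kwargs = {"_attn_implementation": "flash_attention_2"}
except ImportError:
    extra_kwargs = {}

model = AutoModelForVision2Seq.from_pretrained(
    "Salesforce/xgen-mm-phi3-mini-instruct-interleave-r-v1.5",
    torch_dtype=torch.bfloat16,
    trust_remote_code=True,  # xgen-mm ships custom modeling code on the Hub
    **extra_kwargs,
).to(DEVICE)

Note that _attn_implementation is the underscore-prefixed kwarg this file already uses; recent transformers releases expose the same switch publicly as attn_implementation.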