keynes42 committed
Commit aa13977 · verified · 1 parent: 8340c60

Update app.py

Files changed (1)
  1. app.py +1 -1
app.py CHANGED
@@ -75,7 +75,7 @@ class BasicModel:
     model_id,
     torch_dtype=torch.float16,
     device_map="auto", ## auto-distributes to GPU
-    attn_implementation="flash_attention_2",
+    # attn_implementation="flash_attention_2", ## Not able to install 'flash-attn' here for now
     token=hf_token,
     trust_remote_code=True, ## <- Use the custom code that isn't part of the base transformers library yet
     quantization_config=quantization_config ## <- Load 4-bit quantization because vRAM is not big enough
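
For reference, a minimal sketch of how the full from_pretrained call could guard this at runtime instead of commenting the argument out. The model_id value, hf_token, and the BitsAndBytesConfig setup below are placeholders (only fragments of the call appear in this diff); the guard simply skips attn_implementation="flash_attention_2" when the flash-attn package is not importable.

import importlib.util

import torch
from transformers import AutoModelForCausalLM, BitsAndBytesConfig

model_id = "some-org/some-model"  # placeholder; the real repo id is not shown in this diff
hf_token = "hf_..."               # placeholder token

# 4-bit quantization because vRAM is not big enough (matches the comment in the diff)
quantization_config = BitsAndBytesConfig(load_in_4bit=True)

kwargs = dict(
    torch_dtype=torch.float16,
    device_map="auto",            # auto-distributes to GPU
    token=hf_token,
    trust_remote_code=True,       # use custom code that isn't in base transformers yet
    quantization_config=quantization_config,
)

# Only request FlashAttention 2 when the flash-attn package is actually installed;
# otherwise let transformers fall back to its default attention implementation.
if importlib.util.find_spec("flash_attn") is not None:
    kwargs["attn_implementation"] = "flash_attention_2"

model = AutoModelForCausalLM.from_pretrained(model_id, **kwargs)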