attempt xformers hijack attention
src/axolotl/utils/models.py CHANGED
```diff
@@ -43,6 +43,10 @@ def load_model(
 
             logging.info("patching with flash attention")
             replace_llama_attn_with_flash_attn()
+    elif is_llama_derived_model and cfg.xformers_attention:
+        from alpaca_lora_4bit.monkeypatch.llama_attn_hijack_xformers import hijack_llama_attention
+        logging.info("patching with xformers attention")
+        hijack_llama_attention()
 
     torch_dtype = (torch.float16 if cfg.load_in_8bit or cfg.fp16 else torch.float32,)
     try:
```
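For context, the imported hijack_llama_attention() relies on the usual "attention hijack" pattern: reassign an attention class's forward so the softmax(QK^T)V step runs through xformers' memory-efficient kernel instead of the naive implementation. The sketch below illustrates that pattern on a hypothetical ToyAttention module rather than transformers' LlamaAttention, so it makes no claims about alpaca_lora_4bit's actual internals; it assumes xformers is installed and a CUDA device is available.

```python
# Minimal sketch of the attention-hijack pattern (illustrative only; this is not
# the alpaca_lora_4bit implementation). Assumes xformers + a CUDA device.
import torch
import torch.nn as nn
import xformers.ops as xops


class ToyAttention(nn.Module):
    """Tiny multi-head self-attention used only to demonstrate the monkeypatch."""

    def __init__(self, hidden_size: int = 256, num_heads: int = 8):
        super().__init__()
        self.num_heads = num_heads
        self.head_dim = hidden_size // num_heads
        self.qkv = nn.Linear(hidden_size, 3 * hidden_size, bias=False)
        self.out = nn.Linear(hidden_size, hidden_size, bias=False)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        # Naive reference attention: materializes the full [L, L] score matrix.
        bsz, seq_len, _ = x.shape
        q, k, v = self.qkv(x).chunk(3, dim=-1)
        q, k, v = (
            t.reshape(bsz, seq_len, self.num_heads, self.head_dim).transpose(1, 2)
            for t in (q, k, v)
        )
        scores = q @ k.transpose(-2, -1) / self.head_dim**0.5
        attn = scores.softmax(dim=-1) @ v
        return self.out(attn.transpose(1, 2).reshape(bsz, seq_len, -1))


def xformers_forward(self, x: torch.Tensor) -> torch.Tensor:
    # Replacement forward: same projections, but the softmax(QK^T)V step is
    # delegated to xformers' fused kernel (expects [B, L, H, D] layout).
    bsz, seq_len, _ = x.shape
    q, k, v = self.qkv(x).chunk(3, dim=-1)
    q, k, v = (t.reshape(bsz, seq_len, self.num_heads, self.head_dim) for t in (q, k, v))
    attn = xops.memory_efficient_attention(q, k, v)
    return self.out(attn.reshape(bsz, seq_len, -1))


def hijack_toy_attention() -> None:
    # The "hijack": reassign the class attribute so every instance, existing or
    # future, picks up the xformers-backed forward. The real patch does the
    # analogous swap on transformers' LlamaAttention.
    ToyAttention.forward = xformers_forward


if __name__ == "__main__":
    hijack_toy_attention()
    model = ToyAttention().half().cuda()
    out = model(torch.randn(2, 128, 256, dtype=torch.float16, device="cuda"))
    print(out.shape)  # torch.Size([2, 128, 256])
```

Patching at the class level means every instance picks up the new forward without modifying the transformers package itself, which is presumably why a single hijack_llama_attention() call inside load_model() is enough.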