tmm1 committed on
Commit 312a9fa • 1 Parent(s): 248bf90

move flash-attn monkey patch alongside the others

src/axolotl/{flash_attn.py → monkeypatch/llama_attn_hijack_flash.py} RENAMED
File without changes
src/axolotl/utils/models.py CHANGED
@@ -92,7 +92,9 @@ def load_model(
 
     if cfg.is_llama_derived_model and cfg.flash_attention:
         if cfg.device not in ["mps", "cpu"] and not cfg.inference:
-            from axolotl.flash_attn import replace_llama_attn_with_flash_attn
+            from axolotl.monkeypatch.llama_attn_hijack_flash import (
+                replace_llama_attn_with_flash_attn,
+            )
 
             LOG.info("patching with flash attention")
             replace_llama_attn_with_flash_attn()
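
The renamed module still exposes replace_llama_attn_with_flash_attn, which load_model now imports lazily from axolotl.monkeypatch.llama_attn_hijack_flash only when flash attention is enabled on a supported device. As a rough illustration of how a patch like this is usually wired (a minimal sketch, not the actual axolotl code; the placeholder forward and the module alias are assumptions), it reassigns the forward method on the upstream LlamaAttention class so every instance created afterwards routes through the patched implementation:

# Minimal sketch of a llama attention "hijack" (illustrative only,
# not the axolotl implementation).
import transformers.models.llama.modeling_llama as llama_modeling


def _flash_attn_forward(self, *args, **kwargs):
    # Hypothetical replacement forward; a real patch would call
    # flash-attn's fused kernels here instead of the stock attention.
    raise NotImplementedError("illustrative placeholder only")


def replace_llama_attn_with_flash_attn():
    # Monkey patch: assign the new forward onto the class itself, so
    # models built after this call pick up the patched attention.
    llama_modeling.LlamaAttention.forward = _flash_attn_forward

Importing inside the cfg.flash_attention branch keeps flash-attn an optional dependency: the patch module is only loaded when the feature is actually requested.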