qlora w flash attention fixes (#333)
src/axolotl/utils/models.py
CHANGED
@@ -407,6 +407,14 @@ def load_llama_adapter(model, cfg):
     else:
         model = get_peft_model(model, peft_config)
 
+    if cfg.flash_attention:
+        for name, module in model.named_modules():
+            if "norm" in name:
+                module.to(torch.float16)
+            if "lm_head" in name or "embed_tokens" in name:
+                if hasattr(module, "weight"):
+                    module.to(torch.float16)
+
     model.print_trainable_parameters()
 
     return model, peft_config
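For context, here is a rough standalone sketch of the same dtype fix applied outside axolotl. It assumes a LLaMA checkpoint loaded in 4-bit (QLoRA-style, requires bitsandbytes) and wrapped with PEFT's get_peft_model; the cast_for_flash_attention helper name, the example model id, and the LoRA settings are illustrative assumptions, not part of this PR.

# Sketch only: mirrors the diff above, casting norm / lm_head / embed_tokens
# modules to float16 so their dtypes match what flash attention kernels expect
# when the base model is loaded in 4-bit.
import torch
from peft import LoraConfig, get_peft_model
from transformers import AutoModelForCausalLM


def cast_for_flash_attention(model: torch.nn.Module) -> torch.nn.Module:
    # Hypothetical helper name; the loop body is the same as in the diff.
    for name, module in model.named_modules():
        if "norm" in name:
            module.to(torch.float16)
        if "lm_head" in name or "embed_tokens" in name:
            if hasattr(module, "weight"):
                module.to(torch.float16)
    return model


if __name__ == "__main__":
    # Example base model and LoRA config chosen for illustration only.
    base = AutoModelForCausalLM.from_pretrained(
        "huggyllama/llama-7b",
        load_in_4bit=True,          # QLoRA-style 4-bit loading (needs bitsandbytes)
        torch_dtype=torch.float16,
    )
    peft_config = LoraConfig(
        r=8,
        lora_alpha=16,
        target_modules=["q_proj", "v_proj"],
        lora_dropout=0.05,
        task_type="CAUSAL_LM",
    )
    model = get_peft_model(base, peft_config)
    model = cast_for_flash_attention(model)
    model.print_trainable_parameters()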