Commit

disable future fix for now
winglian committed Dec 10, 2023
1 parent 99d68c4 commit 8335e40
Showing 2 changed files with 3 additions and 1 deletion.
1 change: 1 addition & 0 deletions docker/Dockerfile-runpod
@@ -4,6 +4,7 @@ FROM winglian/axolotl:$BASE_TAG
 ENV HF_DATASETS_CACHE="/workspace/data/huggingface-cache/datasets"
 ENV HUGGINGFACE_HUB_CACHE="/workspace/data/huggingface-cache/hub"
 ENV TRANSFORMERS_CACHE="/workspace/data/huggingface-cache/hub"
+ENV HF_HOME="/workspace/data/huggingface-cache/hub"

COPY scripts/runpod-entrypoint.sh /root/runpod-entrypoint.sh

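The hunk above adds HF_HOME alongside the existing cache variables. A minimal sketch (plain Python, not part of the Dockerfile) of what these four ENV lines do at runtime, assuming /workspace is RunPod's persistent volume:

```python
import os

# Mirrors the Dockerfile ENV lines above: every Hugging Face cache is
# pointed under /workspace (presumably the persistent RunPod volume),
# so downloaded models and datasets survive container restarts.
cache_env = {
    "HF_DATASETS_CACHE": "/workspace/data/huggingface-cache/datasets",
    "HUGGINGFACE_HUB_CACHE": "/workspace/data/huggingface-cache/hub",
    "TRANSFORMERS_CACHE": "/workspace/data/huggingface-cache/hub",
    "HF_HOME": "/workspace/data/huggingface-cache/hub",
}
os.environ.update(cache_env)
```

Libraries that read these variables (datasets, huggingface_hub, transformers) pick them up at import time, so in a real process they should be set before those imports.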
3 changes: 2 additions & 1 deletion src/axolotl/utils/models.py
@@ -308,7 +308,8 @@ def load_model(
         or cfg.is_falcon_derived_model
         or cfg.is_mistral_derived_model
     ):
-        model_kwargs["attn_implementation"] = "flash_attention_2"
+        # TODO enable once properly supported in transformers
+        # model_kwargs["attn_implementation"] = "flash_attention_2"
         model_kwargs["use_flash_attention_2"] = True  # legacy, to be deprecated

try:
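The change above comments out the newer attn_implementation kwarg and keeps the legacy use_flash_attention_2 flag. A standalone sketch of the resulting behavior (build_model_kwargs is a hypothetical helper for illustration, not axolotl's actual API, which builds model_kwargs inline inside load_model):

```python
# Hypothetical helper illustrating this commit's kwargs change.
def build_model_kwargs(flash_attention: bool) -> dict:
    model_kwargs: dict = {}
    if flash_attention:
        # TODO enable once properly supported in transformers
        # model_kwargs["attn_implementation"] = "flash_attention_2"
        model_kwargs["use_flash_attention_2"] = True  # legacy, to be deprecated
    return model_kwargs
```

In axolotl these kwargs are ultimately forwarded to the transformers from_pretrained call; use_flash_attention_2 was transformers' original Flash Attention 2 switch and was later deprecated in favor of attn_implementation="flash_attention_2", which is what the TODO anticipates.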
