Make sure patch does not persist between tests
irenedea committed Oct 30, 2023
1 parent c099da3 commit f569531
Showing 1 changed file with 10 additions and 0 deletions.
tests/test_huggingface_flash.py (10 additions & 0 deletions)
@@ -3,6 +3,7 @@

import contextlib
import os
from unittest import mock
from unittest.mock import patch

import pytest
@@ -113,6 +114,12 @@ def test_attn_patch_integration(patch: str):
pytest.skip(
'The CI cluster does not have access to the Llama models, so skip this test.'
)

# Save the original attention function to restore at the end of the test.
from transformers.models.llama.modeling_llama import \
LlamaAttention
original_attn = LlamaAttention.forward

name = 'meta-llama/Llama-2-7b-hf'
model_cfg = DictConfig({
'name': 'hf_causal_lm',
@@ -145,6 +152,9 @@ def test_attn_patch_integration(patch: str):
outputs = model(tokenized_input)
loss = outputs.loss
loss.backward()

# Ensure the patch does not persist beyond this test.
LlamaAttention.forward = original_attn

@pytest.mark.gpu
@pytest.mark.parametrize('model_name', ['llama2', 'mistral'])
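Note on the pattern above: saving LlamaAttention.forward and reassigning it on the last line of the test restores the original behavior only if the test runs to completion. A minimal sketch of an alternative, assuming the same LlamaAttention import used in the diff, relies on unittest.mock.patch.object as a context manager so the attribute is restored even if the test body raises; patched_forward here is a hypothetical stand-in for the real attention patch, not code from this repository.

from unittest import mock

from transformers.models.llama.modeling_llama import LlamaAttention


def test_attn_patch_is_scoped():
    original_forward = LlamaAttention.forward

    # Hypothetical stand-in for the real attention patch exercised by the test.
    def patched_forward(self, *args, **kwargs):
        return original_forward(self, *args, **kwargs)

    # patch.object swaps the attribute for the duration of the with-block and
    # restores the original on exit, even if an exception is raised inside.
    with mock.patch.object(LlamaAttention, 'forward', patched_forward):
        assert LlamaAttention.forward is patched_forward

    # After the block, no patched state leaks into subsequent tests.
    assert LlamaAttention.forward is original_forward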
