From 7a66bebe0ffbb80f13d737db9ce22d5b956797be Mon Sep 17 00:00:00 2001 From: Saaketh Date: Mon, 29 Jul 2024 00:25:17 +0200 Subject: [PATCH] Copy name_or_path from the original model to the new model instance in hf_checkpointer --- llmfoundry/callbacks/hf_checkpointer.py | 1 + 1 file changed, 1 insertion(+) diff --git a/llmfoundry/callbacks/hf_checkpointer.py b/llmfoundry/callbacks/hf_checkpointer.py index a186f67f14..5aa81acaa5 100644 --- a/llmfoundry/callbacks/hf_checkpointer.py +++ b/llmfoundry/callbacks/hf_checkpointer.py @@ -517,6 +517,7 @@ def tensor_hook( new_model_instance.generation_config.update( **original_model.generation_config.to_dict(), ) + new_model_instance.name_or_path = original_model.name_or_path # Then load the state dict in with "assign" so that the state dict # is loaded properly even though the model is initially on meta device.