Skip to content

Commit

Permalink
fix: Set local directory when downloading datasets from Hugging Face
Browse files (browse the repository at this point in the history)
  • Loading branch information
anth-volk committed Dec 19, 2024
1 parent cd0f149 commit 926c3b5
Show file tree
Hide file tree
Showing 3 changed files with 11 additions and 1 deletion.
4 changes: 4 additions & 0 deletions changelog_entry.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,4 @@
- bump: patch
  changes:
    changed:
    - Explicitly set local directory when downloading datasets from Hugging Face
1 change: 1 addition & 0 deletions policyengine_core/data/dataset.py
Original file line number Diff line number Diff line change
Expand Up @@ -501,4 +501,5 @@ def download_from_huggingface(
repo=f"{owner_name}/{model_name}",
repo_filename=file_name,
version=version,
local_dir=self.file_path.parent,
)
7 changes: 6 additions & 1 deletion policyengine_core/tools/hugging_face.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,7 +13,10 @@


def download_huggingface_dataset(
repo: str, repo_filename: str, version: str = None
repo: str,
repo_filename: str,
version: str = None,
local_dir: str | None = None,
):
"""
Download a dataset from the Hugging Face Hub.
Expand All @@ -22,6 +25,7 @@ def download_huggingface_dataset(
repo (str): The Hugging Face repo name, in format "{org}/{repo}".
repo_filename (str): The filename of the dataset.
version (str, optional): The version of the dataset. Defaults to None.
local_dir (str, optional): The local directory to save the dataset to. Defaults to None.
"""
# Attempt connection to Hugging Face model_info endpoint
# (https://huggingface.co/docs/huggingface_hub/v0.26.5/en/package_reference/hf_api#huggingface_hub.HfApi.model_info)
Expand Down Expand Up @@ -52,6 +56,7 @@ def download_huggingface_dataset(
filename=repo_filename,
revision=version,
token=authentication_token,
local_dir=local_dir,
)


Expand Down

0 comments on commit 926c3b5

Please sign in to comment.