Remove os.path.join

mosaicml · Oct 24, 2023 · dba1104
1 parent e85fc95
commit dba1104
Showing 1 changed file with 7 additions and 8 deletions.
diff --git a/tests/fixtures/data.py b/tests/fixtures/data.py
@@ -1,7 +1,6 @@
 # Copyright 2022 MosaicML LLM Foundry authors
 # SPDX-License-Identifier: Apache-2.0
 
-import os
 from pathlib import Path
 
 from omegaconf import DictConfig
@@ -14,24 +13,24 @@
 
 
 @fixture
-def tiny_ft_dataset_path(tmp_path: Path, dataset_size: int = 4) -> str:
+def tiny_ft_dataset_path(tmp_path: Path, dataset_size: int = 4) -> Path:
     """Creates a tiny dataset and returns the path."""
-    tiny_dataset_path = os.path.join(tmp_path, 'test-ift-data-small')
-    os.mkdir(tiny_dataset_path)
-    tiny_dataset_file = os.path.join(tiny_dataset_path, 'train.jsonl')
-    make_tiny_ft_dataset(path=tiny_dataset_file, size=dataset_size)
+    tiny_dataset_path = tmp_path / 'test-ift-data-small'
+    tiny_dataset_path.mkdir(exist_ok=True)
+    tiny_dataset_file = tiny_dataset_path / 'train.jsonl'
+    make_tiny_ft_dataset(path=str(tiny_dataset_file), size=dataset_size)
     return tiny_dataset_path
 
 
 @fixture
-def tiny_ft_dataloader(tiny_ft_dataset_path: str,
+def tiny_ft_dataloader(tiny_ft_dataset_path: Path,
                        mpt_tokenizer: PreTrainedTokenizerBase,
                        max_seq_len: int = 128,
                        device_batch_size: int = 1) -> DataLoader:
     dataloader_cfg = DictConfig({
         'name': 'finetuning',
         'dataset': {
-            'hf_name': tiny_ft_dataset_path,
+            'hf_name': str(tiny_ft_dataset_path),
             'split': 'train',
             'max_seq_len': max_seq_len,
             'decoder_only_format': True,