Skip to content

Commit

Permalink
update
Browse files: browse the repository at this point in the history.
  • Loading branch information
XiaohanZhangCMU committed Oct 11, 2024
1 parent adf6d95 commit 6bbdee7
Showing 1 changed file with 4 additions and 4 deletions.
8 changes: 4 additions & 4 deletions llmfoundry/data/text_data.py
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,7 @@

"""Build a StreamingTextDataset dataset and dataloader for training."""

+ import inspect
from itertools import islice
from typing import (
Any,
Expand Down Expand Up @@ -327,14 +328,13 @@ def build_text_dataloader(
StreamingTextDataset,
).parameters

- valid_base_dataset_params = inspect.signature(
- StreamingDataset,
- ).parameters
+ valid_base_dataset_params = inspect.signature(StreamingDataset,).parameters

dataset_config_subset_for_streaming_text_dataset = {
k: v
for k, v in dataset_cfg.items()
- if k in valid_streaming_text_dataset_parameters or k in valid_base_dataset_params
+ if k in valid_streaming_text_dataset_parameters or
+ k in valid_base_dataset_params
}

# build dataset potentially with streams
Expand Down

0 comments on commit 6bbdee7

Please sign in to comment.