Skip to content

Commit

Permalink
Add debug logs
Browse files: browse the repository at this point in the history.
  • Loading branch information
irenedea committed Oct 22, 2024
1 parent abc21f0 commit 0a3846f
Show file tree
Hide file tree
Showing 2 changed files with 6 additions and 0 deletions.
2 changes: 2 additions & 0 deletions llmfoundry/data/finetuning/dataloader.py
Original file line number Diff line number Diff line change
Expand Up @@ -593,6 +593,8 @@ def _download_remote_hf_dataset(remote_path: str, split: str) -> str:
finetune_dir,
f'.node_{dist.get_node_rank()}_local_rank0_completed',
)

log.debug(f'Downloading dataset {name} to {destination}.')
if dist.get_local_rank() == 0:
try:
get_file(path=name, destination=destination, overwrite=True)
Expand Down
4 changes: 4 additions & 0 deletions llmfoundry/data/finetuning/tasks.py
Original file line number Diff line number Diff line change
Expand Up @@ -901,6 +901,10 @@ def build_from_hf(
dataset_name,
)

log.debug(
f'Downloading dataset {dataset_name} to {local_dataset_dir}.',
)

if _is_empty_or_nonexistent(dirpath=local_dataset_dir):
# Safely load a dataset from HF Hub with restricted file types.
hf_hub.snapshot_download(
Expand Down

0 comments on commit 0a3846f

Please sign in to comment.