Skip to content

Commit

Permalink
precommit
Browse files (browse the repository at this point in the history)
  • Loading branch information
dakinggg committed Oct 16, 2023
1 parent 1935674 commit c6f381b
Showing 1 changed file with 2 additions and 1 deletion.
3 changes: 2 additions & 1 deletion llmfoundry/data/denoising.py
Original file line number Diff line number Diff line change
Expand Up @@ -876,7 +876,8 @@ def _format_tokens_for_decoder_only(
tokenizer = build_tokenizer(tokenizer_name=tokenizer_name,
tokenizer_kwargs=tokenizer_kwargs)

- loader = build_text_denoising_dataloader(cfg, tokenizer, device_batch_size).dataloader
+ loader = build_text_denoising_dataloader(cfg, tokenizer,
+ device_batch_size).dataloader
assert isinstance(loader.dataset, StreamingTextDataset)

print(f'\n\nTRUNCATING TO: {loader.dataset.max_seq_len}\n\n')
Expand Down

0 comments on commit c6f381b

Please sign in to comment.