>>> from tatm.data import get_dataset, torch_collate_fn
>>> get_dataset("/dolma_path/dolma/tokenized/baseten-meta-llama-3-tokenizer/c4")
Traceback (most recent call last):
  File "<stdin>", line 1, in <module>
  File "/conda_env/lib/python3.12/site-packages/tatm/data/datasets.py", line 49, in get_dataset
    return TatmMemmapDataset(
           ^^^^^^^^^^^^^^^^^^
TypeError: TatmMemmapDataset.__init__() missing 1 required positional argument: 'context_length'