diff --git a/config/llama2_1b_mark.yaml b/config/llama2_1b_mark.yaml index 53bc6c167..88ad31bd7 100644 --- a/config/llama2_1b_mark.yaml +++ b/config/llama2_1b_mark.yaml @@ -6,7 +6,7 @@ data: configs: fineweb: id: "HuggingFaceFW/fineweb" - stream: False + stream: True pile/arxiv: train_urls: - gs://levanter-data/pile-domains/arxiv/{00..29}.jsonl.zst