{ "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b", "dataset_split": "train", "dataset_name": "", "dataset_column": "text", "batch_size": 16, "cache_ctx_len": 256, "n_tokens": 1000000, "n_splits": 5, "model_name": "meta-llama/Llama-3.2-1B" }