nev's picture
Add files using upload-large-folder tool
8f1d1d7 verified
{
"dataset_repo": "EleutherAI/fineweb-edu-dedup-10b",
"dataset_split": "train",
"dataset_name": "",
"dataset_column": "text",
"batch_size": 16,
"cache_ctx_len": 256,
"n_tokens": 1000000,
"n_splits": 5,
"model_name": "google/gemma-2-2b"
}