doc-to-lora/data/download_fineweb_edu.py
2026-02-27 03:47:04 +00:00

10 lines
284 B
Python

from huggingface_hub import snapshot_download
if __name__ == "__main__":
    # Script entry point: fetch part of the "HuggingFaceFW/fineweb-edu"
    # dataset repository via huggingface_hub.snapshot_download.
    #
    # The destination is a relative path, so it resolves against the current
    # working directory of the process running this script.
    fw_dir = "./data/raw_datasets/fineweb_edu/"
    snapshot_download(
        "HuggingFaceFW/fineweb-edu",
        repo_type="dataset",
        local_dir=fw_dir,
        # Only files matching this pattern are requested, not the whole repo.
        # NOTE(review): "100BT" presumably denotes the 100B-token sample --
        # confirm against the dataset card.
        allow_patterns="sample/100BT/*",
    )