Spaces:
Sleeping
Sleeping
File size: 834 Bytes
3b64038 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 |
import argparse
from huggingface_hub import hf_hub_download
# Command-line interface: which dataset repo holds the index parts, and the
# local directory that receives every downloaded file.
parser = argparse.ArgumentParser(description="Download files from a Hugging Face dataset repository.")
parser.add_argument("--repo_id", type=str, default="PeterJinGo/wiki-18-e5-index", help="Hugging Face repository ID")
parser.add_argument("--save_path", type=str, required=True, help="Local directory to save files")
args = parser.parse_args()

# Fetch the index parts from the repository selected with --repo_id.
# The flag's value is used directly (instead of a hard-coded repo id) so that
# passing --repo_id actually takes effect; its default is the same repo.
# NOTE(review): "part_aa"/"part_ab" look like split chunks of a single index
# file (an earlier comment mentioned "e5_Flat.index") -- confirm whether they
# must be concatenated after download.
for part_name in ("part_aa", "part_ab"):
    hf_hub_download(
        repo_id=args.repo_id,
        filename=part_name,
        repo_type="dataset",
        local_dir=args.save_path,
    )

# The corpus is hosted in a separate, fixed dataset repository and is saved
# into the same local directory as the index parts.
hf_hub_download(
    repo_id="PeterJinGo/wiki-18-corpus",
    filename="wiki-18.jsonl.gz",
    repo_type="dataset",
    local_dir=args.save_path,
)
|