Odin / scripts /download_data.py
ODIN
Update HF dataset repo ID to KoopaK/OdinDB
9e6cc8a
"""
download_data.py
----------------
Downloads the ODIN runtime data (processed CSVs + ChromaDB knowledge bases)
from Hugging Face Hub into the local data/ directory.

Usage:
    python scripts/download_data.py

Requirements:
    pip install huggingface_hub
"""
import os
import sys
from pathlib import Path
# Hugging Face Hub repo ID that main() downloads (as a dataset repo).
HF_REPO_ID = "KoopaK/OdinDB"

# Download destination: the "data" directory two levels above this file
# (i.e. next to the directory that contains this script).
LOCAL_DIR = Path(__file__).parent.parent.joinpath("data")
def main():
    """Download the ODIN data snapshot from the Hugging Face Hub.

    Prints the source repo and the resolved destination directory, calls
    ``huggingface_hub.snapshot_download`` to fetch the dataset repo
    ``HF_REPO_ID`` into ``LOCAL_DIR``, and finally prints how to start the
    app.

    If ``huggingface_hub`` cannot be imported, an install hint is printed
    and the process exits with status 1.
    """
    # Imported inside the function so that a missing dependency produces the
    # install hint below instead of failing at module import time.
    try:
        from huggingface_hub import snapshot_download as fetch_snapshot
    except ImportError:
        print("huggingface_hub not installed. Run: pip install huggingface_hub")
        sys.exit(1)

    print(f"Downloading ODIN data from HuggingFace ({HF_REPO_ID}) …")
    destination = LOCAL_DIR.resolve()
    print(f"Destination: {destination}")
    print("This may take a few minutes (~400 MB knowledge bases + processed CSVs).\n")

    download_options = {
        "repo_id": HF_REPO_ID,
        "repo_type": "dataset",
        "local_dir": str(LOCAL_DIR),
        # Skip git-related files and the README; only the data is wanted.
        "ignore_patterns": ["*.git*", "README.md"],
    }
    fetch_snapshot(**download_options)

    print("\nDone. You can now run the app:")
    print(" python src/agents/app.py")
# Run the download only when this file is executed as a script; importing
# the module must not trigger any network activity.
if __name__ == "__main__":
    main()