| # Git and development files | |
| # Patterns for files that occur at every directory level carry a leading **/ | |
| # so they match at any depth. Tools that anchor patterns at the context root | |
| # (e.g. .dockerignore) would otherwise only exclude the top-level entries; | |
| # under gitignore-style matching the **/ prefix is equivalent to the bare pattern. | |
| .git | |
| **/__pycache__/ | |
| **/*.pyc | |
| .env | |
| # Pipeline (exclude entire directory for Phase 1) | |
| pipeline/ | |
| # OS cruft | |
| **/.DS_Store | |
| # Exclude only large files that aren't essential. | |
| # The single * does not cross directory separators, so these rules cover | |
| # files directly inside data/ only, not files in its subdirectories. | |
| data/*.bin | |
| data/*.pdf | |
| # Exclude the per-item embedding directories (too many files for HF Spaces) | |
| data/embeddings/CLIP_Embeddings/ | |
| data/embeddings/PaintingCLIP_Embeddings/ | |
| # Re-include the consolidated embedding files and their metadata. | |
| # Negations only take effect when listed after the rule they override, so | |
| # keep these below the exclusions above. | |
| # NOTE(review): none of the rules visible in this file match these paths, so | |
| # the negations currently look like a safeguard rather than a requirement - confirm. | |
| !data/embeddings/*_consolidated.pt | |
| !data/embeddings/*_metadata.json | |
| # Informational only (no rule follows): essential ML files meant to stay included: | |
| # - .pt files for embeddings (consolidated) | |
| # - .safetensors files for models | |
| # - JSON files for metadata | |