#!/usr/bin/env bash
# Download datasets into DATA_ROOT.
#
# Usage:
#   DATA_ROOT=/path/to/data bash <this-script>
#
# Environment:
#   DATA_ROOT  Destination root directory. When unset or empty, the default
#              assigned below is used.
#
# External tools: huggingface-cli (Hugging Face dataset download) and git
# (only needed when the sugar-crepe checkout does not exist yet).
set -euo pipefail

DATA_ROOT="${DATA_ROOT:-/home/v-menggao/code/data}"

#######################################
# Abort with a readable message when a required command is not on PATH.
# Arguments: $1 - command name to look up
# Outputs:   error message on stderr when the command is missing
# Returns:   0 when found; exits the script with status 127 otherwise
#######################################
require_cmd() {
  if ! command -v "$1" >/dev/null 2>&1; then
    printf 'error: required command not found: %s\n' "$1" >&2
    exit 127
  fi
}

# HF datasets
require_cmd huggingface-cli
huggingface-cli download --repo-type dataset nlphuji/flickr30k --local-dir "${DATA_ROOT}/flickr30k"
# Currently disabled downloads; uncomment to fetch them as well.
# huggingface-cli download --repo-type dataset Lin-Chen/ShareGPT4V --local-dir "${DATA_ROOT}/ShareGPT4V"
# huggingface-cli download --repo-type dataset BeichenZhang/Urban1k --local-dir "${DATA_ROOT}/Urban1k"
# huggingface-cli download --repo-type dataset royokong/coco_test --local-dir "${DATA_ROOT}/coco_test"

# sugar-crepe repo
# Only clone when the target directory is absent, so re-running the script
# does not fail on an existing checkout.
if [[ ! -d "${DATA_ROOT}/sugar-crepe" ]]; then
  require_cmd git
  git clone https://github.com/RAIVNLab/sugar-crepe.git "${DATA_ROOT}/sugar-crepe"
else
  echo "sugar-crepe already exists, skipping clone"
fi

# # COCO val2017 images
# mkdir -p "${DATA_ROOT}/MSCOCO-2017"
# wget -c -O "${DATA_ROOT}/MSCOCO-2017/val2017.zip" http://images.cocodataset.org/zips/val2017.zip
# unzip -n "${DATA_ROOT}/MSCOCO-2017/val2017.zip" -d "${DATA_ROOT}/MSCOCO-2017"