#!/usr/bin/env bash
#
# Download the LAION portion of the ALLaVA-4V dataset from Hugging Face into
# ./allava_laion: the caption and instruction annotation JSON files, plus the
# zipped image chunks, which are then extracted (flattened) into
# allava_laion/images/.
#
# Usage: bash <this-script>    (run from the directory that should contain
#                               allava_laion/)
#
# Requires: bash, wget, unzip.
# The script is safe to re-run: directories are created with `mkdir -p`,
# `wget -c` resumes partial downloads, and `unzip -o` overwrites existing files.

laion_root="allava_laion"
base_url="https://huggingface.co/datasets/FreedomIntelligence/ALLaVA-4V/resolve/main/allava_laion"
num_chunks=10

# Print an error message to stderr and abort the script.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

# wait_all LABEL PID...
# Wait for every given background job; abort if any of them exited non-zero.
# A bare `wait` would discard the jobs' exit statuses, so each PID is waited
# on individually.
wait_all() {
  local label=$1
  shift
  local pid
  local failed=0
  for pid in "$@"; do
    wait "$pid" || failed=$((failed + 1))
  done
  if ((failed > 0)); then
    die "${failed} ${label} job(s) failed; re-run the script to resume"
  fi
}

# extract_chunk ZIP_PATH
# Extract one archive into images/, dropping directory components (-j) and
# overwriting existing files without prompting (-o). unzip exit status 1 means
# "warnings, but processing completed", so only statuses above 1 count as
# failure.
extract_chunk() {
  local archive=$1
  local rc=0
  unzip -j -o "$archive" -d images/ || rc=$?
  ((rc <= 1))
}

mkdir -p -- "$laion_root" || die "cannot create directory ${laion_root}"
cd -- "$laion_root" || die "cannot enter directory ${laion_root}"

# 1. download annotation files
## 1.1 caption
wget -c -O ALLaVA-Caption-LAION-4V.json \
  "${base_url}/ALLaVA-Caption-LAION-4V.json?download=true" \
  || die "failed to download ALLaVA-Caption-LAION-4V.json"

## 1.2 instruction
wget -c -O ALLaVA-Instruct-LAION-4V.json \
  "${base_url}/ALLaVA-Instruct-LAION-4V.json?download=true" \
  || die "failed to download ALLaVA-Instruct-LAION-4V.json"

# 2. download and unzip images
mkdir -p image_chunks images || die "cannot create image directories"

## 2.1 download all chunks in parallel
pids=()
for ((i = 0; i < num_chunks; i++)); do
  # URLs are quoted so the '?' is never treated as a glob character.
  wget -c -O "image_chunks/images_${i}.zip" \
    "${base_url}/image_chunks/images_${i}.zip?download=true" &
  pids+=("$!")
done
wait_all "download" "${pids[@]}"

## 2.2 unzip all chunks in parallel
# wait patiently, it takes a while...
pids=()
for ((i = 0; i < num_chunks; i++)); do
  extract_chunk "image_chunks/images_${i}.zip" &
  pids+=("$!")
done
wait_all "unzip" "${pids[@]}"

echo "All done!"