Hanrui / progress /github /SpecForge /datasets /download_laion.sh
Lekr0's picture
Add files using upload-large-folder tool
212a146 verified
# Download the LAION subset of the ALLaVA-4V dataset from Hugging Face into
# ./allava_laion: two annotation JSON files plus ten image archives, which
# are then extracted (flattened) into ./allava_laion/images/.
#
# The script is safe to re-run: directories are created with `mkdir -p` and
# `wget -c` resumes partially downloaded files. Failed steps are reported on
# stderr and make the script exit with status 1 instead of printing
# "All done!".
laion_root="allava_laion"
base_url="https://huggingface.co/datasets/FreedomIntelligence/ALLaVA-4V/resolve/main/allava_laion"
num_chunks=10
failures=0

mkdir -p -- "$laion_root" || exit 1
# Abort if we cannot enter the target directory; otherwise every download
# below would land in the caller's current directory.
cd -- "$laion_root" || exit 1

# 1. download annotation files
## 1.1 caption
# URLs are quoted because they contain `?`, which is a glob character.
if ! wget -c -O ALLaVA-Caption-LAION-4V.json \
  "${base_url}/ALLaVA-Caption-LAION-4V.json?download=true"; then
  echo "error: download of ALLaVA-Caption-LAION-4V.json failed" >&2
  failures=$((failures + 1))
fi

## 1.2 instruction
if ! wget -c -O ALLaVA-Instruct-LAION-4V.json \
  "${base_url}/ALLaVA-Instruct-LAION-4V.json?download=true"; then
  echo "error: download of ALLaVA-Instruct-LAION-4V.json failed" >&2
  failures=$((failures + 1))
fi

# 2. download and unzip images
mkdir -p image_chunks images || exit 1

## 2.1 download
# Start all chunk downloads in parallel and remember each job's PID so its
# exit status can be checked individually (a bare `wait` discards them).
download_pids=()
for ((i = 0; i < num_chunks; i++)); do
  wget -c -O "image_chunks/images_${i}.zip" \
    "${base_url}/image_chunks/images_${i}.zip?download=true" &
  download_pids[i]=$!
done

chunk_ok=()
for ((i = 0; i < num_chunks; i++)); do
  if wait "${download_pids[i]}"; then
    chunk_ok[i]=1
  else
    chunk_ok[i]=0
    echo "error: download of images_${i}.zip failed" >&2
    failures=$((failures + 1))
  fi
done

## 2.2 unzip
# Only extract archives that downloaded successfully; wait patiently, it
# takes a while...
unzip_pids=()
unzip_chunks=()
for ((i = 0; i < num_chunks; i++)); do
  ((chunk_ok[i])) || continue
  unzip -j -o "image_chunks/images_${i}.zip" -d images/ &
  unzip_pids+=("$!")
  unzip_chunks+=("$i")
done

for idx in "${!unzip_pids[@]}"; do
  if ! wait "${unzip_pids[idx]}"; then
    echo "error: extraction of images_${unzip_chunks[idx]}.zip failed" >&2
    failures=$((failures + 1))
  fi
done

if ((failures > 0)); then
  echo "Finished with ${failures} failed step(s); re-run the script to resume." >&2
  exit 1
fi

echo "All done!"