flax-community
/

clip-reply

Model card Files Files and versions

Metrics Training metrics Community

clip-reply / train.sh

Ceyda Cinarel

add model

3d243f4 over 4 years ago

history blame contribute delete

1.1 kB

	MODEL_DIR=./output
	BASE_L_MODEL=cardiffnlp/twitter-roberta-base
	BASE_LL_MODEL=cardiffnlp/twitter-roberta-base-emoji
	# BASE_LL_MODEL=cardiffnlp/twitter-roberta-base-emotion
	# BASE_LL_MODEL=cardiffnlp/twitter-roberta-base-sentiment
	# BASE_L_MODEL=roberta-base
	# BASE_L_MODEL=bert-large-cased



	BASE_V_MODEL=openai/clip-vit-base-patch32

	# BASE_V_MODEL=google/vit-base-patch16-384
	# BASE_V_MODEL=google/vit-base-patch32-384
	# BASE_V_MODEL=timm/vit_huge_patch14_224_in21k

	#USE_TORCH=false
	python run_hybrid_clip.py \
	--output_dir ${MODEL_DIR} \
	--text_model_name_or_path=${BASE_LL_MODEL} \
	--vision_model_name_or_path=${BASE_V_MODEL} \
	--tokenizer_name=${BASE_L_MODEL} \
	--train_file="/home/ceyda/data/train.json" \
	--validation_file="/home/ceyda/data/val.json" \
	--do_train --do_eval \
	--num_train_epochs="40" --max_seq_length 128 \
	--per_device_train_batch_size="32" \
	--per_device_eval_batch_size="8" \
	--learning_rate="1e-5" --warmup_steps="150" --weight_decay 0.1 \
	--overwrite_output_dir \
	--preprocessing_num_workers 32
	# --push_to_hub