*.7z filter=lfs diff=lfs merge=lfs -text *.arrow filter=lfs diff=lfs merge=lfs -text *.bin filter=lfs diff=lfs merge=lfs -text *.bz2 filter=lfs diff=lfs merge=lfs -text *.ckpt filter=lfs diff=lfs merge=lfs -text *.ftz filter=lfs diff=lfs merge=lfs -text *.gz filter=lfs diff=lfs merge=lfs -text *.h5 filter=lfs diff=lfs merge=lfs -text *.joblib filter=lfs diff=lfs merge=lfs -text *.lfs.* filter=lfs diff=lfs merge=lfs -text *.mlmodel filter=lfs diff=lfs merge=lfs -text *.model filter=lfs diff=lfs merge=lfs -text *.msgpack filter=lfs diff=lfs merge=lfs -text *.npy filter=lfs diff=lfs merge=lfs -text *.npz filter=lfs diff=lfs merge=lfs -text *.onnx filter=lfs diff=lfs merge=lfs -text *.ot filter=lfs diff=lfs merge=lfs -text *.parquet filter=lfs diff=lfs merge=lfs -text *.pb filter=lfs diff=lfs merge=lfs -text *.pickle filter=lfs diff=lfs merge=lfs -text *.pkl filter=lfs diff=lfs merge=lfs -text *.pt filter=lfs diff=lfs merge=lfs -text *.pth filter=lfs diff=lfs merge=lfs -text *.rar filter=lfs diff=lfs merge=lfs -text *.safetensors filter=lfs diff=lfs merge=lfs -text saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.tar.* filter=lfs diff=lfs merge=lfs -text *.tar filter=lfs diff=lfs merge=lfs -text *.tflite filter=lfs diff=lfs merge=lfs -text *.tgz filter=lfs diff=lfs merge=lfs -text *.wasm filter=lfs diff=lfs merge=lfs -text *.xz filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=128/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=16/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=32/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=8/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=128/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=256/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=64/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=16/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/sst2/size=32/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=8/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=128/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=256/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=64/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=16/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/20newsgroups/size=32/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=8/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=128/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=256/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=64/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=16/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/dbpedia/size=32/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=8/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=128/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=256/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=64/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=16/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/banking77/size=32/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text results_paper/llama3.2-1b-instruct/metric_vs_samples/combined_performance_llama3.2-1b-instruct.png filter=lfs diff=lfs merge=lfs -text results_paper/llama3.2-1b-instruct/metric_vs_samples/adaptation_performance_llama3.2-1b-instruct.png filter=lfs diff=lfs merge=lfs -text results_paper/qwen2.5-7b-instruct/metric_vs_samples/adaptation_performance_qwen2.5-7b-instruct.png filter=lfs diff=lfs merge=lfs -text results_paper/qwen2.5-7b-instruct/metric_vs_samples/combined_performance_qwen2.5-7b-instruct.png filter=lfs diff=lfs merge=lfs -text results_paper/all_models/comparison.png filter=lfs diff=lfs merge=lfs -text results_paper.wrong/llama3.2-1b-instruct/metric_vs_samples/adaptation_performance_llama3.2-1b-instruct.png filter=lfs diff=lfs merge=lfs -text results_paper.wrong/qwen2.5-7b-instruct/metric_vs_samples/adaptation_performance_qwen2.5-7b-instruct.png filter=lfs diff=lfs merge=lfs -text results_paper.wrong/all_models/comparison.png filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=8/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=256/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/llama3.2-1b-instruct/agnews/size=64/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=8/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=128/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=256/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=64/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=16/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/agnews/size=32/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=8/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=128/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=256/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=64/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=16/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=6/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=6/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=6/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=6/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=8/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=8/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=8/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=8/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=5/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=5/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=5/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=5/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=7/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=7/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=7/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/sst2/size=32/seed=7/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=8/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=128/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=256/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=64/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=16/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/20newsgroups/size=32/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=8/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=128/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=256/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=16/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=32/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=8/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=128/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=256/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=64/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=16/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=4/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=4/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=4/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=2/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=2/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=2/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=2/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=3/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=3/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=3/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=1/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=1/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/banking77/size=32/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text results_paper.old/llama3.2-1b-instruct/metric_vs_samples/combined_performance_llama3.2-1b-instruct.png filter=lfs diff=lfs merge=lfs -text results_paper.old/llama3.2-1b-instruct/metric_vs_samples/adaptation_performance_llama3.2-1b-instruct.png filter=lfs diff=lfs merge=lfs -text results_paper.old/qwen2.5-7b-instruct/metric_vs_samples/adaptation_performance_qwen2.5-7b-instruct.png filter=lfs diff=lfs merge=lfs -text results_paper.old/qwen2.5-7b-instruct/metric_vs_samples/combined_performance_qwen2.5-7b-instruct.png filter=lfs diff=lfs merge=lfs -text results_paper.old/all_models/comparison.png filter=lfs diff=lfs merge=lfs -text lora_plus_biasshift/llama3.2-1b-instruct/dbpedia/size=32/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/0.7-1.0/logs/metrics.csv filter=lfs diff=lfs merge=lfs -text lora_plus_biasshift/llama3.2-1b-instruct/dbpedia/size=32/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/0.7-1.0/logs/metrics.csv filter=lfs diff=lfs merge=lfs -text lora_plus_biasshift/llama3.2-1b-instruct/dbpedia/size=32/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/0.7-1.0/logs/metrics.csv filter=lfs diff=lfs merge=lfs -text lora_plus_biasshift/qwen2.5-7b-instruct/dbpedia/size=32/seed=4/lora_ans_no_es/0.0-0.7/0.0-0.3/0.7-1.0/logs/metrics.csv filter=lfs diff=lfs merge=lfs -text lora_plus_biasshift/qwen2.5-7b-instruct/dbpedia/size=32/seed=1/lora_ans_no_es/0.0-0.7/0.0-0.3/0.7-1.0/logs/metrics.csv filter=lfs diff=lfs merge=lfs -text prompts/llama3.2-1b-instruct/agnews/all.jsonl filter=lfs diff=lfs merge=lfs -text prompts/llama3.2-1b-instruct/sst2/all.jsonl filter=lfs diff=lfs merge=lfs -text prompts/llama3.2-1b-instruct/20newsgroups/all.jsonl filter=lfs diff=lfs merge=lfs -text prompts/llama3.2-1b-instruct/dbpedia/all.jsonl filter=lfs diff=lfs merge=lfs -text prompts/llama3.2-1b-instruct/banking77/all.jsonl filter=lfs diff=lfs merge=lfs -text prompts/qwen2.5-7b-instruct/agnews/all.jsonl filter=lfs diff=lfs merge=lfs -text prompts/qwen2.5-7b-instruct/sst2/all.jsonl filter=lfs diff=lfs merge=lfs -text prompts/qwen2.5-7b-instruct/20newsgroups/all.jsonl filter=lfs diff=lfs merge=lfs -text prompts/qwen2.5-7b-instruct/dbpedia/all.jsonl filter=lfs diff=lfs merge=lfs -text prompts/qwen2.5-7b-instruct/banking77/all.jsonl filter=lfs diff=lfs merge=lfs -text prompts/llama3.2-1b/agnews/all.jsonl filter=lfs diff=lfs merge=lfs -text prompts/llama3.2-1b/sst2/all.jsonl filter=lfs diff=lfs merge=lfs -text prompts/llama3.2-1b/20newsgroups/all.jsonl filter=lfs diff=lfs merge=lfs -text prompts/llama3.2-1b/dbpedia/all.jsonl filter=lfs diff=lfs merge=lfs -text prompts/llama3.2-1b/banking77/all.jsonl filter=lfs diff=lfs merge=lfs -text results/llama3.2-1b-instruct/metric_vs_samples/nce.png filter=lfs diff=lfs merge=lfs -text results/llama3.2-1b-instruct/metric_vs_samples/goodness.png filter=lfs diff=lfs merge=lfs -text results/qwen2.5-7b-instruct/metric_vs_samples/ner.png filter=lfs diff=lfs merge=lfs -text results/qwen2.5-7b-instruct/metric_vs_samples/nce.png filter=lfs diff=lfs merge=lfs -text results/qwen2.5-7b-instruct/metric_vs_samples/goodness.png filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=3/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=0/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=0/lora_ans/0.0-0.7/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=0/lora_ans_no_es/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=0/lora_ans_no_es/0.0-0.7/0.0-0.3/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text finetune_lora/qwen2.5-7b-instruct/dbpedia/size=64/seed=1/lora_ans/0.0-1.0/0.7-1.0/checkpoint/lit_model.pth.lora filter=lfs diff=lfs merge=lfs -text