fix: revert eval_strategy back to evaluation_strategy (4.40.2 uses old name)
Browse files
- root_gainlora/gen_script_long_order3_t5_gainlora_inflora.sh +15 -15
- root_gainlora/gen_script_long_order3_t5_inflora.sh +15 -15
- root_gainlora/gen_script_long_order4_t5_gainlora_inflora.sh +15 -15
- root_gainlora/gen_script_long_order4_t5_inflora.sh +15 -15
- root_gainlora/gen_script_superni_order1_llama_gainlora_inflora.sh +15 -15
- root_gainlora/gen_script_superni_order1_llama_gainlora_olora.sh +15 -15
- root_gainlora/gen_script_superni_order1_llama_inflora.sh +15 -15
- root_gainlora/gen_script_superni_order1_llama_olora.sh +15 -15
- root_gainlora/gen_script_superni_order1_t5_gainlora_inflora.sh +15 -15
- root_gainlora/gen_script_superni_order1_t5_inflora.sh +15 -15
- root_gainlora/gen_script_superni_order2_llama_gainlora_inflora.sh +15 -15
- root_gainlora/gen_script_superni_order2_llama_gainlora_olora.sh +15 -15
- root_gainlora/gen_script_superni_order2_llama_inflora.sh +15 -15
- root_gainlora/gen_script_superni_order2_llama_olora.sh +15 -15
- root_gainlora/gen_script_superni_order2_t5_gainlora_inflora.sh +15 -15
- root_gainlora/gen_script_superni_order2_t5_inflora.sh +15 -15
root_gainlora/gen_script_long_order3_t5_gainlora_inflora.sh
CHANGED
|
@@ -37,7 +37,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 37 |
--logging_strategy steps \
|
| 38 |
--logging_steps 10 \
|
| 39 |
--metric_for_best_model eval_exact_match \
|
| 40 |
-
--eval_strategy steps \
|
| 41 |
--save_strategy steps \
|
| 42 |
--save_total_limit 1 \
|
| 43 |
--load_best_model_at_end \
|
|
@@ -87,7 +87,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 87 |
--logging_strategy steps \
|
| 88 |
--logging_steps 10 \
|
| 89 |
--metric_for_best_model eval_exact_match_for_amazon \
|
| 90 |
-
--eval_strategy steps \
|
| 91 |
--save_strategy steps \
|
| 92 |
--save_total_limit 1 \
|
| 93 |
--load_best_model_at_end \
|
|
@@ -137,7 +137,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 137 |
--logging_strategy steps \
|
| 138 |
--logging_steps 10 \
|
| 139 |
--metric_for_best_model eval_exact_match_for_mnli \
|
| 140 |
-
--eval_strategy steps \
|
| 141 |
--save_strategy steps \
|
| 142 |
--save_total_limit 1 \
|
| 143 |
--load_best_model_at_end \
|
|
@@ -187,7 +187,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 187 |
--logging_strategy steps \
|
| 188 |
--logging_steps 10 \
|
| 189 |
--metric_for_best_model eval_exact_match_for_cb \
|
| 190 |
-
--eval_strategy steps \
|
| 191 |
--save_strategy steps \
|
| 192 |
--save_total_limit 1 \
|
| 193 |
--load_best_model_at_end \
|
|
@@ -237,7 +237,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 237 |
--logging_strategy steps \
|
| 238 |
--logging_steps 10 \
|
| 239 |
--metric_for_best_model eval_exact_match_for_copa \
|
| 240 |
-
--eval_strategy steps \
|
| 241 |
--save_strategy steps \
|
| 242 |
--save_total_limit 1 \
|
| 243 |
--load_best_model_at_end \
|
|
@@ -287,7 +287,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 287 |
--logging_strategy steps \
|
| 288 |
--logging_steps 10 \
|
| 289 |
--metric_for_best_model eval_exact_match_for_qqp \
|
| 290 |
-
--eval_strategy steps \
|
| 291 |
--save_strategy steps \
|
| 292 |
--save_total_limit 1 \
|
| 293 |
--load_best_model_at_end \
|
|
@@ -337,7 +337,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 337 |
--logging_strategy steps \
|
| 338 |
--logging_steps 10 \
|
| 339 |
--metric_for_best_model eval_exact_match_for_rte \
|
| 340 |
-
--eval_strategy steps \
|
| 341 |
--save_strategy steps \
|
| 342 |
--save_total_limit 1 \
|
| 343 |
--load_best_model_at_end \
|
|
@@ -387,7 +387,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 387 |
--logging_strategy steps \
|
| 388 |
--logging_steps 10 \
|
| 389 |
--metric_for_best_model eval_exact_match_for_imdb \
|
| 390 |
-
--eval_strategy steps \
|
| 391 |
--save_strategy steps \
|
| 392 |
--save_total_limit 1 \
|
| 393 |
--load_best_model_at_end \
|
|
@@ -437,7 +437,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 437 |
--logging_strategy steps \
|
| 438 |
--logging_steps 10 \
|
| 439 |
--metric_for_best_model eval_exact_match_for_sst2 \
|
| 440 |
-
--eval_strategy steps \
|
| 441 |
--save_strategy steps \
|
| 442 |
--save_total_limit 1 \
|
| 443 |
--load_best_model_at_end \
|
|
@@ -487,7 +487,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 487 |
--logging_strategy steps \
|
| 488 |
--logging_steps 10 \
|
| 489 |
--metric_for_best_model eval_exact_match_for_dbpedia \
|
| 490 |
-
--eval_strategy steps \
|
| 491 |
--save_strategy steps \
|
| 492 |
--save_total_limit 1 \
|
| 493 |
--load_best_model_at_end \
|
|
@@ -537,7 +537,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 537 |
--logging_strategy steps \
|
| 538 |
--logging_steps 10 \
|
| 539 |
--metric_for_best_model eval_exact_match_for_agnews \
|
| 540 |
-
--eval_strategy steps \
|
| 541 |
--save_strategy steps \
|
| 542 |
--save_total_limit 1 \
|
| 543 |
--load_best_model_at_end \
|
|
@@ -587,7 +587,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 587 |
--logging_strategy steps \
|
| 588 |
--logging_steps 10 \
|
| 589 |
--metric_for_best_model eval_exact_match_for_yahoo \
|
| 590 |
-
--eval_strategy steps \
|
| 591 |
--save_strategy steps \
|
| 592 |
--save_total_limit 1 \
|
| 593 |
--load_best_model_at_end \
|
|
@@ -637,7 +637,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 637 |
--logging_strategy steps \
|
| 638 |
--logging_steps 10 \
|
| 639 |
--metric_for_best_model eval_exact_match_for_multirc \
|
| 640 |
-
--eval_strategy steps \
|
| 641 |
--save_strategy steps \
|
| 642 |
--save_total_limit 1 \
|
| 643 |
--load_best_model_at_end \
|
|
@@ -687,7 +687,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 687 |
--logging_strategy steps \
|
| 688 |
--logging_steps 10 \
|
| 689 |
--metric_for_best_model eval_exact_match_for_boolq \
|
| 690 |
-
--eval_strategy steps \
|
| 691 |
--save_strategy steps \
|
| 692 |
--save_total_limit 1 \
|
| 693 |
--load_best_model_at_end \
|
|
@@ -738,7 +738,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 738 |
--logging_strategy steps \
|
| 739 |
--logging_steps 10 \
|
| 740 |
--metric_for_best_model eval_exact_match_for_wic \
|
| 741 |
-
--eval_strategy steps \
|
| 742 |
--save_strategy steps \
|
| 743 |
--save_total_limit 1 \
|
| 744 |
--load_best_model_at_end \
|
|
|
|
| 37 |
--logging_strategy steps \
|
| 38 |
--logging_steps 10 \
|
| 39 |
--metric_for_best_model eval_exact_match \
|
| 40 |
+
--evaluation_strategy steps \
|
| 41 |
--save_strategy steps \
|
| 42 |
--save_total_limit 1 \
|
| 43 |
--load_best_model_at_end \
|
|
|
|
| 87 |
--logging_strategy steps \
|
| 88 |
--logging_steps 10 \
|
| 89 |
--metric_for_best_model eval_exact_match_for_amazon \
|
| 90 |
+
--evaluation_strategy steps \
|
| 91 |
--save_strategy steps \
|
| 92 |
--save_total_limit 1 \
|
| 93 |
--load_best_model_at_end \
|
|
|
|
| 137 |
--logging_strategy steps \
|
| 138 |
--logging_steps 10 \
|
| 139 |
--metric_for_best_model eval_exact_match_for_mnli \
|
| 140 |
+
--evaluation_strategy steps \
|
| 141 |
--save_strategy steps \
|
| 142 |
--save_total_limit 1 \
|
| 143 |
--load_best_model_at_end \
|
|
|
|
| 187 |
--logging_strategy steps \
|
| 188 |
--logging_steps 10 \
|
| 189 |
--metric_for_best_model eval_exact_match_for_cb \
|
| 190 |
+
--evaluation_strategy steps \
|
| 191 |
--save_strategy steps \
|
| 192 |
--save_total_limit 1 \
|
| 193 |
--load_best_model_at_end \
|
|
|
|
| 237 |
--logging_strategy steps \
|
| 238 |
--logging_steps 10 \
|
| 239 |
--metric_for_best_model eval_exact_match_for_copa \
|
| 240 |
+
--evaluation_strategy steps \
|
| 241 |
--save_strategy steps \
|
| 242 |
--save_total_limit 1 \
|
| 243 |
--load_best_model_at_end \
|
|
|
|
| 287 |
--logging_strategy steps \
|
| 288 |
--logging_steps 10 \
|
| 289 |
--metric_for_best_model eval_exact_match_for_qqp \
|
| 290 |
+
--evaluation_strategy steps \
|
| 291 |
--save_strategy steps \
|
| 292 |
--save_total_limit 1 \
|
| 293 |
--load_best_model_at_end \
|
|
|
|
| 337 |
--logging_strategy steps \
|
| 338 |
--logging_steps 10 \
|
| 339 |
--metric_for_best_model eval_exact_match_for_rte \
|
| 340 |
+
--evaluation_strategy steps \
|
| 341 |
--save_strategy steps \
|
| 342 |
--save_total_limit 1 \
|
| 343 |
--load_best_model_at_end \
|
|
|
|
| 387 |
--logging_strategy steps \
|
| 388 |
--logging_steps 10 \
|
| 389 |
--metric_for_best_model eval_exact_match_for_imdb \
|
| 390 |
+
--evaluation_strategy steps \
|
| 391 |
--save_strategy steps \
|
| 392 |
--save_total_limit 1 \
|
| 393 |
--load_best_model_at_end \
|
|
|
|
| 437 |
--logging_strategy steps \
|
| 438 |
--logging_steps 10 \
|
| 439 |
--metric_for_best_model eval_exact_match_for_sst2 \
|
| 440 |
+
--evaluation_strategy steps \
|
| 441 |
--save_strategy steps \
|
| 442 |
--save_total_limit 1 \
|
| 443 |
--load_best_model_at_end \
|
|
|
|
| 487 |
--logging_strategy steps \
|
| 488 |
--logging_steps 10 \
|
| 489 |
--metric_for_best_model eval_exact_match_for_dbpedia \
|
| 490 |
+
--evaluation_strategy steps \
|
| 491 |
--save_strategy steps \
|
| 492 |
--save_total_limit 1 \
|
| 493 |
--load_best_model_at_end \
|
|
|
|
| 537 |
--logging_strategy steps \
|
| 538 |
--logging_steps 10 \
|
| 539 |
--metric_for_best_model eval_exact_match_for_agnews \
|
| 540 |
+
--evaluation_strategy steps \
|
| 541 |
--save_strategy steps \
|
| 542 |
--save_total_limit 1 \
|
| 543 |
--load_best_model_at_end \
|
|
|
|
| 587 |
--logging_strategy steps \
|
| 588 |
--logging_steps 10 \
|
| 589 |
--metric_for_best_model eval_exact_match_for_yahoo \
|
| 590 |
+
--evaluation_strategy steps \
|
| 591 |
--save_strategy steps \
|
| 592 |
--save_total_limit 1 \
|
| 593 |
--load_best_model_at_end \
|
|
|
|
| 637 |
--logging_strategy steps \
|
| 638 |
--logging_steps 10 \
|
| 639 |
--metric_for_best_model eval_exact_match_for_multirc \
|
| 640 |
+
--evaluation_strategy steps \
|
| 641 |
--save_strategy steps \
|
| 642 |
--save_total_limit 1 \
|
| 643 |
--load_best_model_at_end \
|
|
|
|
| 687 |
--logging_strategy steps \
|
| 688 |
--logging_steps 10 \
|
| 689 |
--metric_for_best_model eval_exact_match_for_boolq \
|
| 690 |
+
--evaluation_strategy steps \
|
| 691 |
--save_strategy steps \
|
| 692 |
--save_total_limit 1 \
|
| 693 |
--load_best_model_at_end \
|
|
|
|
| 738 |
--logging_strategy steps \
|
| 739 |
--logging_steps 10 \
|
| 740 |
--metric_for_best_model eval_exact_match_for_wic \
|
| 741 |
+
--evaluation_strategy steps \
|
| 742 |
--save_strategy steps \
|
| 743 |
--save_total_limit 1 \
|
| 744 |
--load_best_model_at_end \
|
root_gainlora/gen_script_long_order3_t5_inflora.sh
CHANGED
|
@@ -38,7 +38,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 38 |
--logging_strategy steps \
|
| 39 |
--logging_steps 10 \
|
| 40 |
--metric_for_best_model eval_exact_match \
|
| 41 |
-
--eval_strategy steps \
|
| 42 |
--save_strategy steps \
|
| 43 |
--save_total_limit 1 \
|
| 44 |
--load_best_model_at_end \
|
|
@@ -87,7 +87,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 87 |
--logging_strategy steps \
|
| 88 |
--logging_steps 10 \
|
| 89 |
--metric_for_best_model eval_exact_match_for_amazon \
|
| 90 |
-
--eval_strategy steps \
|
| 91 |
--save_strategy steps \
|
| 92 |
--save_total_limit 1 \
|
| 93 |
--load_best_model_at_end \
|
|
@@ -136,7 +136,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 136 |
--logging_strategy steps \
|
| 137 |
--logging_steps 10 \
|
| 138 |
--metric_for_best_model eval_exact_match_for_mnli \
|
| 139 |
-
--eval_strategy steps \
|
| 140 |
--save_strategy steps \
|
| 141 |
--save_total_limit 1 \
|
| 142 |
--load_best_model_at_end \
|
|
@@ -185,7 +185,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 185 |
--logging_strategy steps \
|
| 186 |
--logging_steps 10 \
|
| 187 |
--metric_for_best_model eval_exact_match_for_cb \
|
| 188 |
-
--eval_strategy steps \
|
| 189 |
--save_strategy steps \
|
| 190 |
--save_total_limit 1 \
|
| 191 |
--load_best_model_at_end \
|
|
@@ -234,7 +234,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 234 |
--logging_strategy steps \
|
| 235 |
--logging_steps 10 \
|
| 236 |
--metric_for_best_model eval_exact_match_for_copa \
|
| 237 |
-
--eval_strategy steps \
|
| 238 |
--save_strategy steps \
|
| 239 |
--save_total_limit 1 \
|
| 240 |
--load_best_model_at_end \
|
|
@@ -283,7 +283,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 283 |
--logging_strategy steps \
|
| 284 |
--logging_steps 10 \
|
| 285 |
--metric_for_best_model eval_exact_match_for_qqp \
|
| 286 |
-
--eval_strategy steps \
|
| 287 |
--save_strategy steps \
|
| 288 |
--save_total_limit 1 \
|
| 289 |
--load_best_model_at_end \
|
|
@@ -332,7 +332,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 332 |
--logging_strategy steps \
|
| 333 |
--logging_steps 10 \
|
| 334 |
--metric_for_best_model eval_exact_match_for_rte \
|
| 335 |
-
--eval_strategy steps \
|
| 336 |
--save_strategy steps \
|
| 337 |
--save_total_limit 1 \
|
| 338 |
--load_best_model_at_end \
|
|
@@ -381,7 +381,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 381 |
--logging_strategy steps \
|
| 382 |
--logging_steps 10 \
|
| 383 |
--metric_for_best_model eval_exact_match_for_imdb \
|
| 384 |
-
--eval_strategy steps \
|
| 385 |
--save_strategy steps \
|
| 386 |
--save_total_limit 1 \
|
| 387 |
--load_best_model_at_end \
|
|
@@ -430,7 +430,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 430 |
--logging_strategy steps \
|
| 431 |
--logging_steps 10 \
|
| 432 |
--metric_for_best_model eval_exact_match_for_sst2 \
|
| 433 |
-
--eval_strategy steps \
|
| 434 |
--save_strategy steps \
|
| 435 |
--save_total_limit 1 \
|
| 436 |
--load_best_model_at_end \
|
|
@@ -479,7 +479,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 479 |
--logging_strategy steps \
|
| 480 |
--logging_steps 10 \
|
| 481 |
--metric_for_best_model eval_exact_match_for_dbpedia \
|
| 482 |
-
--eval_strategy steps \
|
| 483 |
--save_strategy steps \
|
| 484 |
--save_total_limit 1 \
|
| 485 |
--load_best_model_at_end \
|
|
@@ -528,7 +528,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 528 |
--logging_strategy steps \
|
| 529 |
--logging_steps 10 \
|
| 530 |
--metric_for_best_model eval_exact_match_for_agnews \
|
| 531 |
-
--eval_strategy steps \
|
| 532 |
--save_strategy steps \
|
| 533 |
--save_total_limit 1 \
|
| 534 |
--load_best_model_at_end \
|
|
@@ -577,7 +577,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 577 |
--logging_strategy steps \
|
| 578 |
--logging_steps 10 \
|
| 579 |
--metric_for_best_model eval_exact_match_for_yahoo \
|
| 580 |
-
--eval_strategy steps \
|
| 581 |
--save_strategy steps \
|
| 582 |
--save_total_limit 1 \
|
| 583 |
--load_best_model_at_end \
|
|
@@ -626,7 +626,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 626 |
--logging_strategy steps \
|
| 627 |
--logging_steps 10 \
|
| 628 |
--metric_for_best_model eval_exact_match_for_multirc \
|
| 629 |
-
--eval_strategy steps \
|
| 630 |
--save_strategy steps \
|
| 631 |
--save_total_limit 1 \
|
| 632 |
--load_best_model_at_end \
|
|
@@ -675,7 +675,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 675 |
--logging_strategy steps \
|
| 676 |
--logging_steps 10 \
|
| 677 |
--metric_for_best_model eval_exact_match_for_boolq \
|
| 678 |
-
--eval_strategy steps \
|
| 679 |
--save_strategy steps \
|
| 680 |
--save_total_limit 1 \
|
| 681 |
--load_best_model_at_end \
|
|
@@ -724,7 +724,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 724 |
--logging_strategy steps \
|
| 725 |
--logging_steps 10 \
|
| 726 |
--metric_for_best_model eval_exact_match_for_wic \
|
| 727 |
-
--eval_strategy steps \
|
| 728 |
--save_strategy steps \
|
| 729 |
--save_total_limit 1 \
|
| 730 |
--load_best_model_at_end \
|
|
|
|
| 38 |
--logging_strategy steps \
|
| 39 |
--logging_steps 10 \
|
| 40 |
--metric_for_best_model eval_exact_match \
|
| 41 |
+
--evaluation_strategy steps \
|
| 42 |
--save_strategy steps \
|
| 43 |
--save_total_limit 1 \
|
| 44 |
--load_best_model_at_end \
|
|
|
|
| 87 |
--logging_strategy steps \
|
| 88 |
--logging_steps 10 \
|
| 89 |
--metric_for_best_model eval_exact_match_for_amazon \
|
| 90 |
+
--evaluation_strategy steps \
|
| 91 |
--save_strategy steps \
|
| 92 |
--save_total_limit 1 \
|
| 93 |
--load_best_model_at_end \
|
|
|
|
| 136 |
--logging_strategy steps \
|
| 137 |
--logging_steps 10 \
|
| 138 |
--metric_for_best_model eval_exact_match_for_mnli \
|
| 139 |
+
--evaluation_strategy steps \
|
| 140 |
--save_strategy steps \
|
| 141 |
--save_total_limit 1 \
|
| 142 |
--load_best_model_at_end \
|
|
|
|
| 185 |
--logging_strategy steps \
|
| 186 |
--logging_steps 10 \
|
| 187 |
--metric_for_best_model eval_exact_match_for_cb \
|
| 188 |
+
--evaluation_strategy steps \
|
| 189 |
--save_strategy steps \
|
| 190 |
--save_total_limit 1 \
|
| 191 |
--load_best_model_at_end \
|
|
|
|
| 234 |
--logging_strategy steps \
|
| 235 |
--logging_steps 10 \
|
| 236 |
--metric_for_best_model eval_exact_match_for_copa \
|
| 237 |
+
--evaluation_strategy steps \
|
| 238 |
--save_strategy steps \
|
| 239 |
--save_total_limit 1 \
|
| 240 |
--load_best_model_at_end \
|
|
|
|
| 283 |
--logging_strategy steps \
|
| 284 |
--logging_steps 10 \
|
| 285 |
--metric_for_best_model eval_exact_match_for_qqp \
|
| 286 |
+
--evaluation_strategy steps \
|
| 287 |
--save_strategy steps \
|
| 288 |
--save_total_limit 1 \
|
| 289 |
--load_best_model_at_end \
|
|
|
|
| 332 |
--logging_strategy steps \
|
| 333 |
--logging_steps 10 \
|
| 334 |
--metric_for_best_model eval_exact_match_for_rte \
|
| 335 |
+
--evaluation_strategy steps \
|
| 336 |
--save_strategy steps \
|
| 337 |
--save_total_limit 1 \
|
| 338 |
--load_best_model_at_end \
|
|
|
|
| 381 |
--logging_strategy steps \
|
| 382 |
--logging_steps 10 \
|
| 383 |
--metric_for_best_model eval_exact_match_for_imdb \
|
| 384 |
+
--evaluation_strategy steps \
|
| 385 |
--save_strategy steps \
|
| 386 |
--save_total_limit 1 \
|
| 387 |
--load_best_model_at_end \
|
|
|
|
| 430 |
--logging_strategy steps \
|
| 431 |
--logging_steps 10 \
|
| 432 |
--metric_for_best_model eval_exact_match_for_sst2 \
|
| 433 |
+
--evaluation_strategy steps \
|
| 434 |
--save_strategy steps \
|
| 435 |
--save_total_limit 1 \
|
| 436 |
--load_best_model_at_end \
|
|
|
|
| 479 |
--logging_strategy steps \
|
| 480 |
--logging_steps 10 \
|
| 481 |
--metric_for_best_model eval_exact_match_for_dbpedia \
|
| 482 |
+
--evaluation_strategy steps \
|
| 483 |
--save_strategy steps \
|
| 484 |
--save_total_limit 1 \
|
| 485 |
--load_best_model_at_end \
|
|
|
|
| 528 |
--logging_strategy steps \
|
| 529 |
--logging_steps 10 \
|
| 530 |
--metric_for_best_model eval_exact_match_for_agnews \
|
| 531 |
+
--evaluation_strategy steps \
|
| 532 |
--save_strategy steps \
|
| 533 |
--save_total_limit 1 \
|
| 534 |
--load_best_model_at_end \
|
|
|
|
| 577 |
--logging_strategy steps \
|
| 578 |
--logging_steps 10 \
|
| 579 |
--metric_for_best_model eval_exact_match_for_yahoo \
|
| 580 |
+
--evaluation_strategy steps \
|
| 581 |
--save_strategy steps \
|
| 582 |
--save_total_limit 1 \
|
| 583 |
--load_best_model_at_end \
|
|
|
|
| 626 |
--logging_strategy steps \
|
| 627 |
--logging_steps 10 \
|
| 628 |
--metric_for_best_model eval_exact_match_for_multirc \
|
| 629 |
+
--evaluation_strategy steps \
|
| 630 |
--save_strategy steps \
|
| 631 |
--save_total_limit 1 \
|
| 632 |
--load_best_model_at_end \
|
|
|
|
| 675 |
--logging_strategy steps \
|
| 676 |
--logging_steps 10 \
|
| 677 |
--metric_for_best_model eval_exact_match_for_boolq \
|
| 678 |
+
--evaluation_strategy steps \
|
| 679 |
--save_strategy steps \
|
| 680 |
--save_total_limit 1 \
|
| 681 |
--load_best_model_at_end \
|
|
|
|
| 724 |
--logging_strategy steps \
|
| 725 |
--logging_steps 10 \
|
| 726 |
--metric_for_best_model eval_exact_match_for_wic \
|
| 727 |
+
--evaluation_strategy steps \
|
| 728 |
--save_strategy steps \
|
| 729 |
--save_total_limit 1 \
|
| 730 |
--load_best_model_at_end \
|
root_gainlora/gen_script_long_order4_t5_gainlora_inflora.sh
CHANGED
|
@@ -38,7 +38,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 38 |
--logging_strategy steps \
|
| 39 |
--logging_steps 10 \
|
| 40 |
--metric_for_best_model eval_exact_match \
|
| 41 |
-
--eval_strategy steps \
|
| 42 |
--save_strategy steps \
|
| 43 |
--save_total_limit 1 \
|
| 44 |
--load_best_model_at_end \
|
|
@@ -89,7 +89,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 89 |
--logging_strategy steps \
|
| 90 |
--logging_steps 10 \
|
| 91 |
--metric_for_best_model eval_exact_match_for_cb \
|
| 92 |
-
--eval_strategy steps \
|
| 93 |
--save_strategy steps \
|
| 94 |
--save_total_limit 1 \
|
| 95 |
--load_best_model_at_end \
|
|
@@ -140,7 +140,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 140 |
--logging_strategy steps \
|
| 141 |
--logging_steps 10 \
|
| 142 |
--metric_for_best_model eval_exact_match_for_wic \
|
| 143 |
-
--eval_strategy steps \
|
| 144 |
--save_strategy steps \
|
| 145 |
--save_total_limit 1 \
|
| 146 |
--load_best_model_at_end \
|
|
@@ -191,7 +191,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 191 |
--logging_strategy steps \
|
| 192 |
--logging_steps 10 \
|
| 193 |
--metric_for_best_model eval_exact_match_for_copa \
|
| 194 |
-
--eval_strategy steps \
|
| 195 |
--save_strategy steps \
|
| 196 |
--save_total_limit 1 \
|
| 197 |
--load_best_model_at_end \
|
|
@@ -242,7 +242,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 242 |
--logging_strategy steps \
|
| 243 |
--logging_steps 10 \
|
| 244 |
--metric_for_best_model eval_exact_match_for_qqp \
|
| 245 |
-
--eval_strategy steps \
|
| 246 |
--save_strategy steps \
|
| 247 |
--save_total_limit 1 \
|
| 248 |
--load_best_model_at_end \
|
|
@@ -293,7 +293,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 293 |
--logging_strategy steps \
|
| 294 |
--logging_steps 10 \
|
| 295 |
--metric_for_best_model eval_exact_match_for_boolq \
|
| 296 |
-
--eval_strategy steps \
|
| 297 |
--save_strategy steps \
|
| 298 |
--save_total_limit 1 \
|
| 299 |
--load_best_model_at_end \
|
|
@@ -344,7 +344,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 344 |
--logging_strategy steps \
|
| 345 |
--logging_steps 10 \
|
| 346 |
--metric_for_best_model eval_exact_match_for_rte \
|
| 347 |
-
--eval_strategy steps \
|
| 348 |
--save_strategy steps \
|
| 349 |
--save_total_limit 1 \
|
| 350 |
--load_best_model_at_end \
|
|
@@ -395,7 +395,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 395 |
--logging_strategy steps \
|
| 396 |
--logging_steps 10 \
|
| 397 |
--metric_for_best_model eval_exact_match_for_imdb \
|
| 398 |
-
--eval_strategy steps \
|
| 399 |
--save_strategy steps \
|
| 400 |
--save_total_limit 1 \
|
| 401 |
--load_best_model_at_end \
|
|
@@ -446,7 +446,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 446 |
--logging_strategy steps \
|
| 447 |
--logging_steps 10 \
|
| 448 |
--metric_for_best_model eval_exact_match_for_yelp \
|
| 449 |
-
--eval_strategy steps \
|
| 450 |
--save_strategy steps \
|
| 451 |
--save_total_limit 1 \
|
| 452 |
--load_best_model_at_end \
|
|
@@ -497,7 +497,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 497 |
--logging_strategy steps \
|
| 498 |
--logging_steps 10 \
|
| 499 |
--metric_for_best_model eval_exact_match_for_amazon \
|
| 500 |
-
--eval_strategy steps \
|
| 501 |
--save_strategy steps \
|
| 502 |
--save_total_limit 1 \
|
| 503 |
--load_best_model_at_end \
|
|
@@ -548,7 +548,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 548 |
--logging_strategy steps \
|
| 549 |
--logging_steps 10 \
|
| 550 |
--metric_for_best_model eval_exact_match_for_sst2 \
|
| 551 |
-
--eval_strategy steps \
|
| 552 |
--save_strategy steps \
|
| 553 |
--save_total_limit 1 \
|
| 554 |
--load_best_model_at_end \
|
|
@@ -599,7 +599,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 599 |
--logging_strategy steps \
|
| 600 |
--logging_steps 10 \
|
| 601 |
--metric_for_best_model eval_exact_match_for_dbpedia \
|
| 602 |
-
--eval_strategy steps \
|
| 603 |
--save_strategy steps \
|
| 604 |
--save_total_limit 1 \
|
| 605 |
--load_best_model_at_end \
|
|
@@ -650,7 +650,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 650 |
--logging_strategy steps \
|
| 651 |
--logging_steps 10 \
|
| 652 |
--metric_for_best_model eval_exact_match_for_agnews \
|
| 653 |
-
--eval_strategy steps \
|
| 654 |
--save_strategy steps \
|
| 655 |
--save_total_limit 1 \
|
| 656 |
--load_best_model_at_end \
|
|
@@ -701,7 +701,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 701 |
--logging_strategy steps \
|
| 702 |
--logging_steps 10 \
|
| 703 |
--metric_for_best_model eval_exact_match_for_multirc \
|
| 704 |
-
--eval_strategy steps \
|
| 705 |
--save_strategy steps \
|
| 706 |
--save_total_limit 1 \
|
| 707 |
--load_best_model_at_end \
|
|
@@ -752,7 +752,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 752 |
--logging_strategy steps \
|
| 753 |
--logging_steps 10 \
|
| 754 |
--metric_for_best_model eval_exact_match_for_yahoo \
|
| 755 |
-
--eval_strategy steps \
|
| 756 |
--save_strategy steps \
|
| 757 |
--save_total_limit 1 \
|
| 758 |
--load_best_model_at_end \
|
|
|
|
| 38 |
--logging_strategy steps \
|
| 39 |
--logging_steps 10 \
|
| 40 |
--metric_for_best_model eval_exact_match \
|
| 41 |
+
--evaluation_strategy steps \
|
| 42 |
--save_strategy steps \
|
| 43 |
--save_total_limit 1 \
|
| 44 |
--load_best_model_at_end \
|
|
|
|
| 89 |
--logging_strategy steps \
|
| 90 |
--logging_steps 10 \
|
| 91 |
--metric_for_best_model eval_exact_match_for_cb \
|
| 92 |
+
--evaluation_strategy steps \
|
| 93 |
--save_strategy steps \
|
| 94 |
--save_total_limit 1 \
|
| 95 |
--load_best_model_at_end \
|
|
|
|
| 140 |
--logging_strategy steps \
|
| 141 |
--logging_steps 10 \
|
| 142 |
--metric_for_best_model eval_exact_match_for_wic \
|
| 143 |
+
--evaluation_strategy steps \
|
| 144 |
--save_strategy steps \
|
| 145 |
--save_total_limit 1 \
|
| 146 |
--load_best_model_at_end \
|
|
|
|
| 191 |
--logging_strategy steps \
|
| 192 |
--logging_steps 10 \
|
| 193 |
--metric_for_best_model eval_exact_match_for_copa \
|
| 194 |
+
--evaluation_strategy steps \
|
| 195 |
--save_strategy steps \
|
| 196 |
--save_total_limit 1 \
|
| 197 |
--load_best_model_at_end \
|
|
|
|
| 242 |
--logging_strategy steps \
|
| 243 |
--logging_steps 10 \
|
| 244 |
--metric_for_best_model eval_exact_match_for_qqp \
|
| 245 |
+
--evaluation_strategy steps \
|
| 246 |
--save_strategy steps \
|
| 247 |
--save_total_limit 1 \
|
| 248 |
--load_best_model_at_end \
|
|
|
|
| 293 |
--logging_strategy steps \
|
| 294 |
--logging_steps 10 \
|
| 295 |
--metric_for_best_model eval_exact_match_for_boolq \
|
| 296 |
+
--evaluation_strategy steps \
|
| 297 |
--save_strategy steps \
|
| 298 |
--save_total_limit 1 \
|
| 299 |
--load_best_model_at_end \
|
|
|
|
| 344 |
--logging_strategy steps \
|
| 345 |
--logging_steps 10 \
|
| 346 |
--metric_for_best_model eval_exact_match_for_rte \
|
| 347 |
+
--evaluation_strategy steps \
|
| 348 |
--save_strategy steps \
|
| 349 |
--save_total_limit 1 \
|
| 350 |
--load_best_model_at_end \
|
|
|
|
| 395 |
--logging_strategy steps \
|
| 396 |
--logging_steps 10 \
|
| 397 |
--metric_for_best_model eval_exact_match_for_imdb \
|
| 398 |
+
--evaluation_strategy steps \
|
| 399 |
--save_strategy steps \
|
| 400 |
--save_total_limit 1 \
|
| 401 |
--load_best_model_at_end \
|
|
|
|
| 446 |
--logging_strategy steps \
|
| 447 |
--logging_steps 10 \
|
| 448 |
--metric_for_best_model eval_exact_match_for_yelp \
|
| 449 |
+
--evaluation_strategy steps \
|
| 450 |
--save_strategy steps \
|
| 451 |
--save_total_limit 1 \
|
| 452 |
--load_best_model_at_end \
|
|
|
|
| 497 |
--logging_strategy steps \
|
| 498 |
--logging_steps 10 \
|
| 499 |
--metric_for_best_model eval_exact_match_for_amazon \
|
| 500 |
+
--evaluation_strategy steps \
|
| 501 |
--save_strategy steps \
|
| 502 |
--save_total_limit 1 \
|
| 503 |
--load_best_model_at_end \
|
|
|
|
| 548 |
--logging_strategy steps \
|
| 549 |
--logging_steps 10 \
|
| 550 |
--metric_for_best_model eval_exact_match_for_sst2 \
|
| 551 |
+
--evaluation_strategy steps \
|
| 552 |
--save_strategy steps \
|
| 553 |
--save_total_limit 1 \
|
| 554 |
--load_best_model_at_end \
|
|
|
|
| 599 |
--logging_strategy steps \
|
| 600 |
--logging_steps 10 \
|
| 601 |
--metric_for_best_model eval_exact_match_for_dbpedia \
|
| 602 |
+
--evaluation_strategy steps \
|
| 603 |
--save_strategy steps \
|
| 604 |
--save_total_limit 1 \
|
| 605 |
--load_best_model_at_end \
|
|
|
|
| 650 |
--logging_strategy steps \
|
| 651 |
--logging_steps 10 \
|
| 652 |
--metric_for_best_model eval_exact_match_for_agnews \
|
| 653 |
+
--evaluation_strategy steps \
|
| 654 |
--save_strategy steps \
|
| 655 |
--save_total_limit 1 \
|
| 656 |
--load_best_model_at_end \
|
|
|
|
| 701 |
--logging_strategy steps \
|
| 702 |
--logging_steps 10 \
|
| 703 |
--metric_for_best_model eval_exact_match_for_multirc \
|
| 704 |
+
--evaluation_strategy steps \
|
| 705 |
--save_strategy steps \
|
| 706 |
--save_total_limit 1 \
|
| 707 |
--load_best_model_at_end \
|
|
|
|
| 752 |
--logging_strategy steps \
|
| 753 |
--logging_steps 10 \
|
| 754 |
--metric_for_best_model eval_exact_match_for_yahoo \
|
| 755 |
+
--evaluation_strategy steps \
|
| 756 |
--save_strategy steps \
|
| 757 |
--save_total_limit 1 \
|
| 758 |
--load_best_model_at_end \
|
root_gainlora/gen_script_long_order4_t5_inflora.sh
CHANGED
|
@@ -38,7 +38,7 @@ CUDA_VISIBLE_DEVICES=1 python src/run_t5.py \
|
|
| 38 |
--logging_strategy steps \
|
| 39 |
--logging_steps 10 \
|
| 40 |
--metric_for_best_model eval_exact_match \
|
| 41 |
-
--eval_strategy steps \
|
| 42 |
--save_strategy steps \
|
| 43 |
--save_total_limit 1 \
|
| 44 |
--load_best_model_at_end \
|
|
@@ -87,7 +87,7 @@ CUDA_VISIBLE_DEVICES=1 python src/run_t5.py \
|
|
| 87 |
--logging_strategy steps \
|
| 88 |
--logging_steps 10 \
|
| 89 |
--metric_for_best_model eval_exact_match_for_cb \
|
| 90 |
-
--eval_strategy steps \
|
| 91 |
--save_strategy steps \
|
| 92 |
--save_total_limit 1 \
|
| 93 |
--load_best_model_at_end \
|
|
@@ -136,7 +136,7 @@ CUDA_VISIBLE_DEVICES=1 python src/run_t5.py \
|
|
| 136 |
--logging_strategy steps \
|
| 137 |
--logging_steps 10 \
|
| 138 |
--metric_for_best_model eval_exact_match_for_wic \
|
| 139 |
-
--eval_strategy steps \
|
| 140 |
--save_strategy steps \
|
| 141 |
--save_total_limit 1 \
|
| 142 |
--load_best_model_at_end \
|
|
@@ -185,7 +185,7 @@ CUDA_VISIBLE_DEVICES=1 python src/run_t5.py \
|
|
| 185 |
--logging_strategy steps \
|
| 186 |
--logging_steps 10 \
|
| 187 |
--metric_for_best_model eval_exact_match_for_copa \
|
| 188 |
-
--eval_strategy steps \
|
| 189 |
--save_strategy steps \
|
| 190 |
--save_total_limit 1 \
|
| 191 |
--load_best_model_at_end \
|
|
@@ -234,7 +234,7 @@ CUDA_VISIBLE_DEVICES=1 python src/run_t5.py \
|
|
| 234 |
--logging_strategy steps \
|
| 235 |
--logging_steps 10 \
|
| 236 |
--metric_for_best_model eval_exact_match_for_qqp \
|
| 237 |
-
--eval_strategy steps \
|
| 238 |
--save_strategy steps \
|
| 239 |
--save_total_limit 1 \
|
| 240 |
--load_best_model_at_end \
|
|
@@ -283,7 +283,7 @@ CUDA_VISIBLE_DEVICES=1 python src/run_t5.py \
|
|
| 283 |
--logging_strategy steps \
|
| 284 |
--logging_steps 10 \
|
| 285 |
--metric_for_best_model eval_exact_match_for_boolq \
|
| 286 |
-
--eval_strategy steps \
|
| 287 |
--save_strategy steps \
|
| 288 |
--save_total_limit 1 \
|
| 289 |
--load_best_model_at_end \
|
|
@@ -332,7 +332,7 @@ CUDA_VISIBLE_DEVICES=1 python src/run_t5.py \
|
|
| 332 |
--logging_strategy steps \
|
| 333 |
--logging_steps 10 \
|
| 334 |
--metric_for_best_model eval_exact_match_for_rte \
|
| 335 |
-
--eval_strategy steps \
|
| 336 |
--save_strategy steps \
|
| 337 |
--save_total_limit 1 \
|
| 338 |
--load_best_model_at_end \
|
|
@@ -381,7 +381,7 @@ CUDA_VISIBLE_DEVICES=1 python src/run_t5.py \
|
|
| 381 |
--logging_strategy steps \
|
| 382 |
--logging_steps 10 \
|
| 383 |
--metric_for_best_model eval_exact_match_for_imdb \
|
| 384 |
-
--eval_strategy steps \
|
| 385 |
--save_strategy steps \
|
| 386 |
--save_total_limit 1 \
|
| 387 |
--load_best_model_at_end \
|
|
@@ -430,7 +430,7 @@ CUDA_VISIBLE_DEVICES=1 python src/run_t5.py \
|
|
| 430 |
--logging_strategy steps \
|
| 431 |
--logging_steps 10 \
|
| 432 |
--metric_for_best_model eval_exact_match_for_yelp \
|
| 433 |
-
--eval_strategy steps \
|
| 434 |
--save_strategy steps \
|
| 435 |
--save_total_limit 1 \
|
| 436 |
--load_best_model_at_end \
|
|
@@ -479,7 +479,7 @@ CUDA_VISIBLE_DEVICES=1 python src/run_t5.py \
|
|
| 479 |
--logging_strategy steps \
|
| 480 |
--logging_steps 10 \
|
| 481 |
--metric_for_best_model eval_exact_match_for_amazon \
|
| 482 |
-
--eval_strategy steps \
|
| 483 |
--save_strategy steps \
|
| 484 |
--save_total_limit 1 \
|
| 485 |
--load_best_model_at_end \
|
|
@@ -528,7 +528,7 @@ CUDA_VISIBLE_DEVICES=1 python src/run_t5.py \
|
|
| 528 |
--logging_strategy steps \
|
| 529 |
--logging_steps 10 \
|
| 530 |
--metric_for_best_model eval_exact_match_for_sst2 \
|
| 531 |
-
--eval_strategy steps \
|
| 532 |
--save_strategy steps \
|
| 533 |
--save_total_limit 1 \
|
| 534 |
--load_best_model_at_end \
|
|
@@ -577,7 +577,7 @@ CUDA_VISIBLE_DEVICES=1 python src/run_t5.py \
|
|
| 577 |
--logging_strategy steps \
|
| 578 |
--logging_steps 10 \
|
| 579 |
--metric_for_best_model eval_exact_match_for_dbpedia \
|
| 580 |
-
--eval_strategy steps \
|
| 581 |
--save_strategy steps \
|
| 582 |
--save_total_limit 1 \
|
| 583 |
--load_best_model_at_end \
|
|
@@ -626,7 +626,7 @@ CUDA_VISIBLE_DEVICES=1 python src/run_t5.py \
|
|
| 626 |
--logging_strategy steps \
|
| 627 |
--logging_steps 10 \
|
| 628 |
--metric_for_best_model eval_exact_match_for_agnews \
|
| 629 |
-
--eval_strategy steps \
|
| 630 |
--save_strategy steps \
|
| 631 |
--save_total_limit 1 \
|
| 632 |
--load_best_model_at_end \
|
|
@@ -675,7 +675,7 @@ CUDA_VISIBLE_DEVICES=1 python src/run_t5.py \
|
|
| 675 |
--logging_strategy steps \
|
| 676 |
--logging_steps 10 \
|
| 677 |
--metric_for_best_model eval_exact_match_for_multirc \
|
| 678 |
-
--eval_strategy steps \
|
| 679 |
--save_strategy steps \
|
| 680 |
--save_total_limit 1 \
|
| 681 |
--load_best_model_at_end \
|
|
@@ -724,7 +724,7 @@ CUDA_VISIBLE_DEVICES=1 python src/run_t5.py \
|
|
| 724 |
--logging_strategy steps \
|
| 725 |
--logging_steps 10 \
|
| 726 |
--metric_for_best_model eval_exact_match_for_yahoo \
|
| 727 |
-
--eval_strategy steps \
|
| 728 |
--save_strategy steps \
|
| 729 |
--save_total_limit 1 \
|
| 730 |
--load_best_model_at_end \
|
|
|
|
| 38 |
--logging_strategy steps \
|
| 39 |
--logging_steps 10 \
|
| 40 |
--metric_for_best_model eval_exact_match \
|
| 41 |
+
--evaluation_strategy steps \
|
| 42 |
--save_strategy steps \
|
| 43 |
--save_total_limit 1 \
|
| 44 |
--load_best_model_at_end \
|
|
|
|
| 87 |
--logging_strategy steps \
|
| 88 |
--logging_steps 10 \
|
| 89 |
--metric_for_best_model eval_exact_match_for_cb \
|
| 90 |
+
--evaluation_strategy steps \
|
| 91 |
--save_strategy steps \
|
| 92 |
--save_total_limit 1 \
|
| 93 |
--load_best_model_at_end \
|
|
|
|
| 136 |
--logging_strategy steps \
|
| 137 |
--logging_steps 10 \
|
| 138 |
--metric_for_best_model eval_exact_match_for_wic \
|
| 139 |
+
--evaluation_strategy steps \
|
| 140 |
--save_strategy steps \
|
| 141 |
--save_total_limit 1 \
|
| 142 |
--load_best_model_at_end \
|
|
|
|
| 185 |
--logging_strategy steps \
|
| 186 |
--logging_steps 10 \
|
| 187 |
--metric_for_best_model eval_exact_match_for_copa \
|
| 188 |
+
--evaluation_strategy steps \
|
| 189 |
--save_strategy steps \
|
| 190 |
--save_total_limit 1 \
|
| 191 |
--load_best_model_at_end \
|
|
|
|
| 234 |
--logging_strategy steps \
|
| 235 |
--logging_steps 10 \
|
| 236 |
--metric_for_best_model eval_exact_match_for_qqp \
|
| 237 |
+
--evaluation_strategy steps \
|
| 238 |
--save_strategy steps \
|
| 239 |
--save_total_limit 1 \
|
| 240 |
--load_best_model_at_end \
|
|
|
|
| 283 |
--logging_strategy steps \
|
| 284 |
--logging_steps 10 \
|
| 285 |
--metric_for_best_model eval_exact_match_for_boolq \
|
| 286 |
+
--evaluation_strategy steps \
|
| 287 |
--save_strategy steps \
|
| 288 |
--save_total_limit 1 \
|
| 289 |
--load_best_model_at_end \
|
|
|
|
| 332 |
--logging_strategy steps \
|
| 333 |
--logging_steps 10 \
|
| 334 |
--metric_for_best_model eval_exact_match_for_rte \
|
| 335 |
+
--evaluation_strategy steps \
|
| 336 |
--save_strategy steps \
|
| 337 |
--save_total_limit 1 \
|
| 338 |
--load_best_model_at_end \
|
|
|
|
| 381 |
--logging_strategy steps \
|
| 382 |
--logging_steps 10 \
|
| 383 |
--metric_for_best_model eval_exact_match_for_imdb \
|
| 384 |
+
--evaluation_strategy steps \
|
| 385 |
--save_strategy steps \
|
| 386 |
--save_total_limit 1 \
|
| 387 |
--load_best_model_at_end \
|
|
|
|
| 430 |
--logging_strategy steps \
|
| 431 |
--logging_steps 10 \
|
| 432 |
--metric_for_best_model eval_exact_match_for_yelp \
|
| 433 |
+
--evaluation_strategy steps \
|
| 434 |
--save_strategy steps \
|
| 435 |
--save_total_limit 1 \
|
| 436 |
--load_best_model_at_end \
|
|
|
|
| 479 |
--logging_strategy steps \
|
| 480 |
--logging_steps 10 \
|
| 481 |
--metric_for_best_model eval_exact_match_for_amazon \
|
| 482 |
+
--evaluation_strategy steps \
|
| 483 |
--save_strategy steps \
|
| 484 |
--save_total_limit 1 \
|
| 485 |
--load_best_model_at_end \
|
|
|
|
| 528 |
--logging_strategy steps \
|
| 529 |
--logging_steps 10 \
|
| 530 |
--metric_for_best_model eval_exact_match_for_sst2 \
|
| 531 |
+
--evaluation_strategy steps \
|
| 532 |
--save_strategy steps \
|
| 533 |
--save_total_limit 1 \
|
| 534 |
--load_best_model_at_end \
|
|
|
|
| 577 |
--logging_strategy steps \
|
| 578 |
--logging_steps 10 \
|
| 579 |
--metric_for_best_model eval_exact_match_for_dbpedia \
|
| 580 |
+
--evaluation_strategy steps \
|
| 581 |
--save_strategy steps \
|
| 582 |
--save_total_limit 1 \
|
| 583 |
--load_best_model_at_end \
|
|
|
|
| 626 |
--logging_strategy steps \
|
| 627 |
--logging_steps 10 \
|
| 628 |
--metric_for_best_model eval_exact_match_for_agnews \
|
| 629 |
+
--evaluation_strategy steps \
|
| 630 |
--save_strategy steps \
|
| 631 |
--save_total_limit 1 \
|
| 632 |
--load_best_model_at_end \
|
|
|
|
| 675 |
--logging_strategy steps \
|
| 676 |
--logging_steps 10 \
|
| 677 |
--metric_for_best_model eval_exact_match_for_multirc \
|
| 678 |
+
--evaluation_strategy steps \
|
| 679 |
--save_strategy steps \
|
| 680 |
--save_total_limit 1 \
|
| 681 |
--load_best_model_at_end \
|
|
|
|
| 724 |
--logging_strategy steps \
|
| 725 |
--logging_steps 10 \
|
| 726 |
--metric_for_best_model eval_exact_match_for_yahoo \
|
| 727 |
+
--evaluation_strategy steps \
|
| 728 |
--save_strategy steps \
|
| 729 |
--save_total_limit 1 \
|
| 730 |
--load_best_model_at_end \
|
root_gainlora/gen_script_superni_order1_llama_gainlora_inflora.sh
CHANGED
|
@@ -41,7 +41,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 41 |
--logging_strategy steps \
|
| 42 |
--logging_steps 10 \
|
| 43 |
--metric_for_best_model eval_rougeL \
|
| 44 |
-
--eval_strategy steps \
|
| 45 |
--save_strategy steps \
|
| 46 |
--save_total_limit 1 \
|
| 47 |
--lora_r 4 \
|
|
@@ -97,7 +97,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 97 |
--logging_strategy steps \
|
| 98 |
--logging_steps 10 \
|
| 99 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 100 |
-
--eval_strategy steps \
|
| 101 |
--save_strategy steps \
|
| 102 |
--save_total_limit 1 \
|
| 103 |
--load_best_model_at_end \
|
|
@@ -154,7 +154,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 154 |
--logging_strategy steps \
|
| 155 |
--logging_steps 10 \
|
| 156 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 157 |
-
--eval_strategy steps \
|
| 158 |
--save_strategy steps \
|
| 159 |
--save_total_limit 1 \
|
| 160 |
--load_best_model_at_end \
|
|
@@ -211,7 +211,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 211 |
--logging_strategy steps \
|
| 212 |
--logging_steps 10 \
|
| 213 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 214 |
-
--eval_strategy steps \
|
| 215 |
--save_strategy steps \
|
| 216 |
--save_total_limit 1 \
|
| 217 |
--load_best_model_at_end \
|
|
@@ -268,7 +268,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 268 |
--logging_strategy steps \
|
| 269 |
--logging_steps 10 \
|
| 270 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 271 |
-
--eval_strategy steps \
|
| 272 |
--save_strategy steps \
|
| 273 |
--save_total_limit 1 \
|
| 274 |
--load_best_model_at_end \
|
|
@@ -325,7 +325,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 325 |
--logging_strategy steps \
|
| 326 |
--logging_steps 10 \
|
| 327 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 328 |
-
--eval_strategy steps \
|
| 329 |
--save_strategy steps \
|
| 330 |
--save_total_limit 1 \
|
| 331 |
--load_best_model_at_end \
|
|
@@ -382,7 +382,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 382 |
--logging_strategy steps \
|
| 383 |
--logging_steps 10 \
|
| 384 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 385 |
-
--eval_strategy steps \
|
| 386 |
--save_strategy steps \
|
| 387 |
--save_total_limit 1 \
|
| 388 |
--load_best_model_at_end \
|
|
@@ -439,7 +439,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 439 |
--logging_strategy steps \
|
| 440 |
--logging_steps 10 \
|
| 441 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 442 |
-
--eval_strategy steps \
|
| 443 |
--save_strategy steps \
|
| 444 |
--save_total_limit 1 \
|
| 445 |
--load_best_model_at_end \
|
|
@@ -496,7 +496,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 496 |
--logging_strategy steps \
|
| 497 |
--logging_steps 10 \
|
| 498 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 499 |
-
--eval_strategy steps \
|
| 500 |
--save_strategy steps \
|
| 501 |
--save_total_limit 1 \
|
| 502 |
--load_best_model_at_end \
|
|
@@ -553,7 +553,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 553 |
--logging_strategy steps \
|
| 554 |
--logging_steps 10 \
|
| 555 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 556 |
-
--eval_strategy steps \
|
| 557 |
--save_strategy steps \
|
| 558 |
--save_total_limit 1 \
|
| 559 |
--load_best_model_at_end \
|
|
@@ -610,7 +610,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 610 |
--logging_strategy steps \
|
| 611 |
--logging_steps 10 \
|
| 612 |
--metric_for_best_model eval_rougeL_for_task748_glucose_reverse_cause_event_detection \
|
| 613 |
-
--eval_strategy steps \
|
| 614 |
--save_strategy steps \
|
| 615 |
--save_total_limit 1 \
|
| 616 |
--load_best_model_at_end \
|
|
@@ -667,7 +667,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 667 |
--logging_strategy steps \
|
| 668 |
--logging_steps 10 \
|
| 669 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 670 |
-
--eval_strategy steps \
|
| 671 |
--save_strategy steps \
|
| 672 |
--save_total_limit 1 \
|
| 673 |
--load_best_model_at_end \
|
|
@@ -724,7 +724,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 724 |
--logging_strategy steps \
|
| 725 |
--logging_steps 10 \
|
| 726 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 727 |
-
--eval_strategy steps \
|
| 728 |
--save_strategy steps \
|
| 729 |
--save_total_limit 1 \
|
| 730 |
--load_best_model_at_end \
|
|
@@ -781,7 +781,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 781 |
--logging_strategy steps \
|
| 782 |
--logging_steps 10 \
|
| 783 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 784 |
-
--eval_strategy steps \
|
| 785 |
--save_strategy steps \
|
| 786 |
--save_total_limit 1 \
|
| 787 |
--load_best_model_at_end \
|
|
@@ -838,7 +838,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 838 |
--logging_strategy steps \
|
| 839 |
--logging_steps 10 \
|
| 840 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 841 |
-
--eval_strategy steps \
|
| 842 |
--save_strategy steps \
|
| 843 |
--save_total_limit 1 \
|
| 844 |
--load_best_model_at_end \
|
|
|
|
| 41 |
--logging_strategy steps \
|
| 42 |
--logging_steps 10 \
|
| 43 |
--metric_for_best_model eval_rougeL \
|
| 44 |
+
--evaluation_strategy steps \
|
| 45 |
--save_strategy steps \
|
| 46 |
--save_total_limit 1 \
|
| 47 |
--lora_r 4 \
|
|
|
|
| 97 |
--logging_strategy steps \
|
| 98 |
--logging_steps 10 \
|
| 99 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 100 |
+
--evaluation_strategy steps \
|
| 101 |
--save_strategy steps \
|
| 102 |
--save_total_limit 1 \
|
| 103 |
--load_best_model_at_end \
|
|
|
|
| 154 |
--logging_strategy steps \
|
| 155 |
--logging_steps 10 \
|
| 156 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 157 |
+
--evaluation_strategy steps \
|
| 158 |
--save_strategy steps \
|
| 159 |
--save_total_limit 1 \
|
| 160 |
--load_best_model_at_end \
|
|
|
|
| 211 |
--logging_strategy steps \
|
| 212 |
--logging_steps 10 \
|
| 213 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 214 |
+
--evaluation_strategy steps \
|
| 215 |
--save_strategy steps \
|
| 216 |
--save_total_limit 1 \
|
| 217 |
--load_best_model_at_end \
|
|
|
|
| 268 |
--logging_strategy steps \
|
| 269 |
--logging_steps 10 \
|
| 270 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 271 |
+
--evaluation_strategy steps \
|
| 272 |
--save_strategy steps \
|
| 273 |
--save_total_limit 1 \
|
| 274 |
--load_best_model_at_end \
|
|
|
|
| 325 |
--logging_strategy steps \
|
| 326 |
--logging_steps 10 \
|
| 327 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 328 |
+
--evaluation_strategy steps \
|
| 329 |
--save_strategy steps \
|
| 330 |
--save_total_limit 1 \
|
| 331 |
--load_best_model_at_end \
|
|
|
|
| 382 |
--logging_strategy steps \
|
| 383 |
--logging_steps 10 \
|
| 384 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 385 |
+
--evaluation_strategy steps \
|
| 386 |
--save_strategy steps \
|
| 387 |
--save_total_limit 1 \
|
| 388 |
--load_best_model_at_end \
|
|
|
|
| 439 |
--logging_strategy steps \
|
| 440 |
--logging_steps 10 \
|
| 441 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 442 |
+
--evaluation_strategy steps \
|
| 443 |
--save_strategy steps \
|
| 444 |
--save_total_limit 1 \
|
| 445 |
--load_best_model_at_end \
|
|
|
|
| 496 |
--logging_strategy steps \
|
| 497 |
--logging_steps 10 \
|
| 498 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 499 |
+
--evaluation_strategy steps \
|
| 500 |
--save_strategy steps \
|
| 501 |
--save_total_limit 1 \
|
| 502 |
--load_best_model_at_end \
|
|
|
|
| 553 |
--logging_strategy steps \
|
| 554 |
--logging_steps 10 \
|
| 555 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 556 |
+
--evaluation_strategy steps \
|
| 557 |
--save_strategy steps \
|
| 558 |
--save_total_limit 1 \
|
| 559 |
--load_best_model_at_end \
|
|
|
|
| 610 |
--logging_strategy steps \
|
| 611 |
--logging_steps 10 \
|
| 612 |
--metric_for_best_model eval_rougeL_for_task748_glucose_reverse_cause_event_detection \
|
| 613 |
+
--evaluation_strategy steps \
|
| 614 |
--save_strategy steps \
|
| 615 |
--save_total_limit 1 \
|
| 616 |
--load_best_model_at_end \
|
|
|
|
| 667 |
--logging_strategy steps \
|
| 668 |
--logging_steps 10 \
|
| 669 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 670 |
+
--evaluation_strategy steps \
|
| 671 |
--save_strategy steps \
|
| 672 |
--save_total_limit 1 \
|
| 673 |
--load_best_model_at_end \
|
|
|
|
| 724 |
--logging_strategy steps \
|
| 725 |
--logging_steps 10 \
|
| 726 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 727 |
+
--evaluation_strategy steps \
|
| 728 |
--save_strategy steps \
|
| 729 |
--save_total_limit 1 \
|
| 730 |
--load_best_model_at_end \
|
|
|
|
| 781 |
--logging_strategy steps \
|
| 782 |
--logging_steps 10 \
|
| 783 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 784 |
+
--evaluation_strategy steps \
|
| 785 |
--save_strategy steps \
|
| 786 |
--save_total_limit 1 \
|
| 787 |
--load_best_model_at_end \
|
|
|
|
| 838 |
--logging_strategy steps \
|
| 839 |
--logging_steps 10 \
|
| 840 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 841 |
+
--evaluation_strategy steps \
|
| 842 |
--save_strategy steps \
|
| 843 |
--save_total_limit 1 \
|
| 844 |
--load_best_model_at_end \
|
root_gainlora/gen_script_superni_order1_llama_gainlora_olora.sh
CHANGED
|
@@ -41,7 +41,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 41 |
--logging_strategy steps \
|
| 42 |
--logging_steps 10 \
|
| 43 |
--metric_for_best_model eval_rougeL \
|
| 44 |
-
--eval_strategy steps \
|
| 45 |
--save_strategy steps \
|
| 46 |
--save_total_limit 1 \
|
| 47 |
--lora_r 4 \
|
|
@@ -98,7 +98,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 98 |
--logging_strategy steps \
|
| 99 |
--logging_steps 10 \
|
| 100 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 101 |
-
--eval_strategy steps \
|
| 102 |
--save_strategy steps \
|
| 103 |
--save_total_limit 1 \
|
| 104 |
--load_best_model_at_end \
|
|
@@ -156,7 +156,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 156 |
--logging_strategy steps \
|
| 157 |
--logging_steps 10 \
|
| 158 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 159 |
-
--eval_strategy steps \
|
| 160 |
--save_strategy steps \
|
| 161 |
--save_total_limit 1 \
|
| 162 |
--load_best_model_at_end \
|
|
@@ -214,7 +214,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 214 |
--logging_strategy steps \
|
| 215 |
--logging_steps 10 \
|
| 216 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 217 |
-
--eval_strategy steps \
|
| 218 |
--save_strategy steps \
|
| 219 |
--save_total_limit 1 \
|
| 220 |
--load_best_model_at_end \
|
|
@@ -272,7 +272,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 272 |
--logging_strategy steps \
|
| 273 |
--logging_steps 10 \
|
| 274 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 275 |
-
--eval_strategy steps \
|
| 276 |
--save_strategy steps \
|
| 277 |
--save_total_limit 1 \
|
| 278 |
--load_best_model_at_end \
|
|
@@ -330,7 +330,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 330 |
--logging_strategy steps \
|
| 331 |
--logging_steps 10 \
|
| 332 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 333 |
-
--eval_strategy steps \
|
| 334 |
--save_strategy steps \
|
| 335 |
--save_total_limit 1 \
|
| 336 |
--load_best_model_at_end \
|
|
@@ -388,7 +388,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 388 |
--logging_strategy steps \
|
| 389 |
--logging_steps 10 \
|
| 390 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 391 |
-
--eval_strategy steps \
|
| 392 |
--save_strategy steps \
|
| 393 |
--save_total_limit 1 \
|
| 394 |
--load_best_model_at_end \
|
|
@@ -446,7 +446,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 446 |
--logging_strategy steps \
|
| 447 |
--logging_steps 10 \
|
| 448 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 449 |
-
--eval_strategy steps \
|
| 450 |
--save_strategy steps \
|
| 451 |
--save_total_limit 1 \
|
| 452 |
--load_best_model_at_end \
|
|
@@ -504,7 +504,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 504 |
--logging_strategy steps \
|
| 505 |
--logging_steps 10 \
|
| 506 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 507 |
-
--eval_strategy steps \
|
| 508 |
--save_strategy steps \
|
| 509 |
--save_total_limit 1 \
|
| 510 |
--load_best_model_at_end \
|
|
@@ -562,7 +562,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 562 |
--logging_strategy steps \
|
| 563 |
--logging_steps 10 \
|
| 564 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 565 |
-
--eval_strategy steps \
|
| 566 |
--save_strategy steps \
|
| 567 |
--save_total_limit 1 \
|
| 568 |
--load_best_model_at_end \
|
|
@@ -620,7 +620,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 620 |
--logging_strategy steps \
|
| 621 |
--logging_steps 10 \
|
| 622 |
--metric_for_best_model eval_rougeL_for_task748_glucose_reverse_cause_event_detection \
|
| 623 |
-
--eval_strategy steps \
|
| 624 |
--save_strategy steps \
|
| 625 |
--save_total_limit 1 \
|
| 626 |
--load_best_model_at_end \
|
|
@@ -678,7 +678,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 678 |
--logging_strategy steps \
|
| 679 |
--logging_steps 10 \
|
| 680 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 681 |
-
--eval_strategy steps \
|
| 682 |
--save_strategy steps \
|
| 683 |
--save_total_limit 1 \
|
| 684 |
--load_best_model_at_end \
|
|
@@ -736,7 +736,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 736 |
--logging_strategy steps \
|
| 737 |
--logging_steps 10 \
|
| 738 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 739 |
-
--eval_strategy steps \
|
| 740 |
--save_strategy steps \
|
| 741 |
--save_total_limit 1 \
|
| 742 |
--load_best_model_at_end \
|
|
@@ -794,7 +794,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 794 |
--logging_strategy steps \
|
| 795 |
--logging_steps 10 \
|
| 796 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 797 |
-
--eval_strategy steps \
|
| 798 |
--save_strategy steps \
|
| 799 |
--save_total_limit 1 \
|
| 800 |
--load_best_model_at_end \
|
|
@@ -852,7 +852,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 852 |
--logging_strategy steps \
|
| 853 |
--logging_steps 10 \
|
| 854 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 855 |
-
--eval_strategy steps \
|
| 856 |
--save_strategy steps \
|
| 857 |
--save_total_limit 1 \
|
| 858 |
--load_best_model_at_end \
|
|
|
|
| 41 |
--logging_strategy steps \
|
| 42 |
--logging_steps 10 \
|
| 43 |
--metric_for_best_model eval_rougeL \
|
| 44 |
+
--evaluation_strategy steps \
|
| 45 |
--save_strategy steps \
|
| 46 |
--save_total_limit 1 \
|
| 47 |
--lora_r 4 \
|
|
|
|
| 98 |
--logging_strategy steps \
|
| 99 |
--logging_steps 10 \
|
| 100 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 101 |
+
--evaluation_strategy steps \
|
| 102 |
--save_strategy steps \
|
| 103 |
--save_total_limit 1 \
|
| 104 |
--load_best_model_at_end \
|
|
|
|
| 156 |
--logging_strategy steps \
|
| 157 |
--logging_steps 10 \
|
| 158 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 159 |
+
--evaluation_strategy steps \
|
| 160 |
--save_strategy steps \
|
| 161 |
--save_total_limit 1 \
|
| 162 |
--load_best_model_at_end \
|
|
|
|
| 214 |
--logging_strategy steps \
|
| 215 |
--logging_steps 10 \
|
| 216 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 217 |
+
--evaluation_strategy steps \
|
| 218 |
--save_strategy steps \
|
| 219 |
--save_total_limit 1 \
|
| 220 |
--load_best_model_at_end \
|
|
|
|
| 272 |
--logging_strategy steps \
|
| 273 |
--logging_steps 10 \
|
| 274 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 275 |
+
--evaluation_strategy steps \
|
| 276 |
--save_strategy steps \
|
| 277 |
--save_total_limit 1 \
|
| 278 |
--load_best_model_at_end \
|
|
|
|
| 330 |
--logging_strategy steps \
|
| 331 |
--logging_steps 10 \
|
| 332 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 333 |
+
--evaluation_strategy steps \
|
| 334 |
--save_strategy steps \
|
| 335 |
--save_total_limit 1 \
|
| 336 |
--load_best_model_at_end \
|
|
|
|
| 388 |
--logging_strategy steps \
|
| 389 |
--logging_steps 10 \
|
| 390 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 391 |
+
--evaluation_strategy steps \
|
| 392 |
--save_strategy steps \
|
| 393 |
--save_total_limit 1 \
|
| 394 |
--load_best_model_at_end \
|
|
|
|
| 446 |
--logging_strategy steps \
|
| 447 |
--logging_steps 10 \
|
| 448 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 449 |
+
--evaluation_strategy steps \
|
| 450 |
--save_strategy steps \
|
| 451 |
--save_total_limit 1 \
|
| 452 |
--load_best_model_at_end \
|
|
|
|
| 504 |
--logging_strategy steps \
|
| 505 |
--logging_steps 10 \
|
| 506 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 507 |
+
--evaluation_strategy steps \
|
| 508 |
--save_strategy steps \
|
| 509 |
--save_total_limit 1 \
|
| 510 |
--load_best_model_at_end \
|
|
|
|
| 562 |
--logging_strategy steps \
|
| 563 |
--logging_steps 10 \
|
| 564 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 565 |
+
--evaluation_strategy steps \
|
| 566 |
--save_strategy steps \
|
| 567 |
--save_total_limit 1 \
|
| 568 |
--load_best_model_at_end \
|
|
|
|
| 620 |
--logging_strategy steps \
|
| 621 |
--logging_steps 10 \
|
| 622 |
--metric_for_best_model eval_rougeL_for_task748_glucose_reverse_cause_event_detection \
|
| 623 |
+
--evaluation_strategy steps \
|
| 624 |
--save_strategy steps \
|
| 625 |
--save_total_limit 1 \
|
| 626 |
--load_best_model_at_end \
|
|
|
|
| 678 |
--logging_strategy steps \
|
| 679 |
--logging_steps 10 \
|
| 680 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 681 |
+
--evaluation_strategy steps \
|
| 682 |
--save_strategy steps \
|
| 683 |
--save_total_limit 1 \
|
| 684 |
--load_best_model_at_end \
|
|
|
|
| 736 |
--logging_strategy steps \
|
| 737 |
--logging_steps 10 \
|
| 738 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 739 |
+
--evaluation_strategy steps \
|
| 740 |
--save_strategy steps \
|
| 741 |
--save_total_limit 1 \
|
| 742 |
--load_best_model_at_end \
|
|
|
|
| 794 |
--logging_strategy steps \
|
| 795 |
--logging_steps 10 \
|
| 796 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 797 |
+
--evaluation_strategy steps \
|
| 798 |
--save_strategy steps \
|
| 799 |
--save_total_limit 1 \
|
| 800 |
--load_best_model_at_end \
|
|
|
|
| 852 |
--logging_strategy steps \
|
| 853 |
--logging_steps 10 \
|
| 854 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 855 |
+
--evaluation_strategy steps \
|
| 856 |
--save_strategy steps \
|
| 857 |
--save_total_limit 1 \
|
| 858 |
--load_best_model_at_end \
|
root_gainlora/gen_script_superni_order1_llama_inflora.sh
CHANGED
|
@@ -41,7 +41,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 41 |
--logging_strategy steps \
|
| 42 |
--logging_steps 10 \
|
| 43 |
--metric_for_best_model eval_rougeL \
|
| 44 |
-
--eval_strategy steps \
|
| 45 |
--save_strategy steps \
|
| 46 |
--save_total_limit 1 \
|
| 47 |
--lora_r 4 \
|
|
@@ -97,7 +97,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 97 |
--logging_strategy steps \
|
| 98 |
--logging_steps 10 \
|
| 99 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 100 |
-
--eval_strategy steps \
|
| 101 |
--save_strategy steps \
|
| 102 |
--save_total_limit 1 \
|
| 103 |
--load_best_model_at_end \
|
|
@@ -154,7 +154,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 154 |
--logging_strategy steps \
|
| 155 |
--logging_steps 10 \
|
| 156 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 157 |
-
--eval_strategy steps \
|
| 158 |
--save_strategy steps \
|
| 159 |
--save_total_limit 1 \
|
| 160 |
--load_best_model_at_end \
|
|
@@ -211,7 +211,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 211 |
--logging_strategy steps \
|
| 212 |
--logging_steps 10 \
|
| 213 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 214 |
-
--eval_strategy steps \
|
| 215 |
--save_strategy steps \
|
| 216 |
--save_total_limit 1 \
|
| 217 |
--load_best_model_at_end \
|
|
@@ -268,7 +268,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 268 |
--logging_strategy steps \
|
| 269 |
--logging_steps 10 \
|
| 270 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 271 |
-
--eval_strategy steps \
|
| 272 |
--save_strategy steps \
|
| 273 |
--save_total_limit 1 \
|
| 274 |
--load_best_model_at_end \
|
|
@@ -325,7 +325,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 325 |
--logging_strategy steps \
|
| 326 |
--logging_steps 10 \
|
| 327 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 328 |
-
--eval_strategy steps \
|
| 329 |
--save_strategy steps \
|
| 330 |
--save_total_limit 1 \
|
| 331 |
--load_best_model_at_end \
|
|
@@ -382,7 +382,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 382 |
--logging_strategy steps \
|
| 383 |
--logging_steps 10 \
|
| 384 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 385 |
-
--eval_strategy steps \
|
| 386 |
--save_strategy steps \
|
| 387 |
--save_total_limit 1 \
|
| 388 |
--load_best_model_at_end \
|
|
@@ -439,7 +439,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 439 |
--logging_strategy steps \
|
| 440 |
--logging_steps 10 \
|
| 441 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 442 |
-
--eval_strategy steps \
|
| 443 |
--save_strategy steps \
|
| 444 |
--save_total_limit 1 \
|
| 445 |
--load_best_model_at_end \
|
|
@@ -496,7 +496,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 496 |
--logging_strategy steps \
|
| 497 |
--logging_steps 10 \
|
| 498 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 499 |
-
--eval_strategy steps \
|
| 500 |
--save_strategy steps \
|
| 501 |
--save_total_limit 1 \
|
| 502 |
--load_best_model_at_end \
|
|
@@ -553,7 +553,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 553 |
--logging_strategy steps \
|
| 554 |
--logging_steps 10 \
|
| 555 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 556 |
-
--eval_strategy steps \
|
| 557 |
--save_strategy steps \
|
| 558 |
--save_total_limit 1 \
|
| 559 |
--load_best_model_at_end \
|
|
@@ -610,7 +610,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 610 |
--logging_strategy steps \
|
| 611 |
--logging_steps 10 \
|
| 612 |
--metric_for_best_model eval_rougeL_for_task748_glucose_reverse_cause_event_detection \
|
| 613 |
-
--eval_strategy steps \
|
| 614 |
--save_strategy steps \
|
| 615 |
--save_total_limit 1 \
|
| 616 |
--load_best_model_at_end \
|
|
@@ -667,7 +667,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 667 |
--logging_strategy steps \
|
| 668 |
--logging_steps 10 \
|
| 669 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 670 |
-
--eval_strategy steps \
|
| 671 |
--save_strategy steps \
|
| 672 |
--save_total_limit 1 \
|
| 673 |
--load_best_model_at_end \
|
|
@@ -724,7 +724,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 724 |
--logging_strategy steps \
|
| 725 |
--logging_steps 10 \
|
| 726 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 727 |
-
--eval_strategy steps \
|
| 728 |
--save_strategy steps \
|
| 729 |
--save_total_limit 1 \
|
| 730 |
--load_best_model_at_end \
|
|
@@ -781,7 +781,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 781 |
--logging_strategy steps \
|
| 782 |
--logging_steps 10 \
|
| 783 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 784 |
-
--eval_strategy steps \
|
| 785 |
--save_strategy steps \
|
| 786 |
--save_total_limit 1 \
|
| 787 |
--load_best_model_at_end \
|
|
@@ -838,7 +838,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 838 |
--logging_strategy steps \
|
| 839 |
--logging_steps 10 \
|
| 840 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 841 |
-
--
|
| 842 |
--save_strategy steps \
|
| 843 |
--save_total_limit 1 \
|
| 844 |
--load_best_model_at_end \
|
|
|
|
| 41 |
--logging_strategy steps \
|
| 42 |
--logging_steps 10 \
|
| 43 |
--metric_for_best_model eval_rougeL \
|
| 44 |
+
--evaluation_strategy steps \
|
| 45 |
--save_strategy steps \
|
| 46 |
--save_total_limit 1 \
|
| 47 |
--lora_r 4 \
|
|
|
|
| 97 |
--logging_strategy steps \
|
| 98 |
--logging_steps 10 \
|
| 99 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 100 |
+
--evaluation_strategy steps \
|
| 101 |
--save_strategy steps \
|
| 102 |
--save_total_limit 1 \
|
| 103 |
--load_best_model_at_end \
|
|
|
|
| 154 |
--logging_strategy steps \
|
| 155 |
--logging_steps 10 \
|
| 156 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 157 |
+
--evaluation_strategy steps \
|
| 158 |
--save_strategy steps \
|
| 159 |
--save_total_limit 1 \
|
| 160 |
--load_best_model_at_end \
|
|
|
|
| 211 |
--logging_strategy steps \
|
| 212 |
--logging_steps 10 \
|
| 213 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 214 |
+
--evaluation_strategy steps \
|
| 215 |
--save_strategy steps \
|
| 216 |
--save_total_limit 1 \
|
| 217 |
--load_best_model_at_end \
|
|
|
|
| 268 |
--logging_strategy steps \
|
| 269 |
--logging_steps 10 \
|
| 270 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 271 |
+
--evaluation_strategy steps \
|
| 272 |
--save_strategy steps \
|
| 273 |
--save_total_limit 1 \
|
| 274 |
--load_best_model_at_end \
|
|
|
|
| 325 |
--logging_strategy steps \
|
| 326 |
--logging_steps 10 \
|
| 327 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 328 |
+
--evaluation_strategy steps \
|
| 329 |
--save_strategy steps \
|
| 330 |
--save_total_limit 1 \
|
| 331 |
--load_best_model_at_end \
|
|
|
|
| 382 |
--logging_strategy steps \
|
| 383 |
--logging_steps 10 \
|
| 384 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 385 |
+
--evaluation_strategy steps \
|
| 386 |
--save_strategy steps \
|
| 387 |
--save_total_limit 1 \
|
| 388 |
--load_best_model_at_end \
|
|
|
|
| 439 |
--logging_strategy steps \
|
| 440 |
--logging_steps 10 \
|
| 441 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 442 |
+
--evaluation_strategy steps \
|
| 443 |
--save_strategy steps \
|
| 444 |
--save_total_limit 1 \
|
| 445 |
--load_best_model_at_end \
|
|
|
|
| 496 |
--logging_strategy steps \
|
| 497 |
--logging_steps 10 \
|
| 498 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 499 |
+
--evaluation_strategy steps \
|
| 500 |
--save_strategy steps \
|
| 501 |
--save_total_limit 1 \
|
| 502 |
--load_best_model_at_end \
|
|
|
|
| 553 |
--logging_strategy steps \
|
| 554 |
--logging_steps 10 \
|
| 555 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 556 |
+
--evaluation_strategy steps \
|
| 557 |
--save_strategy steps \
|
| 558 |
--save_total_limit 1 \
|
| 559 |
--load_best_model_at_end \
|
|
|
|
| 610 |
--logging_strategy steps \
|
| 611 |
--logging_steps 10 \
|
| 612 |
--metric_for_best_model eval_rougeL_for_task748_glucose_reverse_cause_event_detection \
|
| 613 |
+
--evaluation_strategy steps \
|
| 614 |
--save_strategy steps \
|
| 615 |
--save_total_limit 1 \
|
| 616 |
--load_best_model_at_end \
|
|
|
|
| 667 |
--logging_strategy steps \
|
| 668 |
--logging_steps 10 \
|
| 669 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 670 |
+
--evaluation_strategy steps \
|
| 671 |
--save_strategy steps \
|
| 672 |
--save_total_limit 1 \
|
| 673 |
--load_best_model_at_end \
|
|
|
|
| 724 |
--logging_strategy steps \
|
| 725 |
--logging_steps 10 \
|
| 726 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 727 |
+
--evaluation_strategy steps \
|
| 728 |
--save_strategy steps \
|
| 729 |
--save_total_limit 1 \
|
| 730 |
--load_best_model_at_end \
|
|
|
|
| 781 |
--logging_strategy steps \
|
| 782 |
--logging_steps 10 \
|
| 783 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 784 |
+
--evaluation_strategy steps \
|
| 785 |
--save_strategy steps \
|
| 786 |
--save_total_limit 1 \
|
| 787 |
--load_best_model_at_end \
|
|
|
|
| 838 |
--logging_strategy steps \
|
| 839 |
--logging_steps 10 \
|
| 840 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 841 |
+
--evaluation_strategy steps \
|
| 842 |
--save_strategy steps \
|
| 843 |
--save_total_limit 1 \
|
| 844 |
--load_best_model_at_end \
|
root_gainlora/gen_script_superni_order1_llama_olora.sh
CHANGED
|
@@ -41,7 +41,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 41 |
--logging_strategy steps \
|
| 42 |
--logging_steps 10 \
|
| 43 |
--metric_for_best_model eval_rougeL \
|
| 44 |
-
--
|
| 45 |
--save_strategy steps \
|
| 46 |
--save_total_limit 1 \
|
| 47 |
--lora_r 4 \
|
|
@@ -96,7 +96,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 96 |
--logging_strategy steps \
|
| 97 |
--logging_steps 10 \
|
| 98 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 99 |
-
--
|
| 100 |
--save_strategy steps \
|
| 101 |
--save_total_limit 1 \
|
| 102 |
--load_best_model_at_end \
|
|
@@ -152,7 +152,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 152 |
--logging_strategy steps \
|
| 153 |
--logging_steps 10 \
|
| 154 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 155 |
-
--
|
| 156 |
--save_strategy steps \
|
| 157 |
--save_total_limit 1 \
|
| 158 |
--load_best_model_at_end \
|
|
@@ -208,7 +208,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 208 |
--logging_strategy steps \
|
| 209 |
--logging_steps 10 \
|
| 210 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 211 |
-
--
|
| 212 |
--save_strategy steps \
|
| 213 |
--save_total_limit 1 \
|
| 214 |
--load_best_model_at_end \
|
|
@@ -264,7 +264,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 264 |
--logging_strategy steps \
|
| 265 |
--logging_steps 10 \
|
| 266 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 267 |
-
--
|
| 268 |
--save_strategy steps \
|
| 269 |
--save_total_limit 1 \
|
| 270 |
--load_best_model_at_end \
|
|
@@ -320,7 +320,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 320 |
--logging_strategy steps \
|
| 321 |
--logging_steps 10 \
|
| 322 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 323 |
-
--
|
| 324 |
--save_strategy steps \
|
| 325 |
--save_total_limit 1 \
|
| 326 |
--load_best_model_at_end \
|
|
@@ -376,7 +376,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 376 |
--logging_strategy steps \
|
| 377 |
--logging_steps 10 \
|
| 378 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 379 |
-
--
|
| 380 |
--save_strategy steps \
|
| 381 |
--save_total_limit 1 \
|
| 382 |
--load_best_model_at_end \
|
|
@@ -432,7 +432,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 432 |
--logging_strategy steps \
|
| 433 |
--logging_steps 10 \
|
| 434 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 435 |
-
--
|
| 436 |
--save_strategy steps \
|
| 437 |
--save_total_limit 1 \
|
| 438 |
--load_best_model_at_end \
|
|
@@ -488,7 +488,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 488 |
--logging_strategy steps \
|
| 489 |
--logging_steps 10 \
|
| 490 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 491 |
-
--
|
| 492 |
--save_strategy steps \
|
| 493 |
--save_total_limit 1 \
|
| 494 |
--load_best_model_at_end \
|
|
@@ -544,7 +544,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 544 |
--logging_strategy steps \
|
| 545 |
--logging_steps 10 \
|
| 546 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 547 |
-
--
|
| 548 |
--save_strategy steps \
|
| 549 |
--save_total_limit 1 \
|
| 550 |
--load_best_model_at_end \
|
|
@@ -600,7 +600,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 600 |
--logging_strategy steps \
|
| 601 |
--logging_steps 10 \
|
| 602 |
--metric_for_best_model eval_rougeL_for_task748_glucose_reverse_cause_event_detection \
|
| 603 |
-
--
|
| 604 |
--save_strategy steps \
|
| 605 |
--save_total_limit 1 \
|
| 606 |
--load_best_model_at_end \
|
|
@@ -656,7 +656,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 656 |
--logging_strategy steps \
|
| 657 |
--logging_steps 10 \
|
| 658 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 659 |
-
--
|
| 660 |
--save_strategy steps \
|
| 661 |
--save_total_limit 1 \
|
| 662 |
--load_best_model_at_end \
|
|
@@ -712,7 +712,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 712 |
--logging_strategy steps \
|
| 713 |
--logging_steps 10 \
|
| 714 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 715 |
-
--
|
| 716 |
--save_strategy steps \
|
| 717 |
--save_total_limit 1 \
|
| 718 |
--load_best_model_at_end \
|
|
@@ -768,7 +768,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 768 |
--logging_strategy steps \
|
| 769 |
--logging_steps 10 \
|
| 770 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 771 |
-
--
|
| 772 |
--save_strategy steps \
|
| 773 |
--save_total_limit 1 \
|
| 774 |
--load_best_model_at_end \
|
|
@@ -824,7 +824,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 824 |
--logging_strategy steps \
|
| 825 |
--logging_steps 10 \
|
| 826 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 827 |
-
--
|
| 828 |
--save_strategy steps \
|
| 829 |
--save_total_limit 1 \
|
| 830 |
--load_best_model_at_end \
|
|
|
|
| 41 |
--logging_strategy steps \
|
| 42 |
--logging_steps 10 \
|
| 43 |
--metric_for_best_model eval_rougeL \
|
| 44 |
+
--evaluation_strategy steps \
|
| 45 |
--save_strategy steps \
|
| 46 |
--save_total_limit 1 \
|
| 47 |
--lora_r 4 \
|
|
|
|
| 96 |
--logging_strategy steps \
|
| 97 |
--logging_steps 10 \
|
| 98 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 99 |
+
--evaluation_strategy steps \
|
| 100 |
--save_strategy steps \
|
| 101 |
--save_total_limit 1 \
|
| 102 |
--load_best_model_at_end \
|
|
|
|
| 152 |
--logging_strategy steps \
|
| 153 |
--logging_steps 10 \
|
| 154 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 155 |
+
--evaluation_strategy steps \
|
| 156 |
--save_strategy steps \
|
| 157 |
--save_total_limit 1 \
|
| 158 |
--load_best_model_at_end \
|
|
|
|
| 208 |
--logging_strategy steps \
|
| 209 |
--logging_steps 10 \
|
| 210 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 211 |
+
--evaluation_strategy steps \
|
| 212 |
--save_strategy steps \
|
| 213 |
--save_total_limit 1 \
|
| 214 |
--load_best_model_at_end \
|
|
|
|
| 264 |
--logging_strategy steps \
|
| 265 |
--logging_steps 10 \
|
| 266 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 267 |
+
--evaluation_strategy steps \
|
| 268 |
--save_strategy steps \
|
| 269 |
--save_total_limit 1 \
|
| 270 |
--load_best_model_at_end \
|
|
|
|
| 320 |
--logging_strategy steps \
|
| 321 |
--logging_steps 10 \
|
| 322 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 323 |
+
--evaluation_strategy steps \
|
| 324 |
--save_strategy steps \
|
| 325 |
--save_total_limit 1 \
|
| 326 |
--load_best_model_at_end \
|
|
|
|
| 376 |
--logging_strategy steps \
|
| 377 |
--logging_steps 10 \
|
| 378 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 379 |
+
--evaluation_strategy steps \
|
| 380 |
--save_strategy steps \
|
| 381 |
--save_total_limit 1 \
|
| 382 |
--load_best_model_at_end \
|
|
|
|
| 432 |
--logging_strategy steps \
|
| 433 |
--logging_steps 10 \
|
| 434 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 435 |
+
--evaluation_strategy steps \
|
| 436 |
--save_strategy steps \
|
| 437 |
--save_total_limit 1 \
|
| 438 |
--load_best_model_at_end \
|
|
|
|
| 488 |
--logging_strategy steps \
|
| 489 |
--logging_steps 10 \
|
| 490 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 491 |
+
--evaluation_strategy steps \
|
| 492 |
--save_strategy steps \
|
| 493 |
--save_total_limit 1 \
|
| 494 |
--load_best_model_at_end \
|
|
|
|
| 544 |
--logging_strategy steps \
|
| 545 |
--logging_steps 10 \
|
| 546 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 547 |
+
--evaluation_strategy steps \
|
| 548 |
--save_strategy steps \
|
| 549 |
--save_total_limit 1 \
|
| 550 |
--load_best_model_at_end \
|
|
|
|
| 600 |
--logging_strategy steps \
|
| 601 |
--logging_steps 10 \
|
| 602 |
--metric_for_best_model eval_rougeL_for_task748_glucose_reverse_cause_event_detection \
|
| 603 |
+
--evaluation_strategy steps \
|
| 604 |
--save_strategy steps \
|
| 605 |
--save_total_limit 1 \
|
| 606 |
--load_best_model_at_end \
|
|
|
|
| 656 |
--logging_strategy steps \
|
| 657 |
--logging_steps 10 \
|
| 658 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 659 |
+
--evaluation_strategy steps \
|
| 660 |
--save_strategy steps \
|
| 661 |
--save_total_limit 1 \
|
| 662 |
--load_best_model_at_end \
|
|
|
|
| 712 |
--logging_strategy steps \
|
| 713 |
--logging_steps 10 \
|
| 714 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 715 |
+
--evaluation_strategy steps \
|
| 716 |
--save_strategy steps \
|
| 717 |
--save_total_limit 1 \
|
| 718 |
--load_best_model_at_end \
|
|
|
|
| 768 |
--logging_strategy steps \
|
| 769 |
--logging_steps 10 \
|
| 770 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 771 |
+
--evaluation_strategy steps \
|
| 772 |
--save_strategy steps \
|
| 773 |
--save_total_limit 1 \
|
| 774 |
--load_best_model_at_end \
|
|
|
|
| 824 |
--logging_strategy steps \
|
| 825 |
--logging_steps 10 \
|
| 826 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 827 |
+
--evaluation_strategy steps \
|
| 828 |
--save_strategy steps \
|
| 829 |
--save_total_limit 1 \
|
| 830 |
--load_best_model_at_end \
|
root_gainlora/gen_script_superni_order1_t5_gainlora_inflora.sh
CHANGED
|
@@ -38,7 +38,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 38 |
--logging_strategy steps \
|
| 39 |
--logging_steps 10 \
|
| 40 |
--metric_for_best_model eval_rougeL \
|
| 41 |
-
--
|
| 42 |
--save_strategy steps \
|
| 43 |
--save_total_limit 1 \
|
| 44 |
--lora_r 4 \
|
|
@@ -87,7 +87,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 87 |
--logging_strategy steps \
|
| 88 |
--logging_steps 10 \
|
| 89 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 90 |
-
--
|
| 91 |
--save_strategy steps \
|
| 92 |
--save_total_limit 1 \
|
| 93 |
--load_best_model_at_end \
|
|
@@ -136,7 +136,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 136 |
--logging_strategy steps \
|
| 137 |
--logging_steps 10 \
|
| 138 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 139 |
-
--
|
| 140 |
--save_strategy steps \
|
| 141 |
--save_total_limit 1 \
|
| 142 |
--load_best_model_at_end \
|
|
@@ -185,7 +185,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 185 |
--logging_strategy steps \
|
| 186 |
--logging_steps 10 \
|
| 187 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 188 |
-
--
|
| 189 |
--save_strategy steps \
|
| 190 |
--save_total_limit 1 \
|
| 191 |
--load_best_model_at_end \
|
|
@@ -234,7 +234,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 234 |
--logging_strategy steps \
|
| 235 |
--logging_steps 10 \
|
| 236 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 237 |
-
--
|
| 238 |
--save_strategy steps \
|
| 239 |
--save_total_limit 1 \
|
| 240 |
--load_best_model_at_end \
|
|
@@ -283,7 +283,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 283 |
--logging_strategy steps \
|
| 284 |
--logging_steps 10 \
|
| 285 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 286 |
-
--
|
| 287 |
--save_strategy steps \
|
| 288 |
--save_total_limit 1 \
|
| 289 |
--load_best_model_at_end \
|
|
@@ -332,7 +332,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 332 |
--logging_strategy steps \
|
| 333 |
--logging_steps 10 \
|
| 334 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 335 |
-
--
|
| 336 |
--save_strategy steps \
|
| 337 |
--save_total_limit 1 \
|
| 338 |
--load_best_model_at_end \
|
|
@@ -381,7 +381,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 381 |
--logging_strategy steps \
|
| 382 |
--logging_steps 10 \
|
| 383 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 384 |
-
--
|
| 385 |
--save_strategy steps \
|
| 386 |
--save_total_limit 1 \
|
| 387 |
--load_best_model_at_end \
|
|
@@ -430,7 +430,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 430 |
--logging_strategy steps \
|
| 431 |
--logging_steps 10 \
|
| 432 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 433 |
-
--
|
| 434 |
--save_strategy steps \
|
| 435 |
--save_total_limit 1 \
|
| 436 |
--load_best_model_at_end \
|
|
@@ -479,7 +479,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 479 |
--logging_strategy steps \
|
| 480 |
--logging_steps 10 \
|
| 481 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 482 |
-
--
|
| 483 |
--save_strategy steps \
|
| 484 |
--save_total_limit 1 \
|
| 485 |
--load_best_model_at_end \
|
|
@@ -528,7 +528,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 528 |
--logging_strategy steps \
|
| 529 |
--logging_steps 10 \
|
| 530 |
--metric_for_best_model eval_rougeL_for_task748_glucose_reverse_cause_event_detection \
|
| 531 |
-
--
|
| 532 |
--save_strategy steps \
|
| 533 |
--save_total_limit 1 \
|
| 534 |
--load_best_model_at_end \
|
|
@@ -577,7 +577,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 577 |
--logging_strategy steps \
|
| 578 |
--logging_steps 10 \
|
| 579 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 580 |
-
--
|
| 581 |
--save_strategy steps \
|
| 582 |
--save_total_limit 1 \
|
| 583 |
--load_best_model_at_end \
|
|
@@ -626,7 +626,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 626 |
--logging_strategy steps \
|
| 627 |
--logging_steps 10 \
|
| 628 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 629 |
-
--
|
| 630 |
--save_strategy steps \
|
| 631 |
--save_total_limit 1 \
|
| 632 |
--load_best_model_at_end \
|
|
@@ -675,7 +675,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 675 |
--logging_strategy steps \
|
| 676 |
--logging_steps 10 \
|
| 677 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 678 |
-
--
|
| 679 |
--save_strategy steps \
|
| 680 |
--save_total_limit 1 \
|
| 681 |
--load_best_model_at_end \
|
|
@@ -724,7 +724,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 724 |
--logging_strategy steps \
|
| 725 |
--logging_steps 10 \
|
| 726 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 727 |
-
--
|
| 728 |
--save_strategy steps \
|
| 729 |
--save_total_limit 1 \
|
| 730 |
--load_best_model_at_end \
|
|
|
|
| 38 |
--logging_strategy steps \
|
| 39 |
--logging_steps 10 \
|
| 40 |
--metric_for_best_model eval_rougeL \
|
| 41 |
+
--evaluation_strategy steps \
|
| 42 |
--save_strategy steps \
|
| 43 |
--save_total_limit 1 \
|
| 44 |
--lora_r 4 \
|
|
|
|
| 87 |
--logging_strategy steps \
|
| 88 |
--logging_steps 10 \
|
| 89 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 90 |
+
--evaluation_strategy steps \
|
| 91 |
--save_strategy steps \
|
| 92 |
--save_total_limit 1 \
|
| 93 |
--load_best_model_at_end \
|
|
|
|
| 136 |
--logging_strategy steps \
|
| 137 |
--logging_steps 10 \
|
| 138 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 139 |
+
--evaluation_strategy steps \
|
| 140 |
--save_strategy steps \
|
| 141 |
--save_total_limit 1 \
|
| 142 |
--load_best_model_at_end \
|
|
|
|
| 185 |
--logging_strategy steps \
|
| 186 |
--logging_steps 10 \
|
| 187 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 188 |
+
--evaluation_strategy steps \
|
| 189 |
--save_strategy steps \
|
| 190 |
--save_total_limit 1 \
|
| 191 |
--load_best_model_at_end \
|
|
|
|
| 234 |
--logging_strategy steps \
|
| 235 |
--logging_steps 10 \
|
| 236 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 237 |
+
--evaluation_strategy steps \
|
| 238 |
--save_strategy steps \
|
| 239 |
--save_total_limit 1 \
|
| 240 |
--load_best_model_at_end \
|
|
|
|
| 283 |
--logging_strategy steps \
|
| 284 |
--logging_steps 10 \
|
| 285 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 286 |
+
--evaluation_strategy steps \
|
| 287 |
--save_strategy steps \
|
| 288 |
--save_total_limit 1 \
|
| 289 |
--load_best_model_at_end \
|
|
|
|
| 332 |
--logging_strategy steps \
|
| 333 |
--logging_steps 10 \
|
| 334 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 335 |
+
--evaluation_strategy steps \
|
| 336 |
--save_strategy steps \
|
| 337 |
--save_total_limit 1 \
|
| 338 |
--load_best_model_at_end \
|
|
|
|
| 381 |
--logging_strategy steps \
|
| 382 |
--logging_steps 10 \
|
| 383 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 384 |
+
--evaluation_strategy steps \
|
| 385 |
--save_strategy steps \
|
| 386 |
--save_total_limit 1 \
|
| 387 |
--load_best_model_at_end \
|
|
|
|
| 430 |
--logging_strategy steps \
|
| 431 |
--logging_steps 10 \
|
| 432 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 433 |
+
--evaluation_strategy steps \
|
| 434 |
--save_strategy steps \
|
| 435 |
--save_total_limit 1 \
|
| 436 |
--load_best_model_at_end \
|
|
|
|
| 479 |
--logging_strategy steps \
|
| 480 |
--logging_steps 10 \
|
| 481 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 482 |
+
--evaluation_strategy steps \
|
| 483 |
--save_strategy steps \
|
| 484 |
--save_total_limit 1 \
|
| 485 |
--load_best_model_at_end \
|
|
|
|
| 528 |
--logging_strategy steps \
|
| 529 |
--logging_steps 10 \
|
| 530 |
--metric_for_best_model eval_rougeL_for_task748_glucose_reverse_cause_event_detection \
|
| 531 |
+
--evaluation_strategy steps \
|
| 532 |
--save_strategy steps \
|
| 533 |
--save_total_limit 1 \
|
| 534 |
--load_best_model_at_end \
|
|
|
|
| 577 |
--logging_strategy steps \
|
| 578 |
--logging_steps 10 \
|
| 579 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 580 |
+
--evaluation_strategy steps \
|
| 581 |
--save_strategy steps \
|
| 582 |
--save_total_limit 1 \
|
| 583 |
--load_best_model_at_end \
|
|
|
|
| 626 |
--logging_strategy steps \
|
| 627 |
--logging_steps 10 \
|
| 628 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 629 |
+
--evaluation_strategy steps \
|
| 630 |
--save_strategy steps \
|
| 631 |
--save_total_limit 1 \
|
| 632 |
--load_best_model_at_end \
|
|
|
|
| 675 |
--logging_strategy steps \
|
| 676 |
--logging_steps 10 \
|
| 677 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 678 |
+
--evaluation_strategy steps \
|
| 679 |
--save_strategy steps \
|
| 680 |
--save_total_limit 1 \
|
| 681 |
--load_best_model_at_end \
|
|
|
|
| 724 |
--logging_strategy steps \
|
| 725 |
--logging_steps 10 \
|
| 726 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 727 |
+
--evaluation_strategy steps \
|
| 728 |
--save_strategy steps \
|
| 729 |
--save_total_limit 1 \
|
| 730 |
--load_best_model_at_end \
|
root_gainlora/gen_script_superni_order1_t5_inflora.sh
CHANGED
|
@@ -38,7 +38,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 38 |
--logging_strategy steps \
|
| 39 |
--logging_steps 10 \
|
| 40 |
--metric_for_best_model eval_rougeL \
|
| 41 |
-
--
|
| 42 |
--save_strategy steps \
|
| 43 |
--save_total_limit 1 \
|
| 44 |
--lora_r 4 \
|
|
@@ -84,7 +84,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 84 |
--logging_strategy steps \
|
| 85 |
--logging_steps 10 \
|
| 86 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 87 |
-
--
|
| 88 |
--save_strategy steps \
|
| 89 |
--save_total_limit 1 \
|
| 90 |
--load_best_model_at_end \
|
|
@@ -131,7 +131,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 131 |
--logging_strategy steps \
|
| 132 |
--logging_steps 10 \
|
| 133 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 134 |
-
--
|
| 135 |
--save_strategy steps \
|
| 136 |
--save_total_limit 1 \
|
| 137 |
--load_best_model_at_end \
|
|
@@ -178,7 +178,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 178 |
--logging_strategy steps \
|
| 179 |
--logging_steps 10 \
|
| 180 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 181 |
-
--
|
| 182 |
--save_strategy steps \
|
| 183 |
--save_total_limit 1 \
|
| 184 |
--load_best_model_at_end \
|
|
@@ -225,7 +225,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 225 |
--logging_strategy steps \
|
| 226 |
--logging_steps 10 \
|
| 227 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 228 |
-
--
|
| 229 |
--save_strategy steps \
|
| 230 |
--save_total_limit 1 \
|
| 231 |
--load_best_model_at_end \
|
|
@@ -272,7 +272,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 272 |
--logging_strategy steps \
|
| 273 |
--logging_steps 10 \
|
| 274 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 275 |
-
--
|
| 276 |
--save_strategy steps \
|
| 277 |
--save_total_limit 1 \
|
| 278 |
--load_best_model_at_end \
|
|
@@ -319,7 +319,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 319 |
--logging_strategy steps \
|
| 320 |
--logging_steps 10 \
|
| 321 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 322 |
-
--
|
| 323 |
--save_strategy steps \
|
| 324 |
--save_total_limit 1 \
|
| 325 |
--load_best_model_at_end \
|
|
@@ -366,7 +366,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 366 |
--logging_strategy steps \
|
| 367 |
--logging_steps 10 \
|
| 368 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 369 |
-
--
|
| 370 |
--save_strategy steps \
|
| 371 |
--save_total_limit 1 \
|
| 372 |
--load_best_model_at_end \
|
|
@@ -413,7 +413,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 413 |
--logging_strategy steps \
|
| 414 |
--logging_steps 10 \
|
| 415 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 416 |
-
--
|
| 417 |
--save_strategy steps \
|
| 418 |
--save_total_limit 1 \
|
| 419 |
--load_best_model_at_end \
|
|
@@ -460,7 +460,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 460 |
--logging_strategy steps \
|
| 461 |
--logging_steps 10 \
|
| 462 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 463 |
-
--
|
| 464 |
--save_strategy steps \
|
| 465 |
--save_total_limit 1 \
|
| 466 |
--load_best_model_at_end \
|
|
@@ -507,7 +507,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 507 |
--logging_strategy steps \
|
| 508 |
--logging_steps 10 \
|
| 509 |
--metric_for_best_model eval_rougeL_for_task748_glucose_reverse_cause_event_detection \
|
| 510 |
-
--
|
| 511 |
--save_strategy steps \
|
| 512 |
--save_total_limit 1 \
|
| 513 |
--load_best_model_at_end \
|
|
@@ -554,7 +554,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 554 |
--logging_strategy steps \
|
| 555 |
--logging_steps 10 \
|
| 556 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 557 |
-
--
|
| 558 |
--save_strategy steps \
|
| 559 |
--save_total_limit 1 \
|
| 560 |
--load_best_model_at_end \
|
|
@@ -601,7 +601,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 601 |
--logging_strategy steps \
|
| 602 |
--logging_steps 10 \
|
| 603 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 604 |
-
--
|
| 605 |
--save_strategy steps \
|
| 606 |
--save_total_limit 1 \
|
| 607 |
--load_best_model_at_end \
|
|
@@ -648,7 +648,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 648 |
--logging_strategy steps \
|
| 649 |
--logging_steps 10 \
|
| 650 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 651 |
-
--
|
| 652 |
--save_strategy steps \
|
| 653 |
--save_total_limit 1 \
|
| 654 |
--load_best_model_at_end \
|
|
@@ -695,7 +695,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 695 |
--logging_strategy steps \
|
| 696 |
--logging_steps 10 \
|
| 697 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 698 |
-
--
|
| 699 |
--save_strategy steps \
|
| 700 |
--save_total_limit 1 \
|
| 701 |
--load_best_model_at_end \
|
|
|
|
| 38 |
--logging_strategy steps \
|
| 39 |
--logging_steps 10 \
|
| 40 |
--metric_for_best_model eval_rougeL \
|
| 41 |
+
--evaluation_strategy steps \
|
| 42 |
--save_strategy steps \
|
| 43 |
--save_total_limit 1 \
|
| 44 |
--lora_r 4 \
|
|
|
|
| 84 |
--logging_strategy steps \
|
| 85 |
--logging_steps 10 \
|
| 86 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 87 |
+
--evaluation_strategy steps \
|
| 88 |
--save_strategy steps \
|
| 89 |
--save_total_limit 1 \
|
| 90 |
--load_best_model_at_end \
|
|
|
|
| 131 |
--logging_strategy steps \
|
| 132 |
--logging_steps 10 \
|
| 133 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 134 |
+
--evaluation_strategy steps \
|
| 135 |
--save_strategy steps \
|
| 136 |
--save_total_limit 1 \
|
| 137 |
--load_best_model_at_end \
|
|
|
|
| 178 |
--logging_strategy steps \
|
| 179 |
--logging_steps 10 \
|
| 180 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 181 |
+
--evaluation_strategy steps \
|
| 182 |
--save_strategy steps \
|
| 183 |
--save_total_limit 1 \
|
| 184 |
--load_best_model_at_end \
|
|
|
|
| 225 |
--logging_strategy steps \
|
| 226 |
--logging_steps 10 \
|
| 227 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 228 |
+
--evaluation_strategy steps \
|
| 229 |
--save_strategy steps \
|
| 230 |
--save_total_limit 1 \
|
| 231 |
--load_best_model_at_end \
|
|
|
|
| 272 |
--logging_strategy steps \
|
| 273 |
--logging_steps 10 \
|
| 274 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 275 |
+
--evaluation_strategy steps \
|
| 276 |
--save_strategy steps \
|
| 277 |
--save_total_limit 1 \
|
| 278 |
--load_best_model_at_end \
|
|
|
|
| 319 |
--logging_strategy steps \
|
| 320 |
--logging_steps 10 \
|
| 321 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 322 |
+
--evaluation_strategy steps \
|
| 323 |
--save_strategy steps \
|
| 324 |
--save_total_limit 1 \
|
| 325 |
--load_best_model_at_end \
|
|
|
|
| 366 |
--logging_strategy steps \
|
| 367 |
--logging_steps 10 \
|
| 368 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 369 |
+
--evaluation_strategy steps \
|
| 370 |
--save_strategy steps \
|
| 371 |
--save_total_limit 1 \
|
| 372 |
--load_best_model_at_end \
|
|
|
|
| 413 |
--logging_strategy steps \
|
| 414 |
--logging_steps 10 \
|
| 415 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 416 |
+
--evaluation_strategy steps \
|
| 417 |
--save_strategy steps \
|
| 418 |
--save_total_limit 1 \
|
| 419 |
--load_best_model_at_end \
|
|
|
|
| 460 |
--logging_strategy steps \
|
| 461 |
--logging_steps 10 \
|
| 462 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 463 |
+
--evaluation_strategy steps \
|
| 464 |
--save_strategy steps \
|
| 465 |
--save_total_limit 1 \
|
| 466 |
--load_best_model_at_end \
|
|
|
|
| 507 |
--logging_strategy steps \
|
| 508 |
--logging_steps 10 \
|
| 509 |
--metric_for_best_model eval_rougeL_for_task748_glucose_reverse_cause_event_detection \
|
| 510 |
+
--evaluation_strategy steps \
|
| 511 |
--save_strategy steps \
|
| 512 |
--save_total_limit 1 \
|
| 513 |
--load_best_model_at_end \
|
|
|
|
| 554 |
--logging_strategy steps \
|
| 555 |
--logging_steps 10 \
|
| 556 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 557 |
+
--evaluation_strategy steps \
|
| 558 |
--save_strategy steps \
|
| 559 |
--save_total_limit 1 \
|
| 560 |
--load_best_model_at_end \
|
|
|
|
| 601 |
--logging_strategy steps \
|
| 602 |
--logging_steps 10 \
|
| 603 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 604 |
+
--evaluation_strategy steps \
|
| 605 |
--save_strategy steps \
|
| 606 |
--save_total_limit 1 \
|
| 607 |
--load_best_model_at_end \
|
|
|
|
| 648 |
--logging_strategy steps \
|
| 649 |
--logging_steps 10 \
|
| 650 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 651 |
+
--evaluation_strategy steps \
|
| 652 |
--save_strategy steps \
|
| 653 |
--save_total_limit 1 \
|
| 654 |
--load_best_model_at_end \
|
|
|
|
| 695 |
--logging_strategy steps \
|
| 696 |
--logging_steps 10 \
|
| 697 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 698 |
+
--evaluation_strategy steps \
|
| 699 |
--save_strategy steps \
|
| 700 |
--save_total_limit 1 \
|
| 701 |
--load_best_model_at_end \
|
root_gainlora/gen_script_superni_order2_llama_gainlora_inflora.sh
CHANGED
|
@@ -41,7 +41,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 41 |
--logging_strategy steps \
|
| 42 |
--logging_steps 10 \
|
| 43 |
--metric_for_best_model eval_rougeL \
|
| 44 |
-
--
|
| 45 |
--save_strategy steps \
|
| 46 |
--save_total_limit 1 \
|
| 47 |
--lora_r 4 \
|
|
@@ -98,7 +98,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 98 |
--logging_strategy steps \
|
| 99 |
--logging_steps 10 \
|
| 100 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 101 |
-
--
|
| 102 |
--save_strategy steps \
|
| 103 |
--save_total_limit 1 \
|
| 104 |
--load_best_model_at_end \
|
|
@@ -156,7 +156,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 156 |
--logging_strategy steps \
|
| 157 |
--logging_steps 10 \
|
| 158 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 159 |
-
--
|
| 160 |
--save_strategy steps \
|
| 161 |
--save_total_limit 1 \
|
| 162 |
--load_best_model_at_end \
|
|
@@ -214,7 +214,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 214 |
--logging_strategy steps \
|
| 215 |
--logging_steps 10 \
|
| 216 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 217 |
-
--
|
| 218 |
--save_strategy steps \
|
| 219 |
--save_total_limit 1 \
|
| 220 |
--load_best_model_at_end \
|
|
@@ -272,7 +272,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 272 |
--logging_strategy steps \
|
| 273 |
--logging_steps 10 \
|
| 274 |
--metric_for_best_model eval_rougeL_for_task1572_samsum_summary \
|
| 275 |
-
--
|
| 276 |
--save_strategy steps \
|
| 277 |
--save_total_limit 1 \
|
| 278 |
--load_best_model_at_end \
|
|
@@ -330,7 +330,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 330 |
--logging_strategy steps \
|
| 331 |
--logging_steps 10 \
|
| 332 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 333 |
-
--
|
| 334 |
--save_strategy steps \
|
| 335 |
--save_total_limit 1 \
|
| 336 |
--load_best_model_at_end \
|
|
@@ -388,7 +388,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 388 |
--logging_strategy steps \
|
| 389 |
--logging_steps 10 \
|
| 390 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 391 |
-
--
|
| 392 |
--save_strategy steps \
|
| 393 |
--save_total_limit 1 \
|
| 394 |
--load_best_model_at_end \
|
|
@@ -446,7 +446,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 446 |
--logging_strategy steps \
|
| 447 |
--logging_steps 10 \
|
| 448 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 449 |
-
--
|
| 450 |
--save_strategy steps \
|
| 451 |
--save_total_limit 1 \
|
| 452 |
--load_best_model_at_end \
|
|
@@ -504,7 +504,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 504 |
--logging_strategy steps \
|
| 505 |
--logging_steps 10 \
|
| 506 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 507 |
-
--
|
| 508 |
--save_strategy steps \
|
| 509 |
--save_total_limit 1 \
|
| 510 |
--load_best_model_at_end \
|
|
@@ -562,7 +562,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 562 |
--logging_strategy steps \
|
| 563 |
--logging_steps 10 \
|
| 564 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 565 |
-
--
|
| 566 |
--save_strategy steps \
|
| 567 |
--save_total_limit 1 \
|
| 568 |
--load_best_model_at_end \
|
|
@@ -620,7 +620,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 620 |
--logging_strategy steps \
|
| 621 |
--logging_steps 10 \
|
| 622 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 623 |
-
--
|
| 624 |
--save_strategy steps \
|
| 625 |
--save_total_limit 1 \
|
| 626 |
--load_best_model_at_end \
|
|
@@ -678,7 +678,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 678 |
--logging_strategy steps \
|
| 679 |
--logging_steps 10 \
|
| 680 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 681 |
-
--
|
| 682 |
--save_strategy steps \
|
| 683 |
--save_total_limit 1 \
|
| 684 |
--load_best_model_at_end \
|
|
@@ -736,7 +736,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 736 |
--logging_strategy steps \
|
| 737 |
--logging_steps 10 \
|
| 738 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 739 |
-
--
|
| 740 |
--save_strategy steps \
|
| 741 |
--save_total_limit 1 \
|
| 742 |
--load_best_model_at_end \
|
|
@@ -794,7 +794,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 794 |
--logging_strategy steps \
|
| 795 |
--logging_steps 10 \
|
| 796 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 797 |
-
--
|
| 798 |
--save_strategy steps \
|
| 799 |
--save_total_limit 1 \
|
| 800 |
--load_best_model_at_end \
|
|
@@ -852,7 +852,7 @@ deepspeed --include localhost:${1} --master_port 19500 src/run_llama.py \
|
|
| 852 |
--logging_strategy steps \
|
| 853 |
--logging_steps 10 \
|
| 854 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 855 |
-
--
|
| 856 |
--save_strategy steps \
|
| 857 |
--save_total_limit 1 \
|
| 858 |
--load_best_model_at_end \
|
|
|
|
| 41 |
--logging_strategy steps \
|
| 42 |
--logging_steps 10 \
|
| 43 |
--metric_for_best_model eval_rougeL \
|
| 44 |
+
--evaluation_strategy steps \
|
| 45 |
--save_strategy steps \
|
| 46 |
--save_total_limit 1 \
|
| 47 |
--lora_r 4 \
|
|
|
|
| 98 |
--logging_strategy steps \
|
| 99 |
--logging_steps 10 \
|
| 100 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 101 |
+
--evaluation_strategy steps \
|
| 102 |
--save_strategy steps \
|
| 103 |
--save_total_limit 1 \
|
| 104 |
--load_best_model_at_end \
|
|
|
|
| 156 |
--logging_strategy steps \
|
| 157 |
--logging_steps 10 \
|
| 158 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 159 |
+
--evaluation_strategy steps \
|
| 160 |
--save_strategy steps \
|
| 161 |
--save_total_limit 1 \
|
| 162 |
--load_best_model_at_end \
|
|
|
|
| 214 |
--logging_strategy steps \
|
| 215 |
--logging_steps 10 \
|
| 216 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 217 |
+
--evaluation_strategy steps \
|
| 218 |
--save_strategy steps \
|
| 219 |
--save_total_limit 1 \
|
| 220 |
--load_best_model_at_end \
|
|
|
|
| 272 |
--logging_strategy steps \
|
| 273 |
--logging_steps 10 \
|
| 274 |
--metric_for_best_model eval_rougeL_for_task1572_samsum_summary \
|
| 275 |
+
--evaluation_strategy steps \
|
| 276 |
--save_strategy steps \
|
| 277 |
--save_total_limit 1 \
|
| 278 |
--load_best_model_at_end \
|
|
|
|
| 330 |
--logging_strategy steps \
|
| 331 |
--logging_steps 10 \
|
| 332 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 333 |
+
--evaluation_strategy steps \
|
| 334 |
--save_strategy steps \
|
| 335 |
--save_total_limit 1 \
|
| 336 |
--load_best_model_at_end \
|
|
|
|
| 388 |
--logging_strategy steps \
|
| 389 |
--logging_steps 10 \
|
| 390 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 391 |
+
--evaluation_strategy steps \
|
| 392 |
--save_strategy steps \
|
| 393 |
--save_total_limit 1 \
|
| 394 |
--load_best_model_at_end \
|
|
|
|
| 446 |
--logging_strategy steps \
|
| 447 |
--logging_steps 10 \
|
| 448 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 449 |
+
--evaluation_strategy steps \
|
| 450 |
--save_strategy steps \
|
| 451 |
--save_total_limit 1 \
|
| 452 |
--load_best_model_at_end \
|
|
|
|
| 504 |
--logging_strategy steps \
|
| 505 |
--logging_steps 10 \
|
| 506 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 507 |
+
--evaluation_strategy steps \
|
| 508 |
--save_strategy steps \
|
| 509 |
--save_total_limit 1 \
|
| 510 |
--load_best_model_at_end \
|
|
|
|
| 562 |
--logging_strategy steps \
|
| 563 |
--logging_steps 10 \
|
| 564 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 565 |
+
--evaluation_strategy steps \
|
| 566 |
--save_strategy steps \
|
| 567 |
--save_total_limit 1 \
|
| 568 |
--load_best_model_at_end \
|
|
|
|
| 620 |
--logging_strategy steps \
|
| 621 |
--logging_steps 10 \
|
| 622 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 623 |
+
--evaluation_strategy steps \
|
| 624 |
--save_strategy steps \
|
| 625 |
--save_total_limit 1 \
|
| 626 |
--load_best_model_at_end \
|
|
|
|
| 678 |
--logging_strategy steps \
|
| 679 |
--logging_steps 10 \
|
| 680 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 681 |
+
--evaluation_strategy steps \
|
| 682 |
--save_strategy steps \
|
| 683 |
--save_total_limit 1 \
|
| 684 |
--load_best_model_at_end \
|
|
|
|
| 736 |
--logging_strategy steps \
|
| 737 |
--logging_steps 10 \
|
| 738 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 739 |
+
--evaluation_strategy steps \
|
| 740 |
--save_strategy steps \
|
| 741 |
--save_total_limit 1 \
|
| 742 |
--load_best_model_at_end \
|
|
|
|
| 794 |
--logging_strategy steps \
|
| 795 |
--logging_steps 10 \
|
| 796 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 797 |
+
--evaluation_strategy steps \
|
| 798 |
--save_strategy steps \
|
| 799 |
--save_total_limit 1 \
|
| 800 |
--load_best_model_at_end \
|
|
|
|
| 852 |
--logging_strategy steps \
|
| 853 |
--logging_steps 10 \
|
| 854 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 855 |
+
--evaluation_strategy steps \
|
| 856 |
--save_strategy steps \
|
| 857 |
--save_total_limit 1 \
|
| 858 |
--load_best_model_at_end \
|
root_gainlora/gen_script_superni_order2_llama_gainlora_olora.sh
CHANGED
|
@@ -41,7 +41,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 41 |
--logging_strategy steps \
|
| 42 |
--logging_steps 10 \
|
| 43 |
--metric_for_best_model eval_rougeL \
|
| 44 |
-
--
|
| 45 |
--save_strategy steps \
|
| 46 |
--save_total_limit 1 \
|
| 47 |
--lora_r 4 \
|
|
@@ -99,7 +99,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 99 |
--logging_strategy steps \
|
| 100 |
--logging_steps 10 \
|
| 101 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 102 |
-
--
|
| 103 |
--save_strategy steps \
|
| 104 |
--save_total_limit 1 \
|
| 105 |
--load_best_model_at_end \
|
|
@@ -158,7 +158,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 158 |
--logging_strategy steps \
|
| 159 |
--logging_steps 10 \
|
| 160 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 161 |
-
--
|
| 162 |
--save_strategy steps \
|
| 163 |
--save_total_limit 1 \
|
| 164 |
--load_best_model_at_end \
|
|
@@ -217,7 +217,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 217 |
--logging_strategy steps \
|
| 218 |
--logging_steps 10 \
|
| 219 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 220 |
-
--
|
| 221 |
--save_strategy steps \
|
| 222 |
--save_total_limit 1 \
|
| 223 |
--load_best_model_at_end \
|
|
@@ -276,7 +276,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 276 |
--logging_strategy steps \
|
| 277 |
--logging_steps 10 \
|
| 278 |
--metric_for_best_model eval_rougeL_for_task1572_samsum_summary \
|
| 279 |
-
--
|
| 280 |
--save_strategy steps \
|
| 281 |
--save_total_limit 1 \
|
| 282 |
--load_best_model_at_end \
|
|
@@ -335,7 +335,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 335 |
--logging_strategy steps \
|
| 336 |
--logging_steps 10 \
|
| 337 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 338 |
-
--
|
| 339 |
--save_strategy steps \
|
| 340 |
--save_total_limit 1 \
|
| 341 |
--load_best_model_at_end \
|
|
@@ -394,7 +394,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 394 |
--logging_strategy steps \
|
| 395 |
--logging_steps 10 \
|
| 396 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 397 |
-
--
|
| 398 |
--save_strategy steps \
|
| 399 |
--save_total_limit 1 \
|
| 400 |
--load_best_model_at_end \
|
|
@@ -453,7 +453,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 453 |
--logging_strategy steps \
|
| 454 |
--logging_steps 10 \
|
| 455 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 456 |
-
--
|
| 457 |
--save_strategy steps \
|
| 458 |
--save_total_limit 1 \
|
| 459 |
--load_best_model_at_end \
|
|
@@ -512,7 +512,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 512 |
--logging_strategy steps \
|
| 513 |
--logging_steps 10 \
|
| 514 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 515 |
-
--
|
| 516 |
--save_strategy steps \
|
| 517 |
--save_total_limit 1 \
|
| 518 |
--load_best_model_at_end \
|
|
@@ -571,7 +571,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 571 |
--logging_strategy steps \
|
| 572 |
--logging_steps 10 \
|
| 573 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 574 |
-
--
|
| 575 |
--save_strategy steps \
|
| 576 |
--save_total_limit 1 \
|
| 577 |
--load_best_model_at_end \
|
|
@@ -630,7 +630,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 630 |
--logging_strategy steps \
|
| 631 |
--logging_steps 10 \
|
| 632 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 633 |
-
--
|
| 634 |
--save_strategy steps \
|
| 635 |
--save_total_limit 1 \
|
| 636 |
--load_best_model_at_end \
|
|
@@ -689,7 +689,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 689 |
--logging_strategy steps \
|
| 690 |
--logging_steps 10 \
|
| 691 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 692 |
-
--
|
| 693 |
--save_strategy steps \
|
| 694 |
--save_total_limit 1 \
|
| 695 |
--load_best_model_at_end \
|
|
@@ -748,7 +748,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 748 |
--logging_strategy steps \
|
| 749 |
--logging_steps 10 \
|
| 750 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 751 |
-
--
|
| 752 |
--save_strategy steps \
|
| 753 |
--save_total_limit 1 \
|
| 754 |
--load_best_model_at_end \
|
|
@@ -807,7 +807,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 807 |
--logging_strategy steps \
|
| 808 |
--logging_steps 10 \
|
| 809 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 810 |
-
--
|
| 811 |
--save_strategy steps \
|
| 812 |
--save_total_limit 1 \
|
| 813 |
--load_best_model_at_end \
|
|
@@ -866,7 +866,7 @@ deepspeed --include localhost:${1} --master_port 39500 src/run_llama.py \
|
|
| 866 |
--logging_strategy steps \
|
| 867 |
--logging_steps 10 \
|
| 868 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 869 |
-
--
|
| 870 |
--save_strategy steps \
|
| 871 |
--save_total_limit 1 \
|
| 872 |
--load_best_model_at_end \
|
|
|
|
| 41 |
--logging_strategy steps \
|
| 42 |
--logging_steps 10 \
|
| 43 |
--metric_for_best_model eval_rougeL \
|
| 44 |
+
--evaluation_strategy steps \
|
| 45 |
--save_strategy steps \
|
| 46 |
--save_total_limit 1 \
|
| 47 |
--lora_r 4 \
|
|
|
|
| 99 |
--logging_strategy steps \
|
| 100 |
--logging_steps 10 \
|
| 101 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 102 |
+
--evaluation_strategy steps \
|
| 103 |
--save_strategy steps \
|
| 104 |
--save_total_limit 1 \
|
| 105 |
--load_best_model_at_end \
|
|
|
|
| 158 |
--logging_strategy steps \
|
| 159 |
--logging_steps 10 \
|
| 160 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 161 |
+
--evaluation_strategy steps \
|
| 162 |
--save_strategy steps \
|
| 163 |
--save_total_limit 1 \
|
| 164 |
--load_best_model_at_end \
|
|
|
|
| 217 |
--logging_strategy steps \
|
| 218 |
--logging_steps 10 \
|
| 219 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 220 |
+
--evaluation_strategy steps \
|
| 221 |
--save_strategy steps \
|
| 222 |
--save_total_limit 1 \
|
| 223 |
--load_best_model_at_end \
|
|
|
|
| 276 |
--logging_strategy steps \
|
| 277 |
--logging_steps 10 \
|
| 278 |
--metric_for_best_model eval_rougeL_for_task1572_samsum_summary \
|
| 279 |
+
--evaluation_strategy steps \
|
| 280 |
--save_strategy steps \
|
| 281 |
--save_total_limit 1 \
|
| 282 |
--load_best_model_at_end \
|
|
|
|
| 335 |
--logging_strategy steps \
|
| 336 |
--logging_steps 10 \
|
| 337 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 338 |
+
--evaluation_strategy steps \
|
| 339 |
--save_strategy steps \
|
| 340 |
--save_total_limit 1 \
|
| 341 |
--load_best_model_at_end \
|
|
|
|
| 394 |
--logging_strategy steps \
|
| 395 |
--logging_steps 10 \
|
| 396 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 397 |
+
--evaluation_strategy steps \
|
| 398 |
--save_strategy steps \
|
| 399 |
--save_total_limit 1 \
|
| 400 |
--load_best_model_at_end \
|
|
|
|
| 453 |
--logging_strategy steps \
|
| 454 |
--logging_steps 10 \
|
| 455 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 456 |
+
--evaluation_strategy steps \
|
| 457 |
--save_strategy steps \
|
| 458 |
--save_total_limit 1 \
|
| 459 |
--load_best_model_at_end \
|
|
|
|
| 512 |
--logging_strategy steps \
|
| 513 |
--logging_steps 10 \
|
| 514 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 515 |
+
--evaluation_strategy steps \
|
| 516 |
--save_strategy steps \
|
| 517 |
--save_total_limit 1 \
|
| 518 |
--load_best_model_at_end \
|
|
|
|
| 571 |
--logging_strategy steps \
|
| 572 |
--logging_steps 10 \
|
| 573 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 574 |
+
--evaluation_strategy steps \
|
| 575 |
--save_strategy steps \
|
| 576 |
--save_total_limit 1 \
|
| 577 |
--load_best_model_at_end \
|
|
|
|
| 630 |
--logging_strategy steps \
|
| 631 |
--logging_steps 10 \
|
| 632 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 633 |
+
--evaluation_strategy steps \
|
| 634 |
--save_strategy steps \
|
| 635 |
--save_total_limit 1 \
|
| 636 |
--load_best_model_at_end \
|
|
|
|
| 689 |
--logging_strategy steps \
|
| 690 |
--logging_steps 10 \
|
| 691 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 692 |
+
--evaluation_strategy steps \
|
| 693 |
--save_strategy steps \
|
| 694 |
--save_total_limit 1 \
|
| 695 |
--load_best_model_at_end \
|
|
|
|
| 748 |
--logging_strategy steps \
|
| 749 |
--logging_steps 10 \
|
| 750 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 751 |
+
--evaluation_strategy steps \
|
| 752 |
--save_strategy steps \
|
| 753 |
--save_total_limit 1 \
|
| 754 |
--load_best_model_at_end \
|
|
|
|
| 807 |
--logging_strategy steps \
|
| 808 |
--logging_steps 10 \
|
| 809 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 810 |
+
--evaluation_strategy steps \
|
| 811 |
--save_strategy steps \
|
| 812 |
--save_total_limit 1 \
|
| 813 |
--load_best_model_at_end \
|
|
|
|
| 866 |
--logging_strategy steps \
|
| 867 |
--logging_steps 10 \
|
| 868 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 869 |
+
--evaluation_strategy steps \
|
| 870 |
--save_strategy steps \
|
| 871 |
--save_total_limit 1 \
|
| 872 |
--load_best_model_at_end \
|
root_gainlora/gen_script_superni_order2_llama_inflora.sh
CHANGED
|
@@ -41,7 +41,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 41 |
--logging_strategy steps \
|
| 42 |
--logging_steps 10 \
|
| 43 |
--metric_for_best_model eval_rougeL \
|
| 44 |
-
--
|
| 45 |
--save_strategy steps \
|
| 46 |
--save_total_limit 1 \
|
| 47 |
--lora_r 4 \
|
|
@@ -97,7 +97,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 97 |
--logging_strategy steps \
|
| 98 |
--logging_steps 10 \
|
| 99 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 100 |
-
--
|
| 101 |
--save_strategy steps \
|
| 102 |
--save_total_limit 1 \
|
| 103 |
--load_best_model_at_end \
|
|
@@ -154,7 +154,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 154 |
--logging_strategy steps \
|
| 155 |
--logging_steps 10 \
|
| 156 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 157 |
-
--
|
| 158 |
--save_strategy steps \
|
| 159 |
--save_total_limit 1 \
|
| 160 |
--load_best_model_at_end \
|
|
@@ -211,7 +211,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 211 |
--logging_strategy steps \
|
| 212 |
--logging_steps 10 \
|
| 213 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 214 |
-
--
|
| 215 |
--save_strategy steps \
|
| 216 |
--save_total_limit 1 \
|
| 217 |
--load_best_model_at_end \
|
|
@@ -268,7 +268,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 268 |
--logging_strategy steps \
|
| 269 |
--logging_steps 10 \
|
| 270 |
--metric_for_best_model eval_rougeL_for_task1572_samsum_summary \
|
| 271 |
-
--
|
| 272 |
--save_strategy steps \
|
| 273 |
--save_total_limit 1 \
|
| 274 |
--load_best_model_at_end \
|
|
@@ -325,7 +325,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 325 |
--logging_strategy steps \
|
| 326 |
--logging_steps 10 \
|
| 327 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 328 |
-
--
|
| 329 |
--save_strategy steps \
|
| 330 |
--save_total_limit 1 \
|
| 331 |
--load_best_model_at_end \
|
|
@@ -382,7 +382,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 382 |
--logging_strategy steps \
|
| 383 |
--logging_steps 10 \
|
| 384 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 385 |
-
--
|
| 386 |
--save_strategy steps \
|
| 387 |
--save_total_limit 1 \
|
| 388 |
--load_best_model_at_end \
|
|
@@ -439,7 +439,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 439 |
--logging_strategy steps \
|
| 440 |
--logging_steps 10 \
|
| 441 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 442 |
-
--
|
| 443 |
--save_strategy steps \
|
| 444 |
--save_total_limit 1 \
|
| 445 |
--load_best_model_at_end \
|
|
@@ -496,7 +496,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 496 |
--logging_strategy steps \
|
| 497 |
--logging_steps 10 \
|
| 498 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 499 |
-
--
|
| 500 |
--save_strategy steps \
|
| 501 |
--save_total_limit 1 \
|
| 502 |
--load_best_model_at_end \
|
|
@@ -553,7 +553,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 553 |
--logging_strategy steps \
|
| 554 |
--logging_steps 10 \
|
| 555 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 556 |
-
--
|
| 557 |
--save_strategy steps \
|
| 558 |
--save_total_limit 1 \
|
| 559 |
--load_best_model_at_end \
|
|
@@ -610,7 +610,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 610 |
--logging_strategy steps \
|
| 611 |
--logging_steps 10 \
|
| 612 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 613 |
-
--
|
| 614 |
--save_strategy steps \
|
| 615 |
--save_total_limit 1 \
|
| 616 |
--load_best_model_at_end \
|
|
@@ -667,7 +667,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 667 |
--logging_strategy steps \
|
| 668 |
--logging_steps 10 \
|
| 669 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 670 |
-
--
|
| 671 |
--save_strategy steps \
|
| 672 |
--save_total_limit 1 \
|
| 673 |
--load_best_model_at_end \
|
|
@@ -724,7 +724,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 724 |
--logging_strategy steps \
|
| 725 |
--logging_steps 10 \
|
| 726 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 727 |
-
--
|
| 728 |
--save_strategy steps \
|
| 729 |
--save_total_limit 1 \
|
| 730 |
--load_best_model_at_end \
|
|
@@ -781,7 +781,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 781 |
--logging_strategy steps \
|
| 782 |
--logging_steps 10 \
|
| 783 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 784 |
-
--
|
| 785 |
--save_strategy steps \
|
| 786 |
--save_total_limit 1 \
|
| 787 |
--load_best_model_at_end \
|
|
@@ -838,7 +838,7 @@ deepspeed --include localhost:${1} --master_port 9500 src/run_llama.py \
|
|
| 838 |
--logging_strategy steps \
|
| 839 |
--logging_steps 10 \
|
| 840 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 841 |
-
--
|
| 842 |
--save_strategy steps \
|
| 843 |
--save_total_limit 1 \
|
| 844 |
--load_best_model_at_end \
|
|
|
|
| 41 |
--logging_strategy steps \
|
| 42 |
--logging_steps 10 \
|
| 43 |
--metric_for_best_model eval_rougeL \
|
| 44 |
+
--evaluation_strategy steps \
|
| 45 |
--save_strategy steps \
|
| 46 |
--save_total_limit 1 \
|
| 47 |
--lora_r 4 \
|
|
|
|
| 97 |
--logging_strategy steps \
|
| 98 |
--logging_steps 10 \
|
| 99 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 100 |
+
--evaluation_strategy steps \
|
| 101 |
--save_strategy steps \
|
| 102 |
--save_total_limit 1 \
|
| 103 |
--load_best_model_at_end \
|
|
|
|
| 154 |
--logging_strategy steps \
|
| 155 |
--logging_steps 10 \
|
| 156 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 157 |
+
--evaluation_strategy steps \
|
| 158 |
--save_strategy steps \
|
| 159 |
--save_total_limit 1 \
|
| 160 |
--load_best_model_at_end \
|
|
|
|
| 211 |
--logging_strategy steps \
|
| 212 |
--logging_steps 10 \
|
| 213 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 214 |
+
--evaluation_strategy steps \
|
| 215 |
--save_strategy steps \
|
| 216 |
--save_total_limit 1 \
|
| 217 |
--load_best_model_at_end \
|
|
|
|
| 268 |
--logging_strategy steps \
|
| 269 |
--logging_steps 10 \
|
| 270 |
--metric_for_best_model eval_rougeL_for_task1572_samsum_summary \
|
| 271 |
+
--evaluation_strategy steps \
|
| 272 |
--save_strategy steps \
|
| 273 |
--save_total_limit 1 \
|
| 274 |
--load_best_model_at_end \
|
|
|
|
| 325 |
--logging_strategy steps \
|
| 326 |
--logging_steps 10 \
|
| 327 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 328 |
+
--evaluation_strategy steps \
|
| 329 |
--save_strategy steps \
|
| 330 |
--save_total_limit 1 \
|
| 331 |
--load_best_model_at_end \
|
|
|
|
| 382 |
--logging_strategy steps \
|
| 383 |
--logging_steps 10 \
|
| 384 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 385 |
+
--evaluation_strategy steps \
|
| 386 |
--save_strategy steps \
|
| 387 |
--save_total_limit 1 \
|
| 388 |
--load_best_model_at_end \
|
|
|
|
| 439 |
--logging_strategy steps \
|
| 440 |
--logging_steps 10 \
|
| 441 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 442 |
+
--evaluation_strategy steps \
|
| 443 |
--save_strategy steps \
|
| 444 |
--save_total_limit 1 \
|
| 445 |
--load_best_model_at_end \
|
|
|
|
| 496 |
--logging_strategy steps \
|
| 497 |
--logging_steps 10 \
|
| 498 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 499 |
+
--evaluation_strategy steps \
|
| 500 |
--save_strategy steps \
|
| 501 |
--save_total_limit 1 \
|
| 502 |
--load_best_model_at_end \
|
|
|
|
| 553 |
--logging_strategy steps \
|
| 554 |
--logging_steps 10 \
|
| 555 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 556 |
+
--evaluation_strategy steps \
|
| 557 |
--save_strategy steps \
|
| 558 |
--save_total_limit 1 \
|
| 559 |
--load_best_model_at_end \
|
|
|
|
| 610 |
--logging_strategy steps \
|
| 611 |
--logging_steps 10 \
|
| 612 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 613 |
+
--evaluation_strategy steps \
|
| 614 |
--save_strategy steps \
|
| 615 |
--save_total_limit 1 \
|
| 616 |
--load_best_model_at_end \
|
|
|
|
| 667 |
--logging_strategy steps \
|
| 668 |
--logging_steps 10 \
|
| 669 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 670 |
+
--evaluation_strategy steps \
|
| 671 |
--save_strategy steps \
|
| 672 |
--save_total_limit 1 \
|
| 673 |
--load_best_model_at_end \
|
|
|
|
| 724 |
--logging_strategy steps \
|
| 725 |
--logging_steps 10 \
|
| 726 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 727 |
+
--evaluation_strategy steps \
|
| 728 |
--save_strategy steps \
|
| 729 |
--save_total_limit 1 \
|
| 730 |
--load_best_model_at_end \
|
|
|
|
| 781 |
--logging_strategy steps \
|
| 782 |
--logging_steps 10 \
|
| 783 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 784 |
+
--evaluation_strategy steps \
|
| 785 |
--save_strategy steps \
|
| 786 |
--save_total_limit 1 \
|
| 787 |
--load_best_model_at_end \
|
|
|
|
| 838 |
--logging_strategy steps \
|
| 839 |
--logging_steps 10 \
|
| 840 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 841 |
+
--evaluation_strategy steps \
|
| 842 |
--save_strategy steps \
|
| 843 |
--save_total_limit 1 \
|
| 844 |
--load_best_model_at_end \
|
root_gainlora/gen_script_superni_order2_llama_olora.sh
CHANGED
|
@@ -41,7 +41,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 41 |
--logging_strategy steps \
|
| 42 |
--logging_steps 10 \
|
| 43 |
--metric_for_best_model eval_rougeL \
|
| 44 |
-
--
|
| 45 |
--save_strategy steps \
|
| 46 |
--save_total_limit 1 \
|
| 47 |
--lora_r 4 \
|
|
@@ -96,7 +96,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 96 |
--logging_strategy steps \
|
| 97 |
--logging_steps 10 \
|
| 98 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 99 |
-
--
|
| 100 |
--save_strategy steps \
|
| 101 |
--save_total_limit 1 \
|
| 102 |
--load_best_model_at_end \
|
|
@@ -152,7 +152,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 152 |
--logging_strategy steps \
|
| 153 |
--logging_steps 10 \
|
| 154 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 155 |
-
--
|
| 156 |
--save_strategy steps \
|
| 157 |
--save_total_limit 1 \
|
| 158 |
--load_best_model_at_end \
|
|
@@ -208,7 +208,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 208 |
--logging_strategy steps \
|
| 209 |
--logging_steps 10 \
|
| 210 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 211 |
-
--
|
| 212 |
--save_strategy steps \
|
| 213 |
--save_total_limit 1 \
|
| 214 |
--load_best_model_at_end \
|
|
@@ -264,7 +264,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 264 |
--logging_strategy steps \
|
| 265 |
--logging_steps 10 \
|
| 266 |
--metric_for_best_model eval_rougeL_for_task1572_samsum_summary \
|
| 267 |
-
--
|
| 268 |
--save_strategy steps \
|
| 269 |
--save_total_limit 1 \
|
| 270 |
--load_best_model_at_end \
|
|
@@ -320,7 +320,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 320 |
--logging_strategy steps \
|
| 321 |
--logging_steps 10 \
|
| 322 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 323 |
-
--
|
| 324 |
--save_strategy steps \
|
| 325 |
--save_total_limit 1 \
|
| 326 |
--load_best_model_at_end \
|
|
@@ -376,7 +376,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 376 |
--logging_strategy steps \
|
| 377 |
--logging_steps 10 \
|
| 378 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 379 |
-
--
|
| 380 |
--save_strategy steps \
|
| 381 |
--save_total_limit 1 \
|
| 382 |
--load_best_model_at_end \
|
|
@@ -432,7 +432,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 432 |
--logging_strategy steps \
|
| 433 |
--logging_steps 10 \
|
| 434 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 435 |
-
--
|
| 436 |
--save_strategy steps \
|
| 437 |
--save_total_limit 1 \
|
| 438 |
--load_best_model_at_end \
|
|
@@ -488,7 +488,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 488 |
--logging_strategy steps \
|
| 489 |
--logging_steps 10 \
|
| 490 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 491 |
-
--
|
| 492 |
--save_strategy steps \
|
| 493 |
--save_total_limit 1 \
|
| 494 |
--load_best_model_at_end \
|
|
@@ -544,7 +544,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 544 |
--logging_strategy steps \
|
| 545 |
--logging_steps 10 \
|
| 546 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 547 |
-
--
|
| 548 |
--save_strategy steps \
|
| 549 |
--save_total_limit 1 \
|
| 550 |
--load_best_model_at_end \
|
|
@@ -600,7 +600,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 600 |
--logging_strategy steps \
|
| 601 |
--logging_steps 10 \
|
| 602 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 603 |
-
--
|
| 604 |
--save_strategy steps \
|
| 605 |
--save_total_limit 1 \
|
| 606 |
--load_best_model_at_end \
|
|
@@ -656,7 +656,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 656 |
--logging_strategy steps \
|
| 657 |
--logging_steps 10 \
|
| 658 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 659 |
-
--
|
| 660 |
--save_strategy steps \
|
| 661 |
--save_total_limit 1 \
|
| 662 |
--load_best_model_at_end \
|
|
@@ -712,7 +712,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 712 |
--logging_strategy steps \
|
| 713 |
--logging_steps 10 \
|
| 714 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 715 |
-
--
|
| 716 |
--save_strategy steps \
|
| 717 |
--save_total_limit 1 \
|
| 718 |
--load_best_model_at_end \
|
|
@@ -768,7 +768,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 768 |
--logging_strategy steps \
|
| 769 |
--logging_steps 10 \
|
| 770 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 771 |
-
--
|
| 772 |
--save_strategy steps \
|
| 773 |
--save_total_limit 1 \
|
| 774 |
--load_best_model_at_end \
|
|
@@ -824,7 +824,7 @@ deepspeed --include localhost:${1} --master_port 29500 src/run_llama.py \
|
|
| 824 |
--logging_strategy steps \
|
| 825 |
--logging_steps 10 \
|
| 826 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 827 |
-
--
|
| 828 |
--save_strategy steps \
|
| 829 |
--save_total_limit 1 \
|
| 830 |
--load_best_model_at_end \
|
|
|
|
| 41 |
--logging_strategy steps \
|
| 42 |
--logging_steps 10 \
|
| 43 |
--metric_for_best_model eval_rougeL \
|
| 44 |
+
--evaluation_strategy steps \
|
| 45 |
--save_strategy steps \
|
| 46 |
--save_total_limit 1 \
|
| 47 |
--lora_r 4 \
|
|
|
|
| 96 |
--logging_strategy steps \
|
| 97 |
--logging_steps 10 \
|
| 98 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 99 |
+
--evaluation_strategy steps \
|
| 100 |
--save_strategy steps \
|
| 101 |
--save_total_limit 1 \
|
| 102 |
--load_best_model_at_end \
|
|
|
|
| 152 |
--logging_strategy steps \
|
| 153 |
--logging_steps 10 \
|
| 154 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 155 |
+
--evaluation_strategy steps \
|
| 156 |
--save_strategy steps \
|
| 157 |
--save_total_limit 1 \
|
| 158 |
--load_best_model_at_end \
|
|
|
|
| 208 |
--logging_strategy steps \
|
| 209 |
--logging_steps 10 \
|
| 210 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 211 |
+
--evaluation_strategy steps \
|
| 212 |
--save_strategy steps \
|
| 213 |
--save_total_limit 1 \
|
| 214 |
--load_best_model_at_end \
|
|
|
|
| 264 |
--logging_strategy steps \
|
| 265 |
--logging_steps 10 \
|
| 266 |
--metric_for_best_model eval_rougeL_for_task1572_samsum_summary \
|
| 267 |
+
--evaluation_strategy steps \
|
| 268 |
--save_strategy steps \
|
| 269 |
--save_total_limit 1 \
|
| 270 |
--load_best_model_at_end \
|
|
|
|
| 320 |
--logging_strategy steps \
|
| 321 |
--logging_steps 10 \
|
| 322 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 323 |
+
--evaluation_strategy steps \
|
| 324 |
--save_strategy steps \
|
| 325 |
--save_total_limit 1 \
|
| 326 |
--load_best_model_at_end \
|
|
|
|
| 376 |
--logging_strategy steps \
|
| 377 |
--logging_steps 10 \
|
| 378 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 379 |
+
--evaluation_strategy steps \
|
| 380 |
--save_strategy steps \
|
| 381 |
--save_total_limit 1 \
|
| 382 |
--load_best_model_at_end \
|
|
|
|
| 432 |
--logging_strategy steps \
|
| 433 |
--logging_steps 10 \
|
| 434 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 435 |
+
--evaluation_strategy steps \
|
| 436 |
--save_strategy steps \
|
| 437 |
--save_total_limit 1 \
|
| 438 |
--load_best_model_at_end \
|
|
|
|
| 488 |
--logging_strategy steps \
|
| 489 |
--logging_steps 10 \
|
| 490 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 491 |
+
--evaluation_strategy steps \
|
| 492 |
--save_strategy steps \
|
| 493 |
--save_total_limit 1 \
|
| 494 |
--load_best_model_at_end \
|
|
|
|
| 544 |
--logging_strategy steps \
|
| 545 |
--logging_steps 10 \
|
| 546 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 547 |
+
--evaluation_strategy steps \
|
| 548 |
--save_strategy steps \
|
| 549 |
--save_total_limit 1 \
|
| 550 |
--load_best_model_at_end \
|
|
|
|
| 600 |
--logging_strategy steps \
|
| 601 |
--logging_steps 10 \
|
| 602 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 603 |
+
--evaluation_strategy steps \
|
| 604 |
--save_strategy steps \
|
| 605 |
--save_total_limit 1 \
|
| 606 |
--load_best_model_at_end \
|
|
|
|
| 656 |
--logging_strategy steps \
|
| 657 |
--logging_steps 10 \
|
| 658 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 659 |
+
--evaluation_strategy steps \
|
| 660 |
--save_strategy steps \
|
| 661 |
--save_total_limit 1 \
|
| 662 |
--load_best_model_at_end \
|
|
|
|
| 712 |
--logging_strategy steps \
|
| 713 |
--logging_steps 10 \
|
| 714 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 715 |
+
--evaluation_strategy steps \
|
| 716 |
--save_strategy steps \
|
| 717 |
--save_total_limit 1 \
|
| 718 |
--load_best_model_at_end \
|
|
|
|
| 768 |
--logging_strategy steps \
|
| 769 |
--logging_steps 10 \
|
| 770 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 771 |
+
--evaluation_strategy steps \
|
| 772 |
--save_strategy steps \
|
| 773 |
--save_total_limit 1 \
|
| 774 |
--load_best_model_at_end \
|
|
|
|
| 824 |
--logging_strategy steps \
|
| 825 |
--logging_steps 10 \
|
| 826 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 827 |
+
--evaluation_strategy steps \
|
| 828 |
--save_strategy steps \
|
| 829 |
--save_total_limit 1 \
|
| 830 |
--load_best_model_at_end \
|
root_gainlora/gen_script_superni_order2_t5_gainlora_inflora.sh
CHANGED
|
@@ -38,7 +38,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 38 |
--logging_strategy steps \
|
| 39 |
--logging_steps 10 \
|
| 40 |
--metric_for_best_model eval_rougeL \
|
| 41 |
-
--
|
| 42 |
--save_strategy steps \
|
| 43 |
--save_total_limit 1 \
|
| 44 |
--lora_r 4 \
|
|
@@ -86,7 +86,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 86 |
--logging_strategy steps \
|
| 87 |
--logging_steps 10 \
|
| 88 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 89 |
-
--
|
| 90 |
--save_strategy steps \
|
| 91 |
--save_total_limit 1 \
|
| 92 |
--load_best_model_at_end \
|
|
@@ -135,7 +135,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 135 |
--logging_strategy steps \
|
| 136 |
--logging_steps 10 \
|
| 137 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 138 |
-
--
|
| 139 |
--save_strategy steps \
|
| 140 |
--save_total_limit 1 \
|
| 141 |
--load_best_model_at_end \
|
|
@@ -184,7 +184,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 184 |
--logging_strategy steps \
|
| 185 |
--logging_steps 10 \
|
| 186 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 187 |
-
--
|
| 188 |
--save_strategy steps \
|
| 189 |
--save_total_limit 1 \
|
| 190 |
--load_best_model_at_end \
|
|
@@ -233,7 +233,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 233 |
--logging_strategy steps \
|
| 234 |
--logging_steps 10 \
|
| 235 |
--metric_for_best_model eval_rougeL_for_task1572_samsum_summary \
|
| 236 |
-
--
|
| 237 |
--save_strategy steps \
|
| 238 |
--save_total_limit 1 \
|
| 239 |
--load_best_model_at_end \
|
|
@@ -282,7 +282,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 282 |
--logging_strategy steps \
|
| 283 |
--logging_steps 10 \
|
| 284 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 285 |
-
--
|
| 286 |
--save_strategy steps \
|
| 287 |
--save_total_limit 1 \
|
| 288 |
--load_best_model_at_end \
|
|
@@ -331,7 +331,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 331 |
--logging_strategy steps \
|
| 332 |
--logging_steps 10 \
|
| 333 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 334 |
-
--
|
| 335 |
--save_strategy steps \
|
| 336 |
--save_total_limit 1 \
|
| 337 |
--load_best_model_at_end \
|
|
@@ -380,7 +380,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 380 |
--logging_strategy steps \
|
| 381 |
--logging_steps 10 \
|
| 382 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 383 |
-
--
|
| 384 |
--save_strategy steps \
|
| 385 |
--save_total_limit 1 \
|
| 386 |
--load_best_model_at_end \
|
|
@@ -429,7 +429,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 429 |
--logging_strategy steps \
|
| 430 |
--logging_steps 10 \
|
| 431 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 432 |
-
--
|
| 433 |
--save_strategy steps \
|
| 434 |
--save_total_limit 1 \
|
| 435 |
--load_best_model_at_end \
|
|
@@ -478,7 +478,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 478 |
--logging_strategy steps \
|
| 479 |
--logging_steps 10 \
|
| 480 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 481 |
-
--
|
| 482 |
--save_strategy steps \
|
| 483 |
--save_total_limit 1 \
|
| 484 |
--load_best_model_at_end \
|
|
@@ -527,7 +527,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 527 |
--logging_strategy steps \
|
| 528 |
--logging_steps 10 \
|
| 529 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 530 |
-
--
|
| 531 |
--save_strategy steps \
|
| 532 |
--save_total_limit 1 \
|
| 533 |
--load_best_model_at_end \
|
|
@@ -576,7 +576,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 576 |
--logging_strategy steps \
|
| 577 |
--logging_steps 10 \
|
| 578 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 579 |
-
--
|
| 580 |
--save_strategy steps \
|
| 581 |
--save_total_limit 1 \
|
| 582 |
--load_best_model_at_end \
|
|
@@ -625,7 +625,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 625 |
--logging_strategy steps \
|
| 626 |
--logging_steps 10 \
|
| 627 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 628 |
-
--
|
| 629 |
--save_strategy steps \
|
| 630 |
--save_total_limit 1 \
|
| 631 |
--load_best_model_at_end \
|
|
@@ -674,7 +674,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 674 |
--logging_strategy steps \
|
| 675 |
--logging_steps 10 \
|
| 676 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 677 |
-
--
|
| 678 |
--save_strategy steps \
|
| 679 |
--save_total_limit 1 \
|
| 680 |
--load_best_model_at_end \
|
|
@@ -723,7 +723,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 723 |
--logging_strategy steps \
|
| 724 |
--logging_steps 10 \
|
| 725 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 726 |
-
--
|
| 727 |
--save_strategy steps \
|
| 728 |
--save_total_limit 1 \
|
| 729 |
--load_best_model_at_end \
|
|
|
|
| 38 |
--logging_strategy steps \
|
| 39 |
--logging_steps 10 \
|
| 40 |
--metric_for_best_model eval_rougeL \
|
| 41 |
+
--evaluation_strategy steps \
|
| 42 |
--save_strategy steps \
|
| 43 |
--save_total_limit 1 \
|
| 44 |
--lora_r 4 \
|
|
|
|
| 86 |
--logging_strategy steps \
|
| 87 |
--logging_steps 10 \
|
| 88 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 89 |
+
--evaluation_strategy steps \
|
| 90 |
--save_strategy steps \
|
| 91 |
--save_total_limit 1 \
|
| 92 |
--load_best_model_at_end \
|
|
|
|
| 135 |
--logging_strategy steps \
|
| 136 |
--logging_steps 10 \
|
| 137 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 138 |
+
--evaluation_strategy steps \
|
| 139 |
--save_strategy steps \
|
| 140 |
--save_total_limit 1 \
|
| 141 |
--load_best_model_at_end \
|
|
|
|
| 184 |
--logging_strategy steps \
|
| 185 |
--logging_steps 10 \
|
| 186 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 187 |
+
--evaluation_strategy steps \
|
| 188 |
--save_strategy steps \
|
| 189 |
--save_total_limit 1 \
|
| 190 |
--load_best_model_at_end \
|
|
|
|
| 233 |
--logging_strategy steps \
|
| 234 |
--logging_steps 10 \
|
| 235 |
--metric_for_best_model eval_rougeL_for_task1572_samsum_summary \
|
| 236 |
+
--evaluation_strategy steps \
|
| 237 |
--save_strategy steps \
|
| 238 |
--save_total_limit 1 \
|
| 239 |
--load_best_model_at_end \
|
|
|
|
| 282 |
--logging_strategy steps \
|
| 283 |
--logging_steps 10 \
|
| 284 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 285 |
+
--evaluation_strategy steps \
|
| 286 |
--save_strategy steps \
|
| 287 |
--save_total_limit 1 \
|
| 288 |
--load_best_model_at_end \
|
|
|
|
| 331 |
--logging_strategy steps \
|
| 332 |
--logging_steps 10 \
|
| 333 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 334 |
+
--evaluation_strategy steps \
|
| 335 |
--save_strategy steps \
|
| 336 |
--save_total_limit 1 \
|
| 337 |
--load_best_model_at_end \
|
|
|
|
| 380 |
--logging_strategy steps \
|
| 381 |
--logging_steps 10 \
|
| 382 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 383 |
+
--evaluation_strategy steps \
|
| 384 |
--save_strategy steps \
|
| 385 |
--save_total_limit 1 \
|
| 386 |
--load_best_model_at_end \
|
|
|
|
| 429 |
--logging_strategy steps \
|
| 430 |
--logging_steps 10 \
|
| 431 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 432 |
+
--evaluation_strategy steps \
|
| 433 |
--save_strategy steps \
|
| 434 |
--save_total_limit 1 \
|
| 435 |
--load_best_model_at_end \
|
|
|
|
| 478 |
--logging_strategy steps \
|
| 479 |
--logging_steps 10 \
|
| 480 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 481 |
+
--evaluation_strategy steps \
|
| 482 |
--save_strategy steps \
|
| 483 |
--save_total_limit 1 \
|
| 484 |
--load_best_model_at_end \
|
|
|
|
| 527 |
--logging_strategy steps \
|
| 528 |
--logging_steps 10 \
|
| 529 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 530 |
+
--evaluation_strategy steps \
|
| 531 |
--save_strategy steps \
|
| 532 |
--save_total_limit 1 \
|
| 533 |
--load_best_model_at_end \
|
|
|
|
| 576 |
--logging_strategy steps \
|
| 577 |
--logging_steps 10 \
|
| 578 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 579 |
+
--evaluation_strategy steps \
|
| 580 |
--save_strategy steps \
|
| 581 |
--save_total_limit 1 \
|
| 582 |
--load_best_model_at_end \
|
|
|
|
| 625 |
--logging_strategy steps \
|
| 626 |
--logging_steps 10 \
|
| 627 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 628 |
+
--evaluation_strategy steps \
|
| 629 |
--save_strategy steps \
|
| 630 |
--save_total_limit 1 \
|
| 631 |
--load_best_model_at_end \
|
|
|
|
| 674 |
--logging_strategy steps \
|
| 675 |
--logging_steps 10 \
|
| 676 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 677 |
+
--evaluation_strategy steps \
|
| 678 |
--save_strategy steps \
|
| 679 |
--save_total_limit 1 \
|
| 680 |
--load_best_model_at_end \
|
|
|
|
| 723 |
--logging_strategy steps \
|
| 724 |
--logging_steps 10 \
|
| 725 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 726 |
+
--evaluation_strategy steps \
|
| 727 |
--save_strategy steps \
|
| 728 |
--save_total_limit 1 \
|
| 729 |
--load_best_model_at_end \
|
root_gainlora/gen_script_superni_order2_t5_inflora.sh
CHANGED
|
@@ -38,7 +38,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 38 |
--logging_strategy steps \
|
| 39 |
--logging_steps 10 \
|
| 40 |
--metric_for_best_model eval_rougeL \
|
| 41 |
-
--
|
| 42 |
--save_strategy steps \
|
| 43 |
--save_total_limit 1 \
|
| 44 |
--lora_r 4 \
|
|
@@ -84,7 +84,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 84 |
--logging_strategy steps \
|
| 85 |
--logging_steps 10 \
|
| 86 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 87 |
-
--
|
| 88 |
--save_strategy steps \
|
| 89 |
--save_total_limit 1 \
|
| 90 |
--load_best_model_at_end \
|
|
@@ -131,7 +131,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 131 |
--logging_strategy steps \
|
| 132 |
--logging_steps 10 \
|
| 133 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 134 |
-
--
|
| 135 |
--save_strategy steps \
|
| 136 |
--save_total_limit 1 \
|
| 137 |
--load_best_model_at_end \
|
|
@@ -178,7 +178,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 178 |
--logging_strategy steps \
|
| 179 |
--logging_steps 10 \
|
| 180 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 181 |
-
--
|
| 182 |
--save_strategy steps \
|
| 183 |
--save_total_limit 1 \
|
| 184 |
--load_best_model_at_end \
|
|
@@ -225,7 +225,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 225 |
--logging_strategy steps \
|
| 226 |
--logging_steps 10 \
|
| 227 |
--metric_for_best_model eval_rougeL_for_task1572_samsum_summary \
|
| 228 |
-
--
|
| 229 |
--save_strategy steps \
|
| 230 |
--save_total_limit 1 \
|
| 231 |
--load_best_model_at_end \
|
|
@@ -272,7 +272,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 272 |
--logging_strategy steps \
|
| 273 |
--logging_steps 10 \
|
| 274 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 275 |
-
--
|
| 276 |
--save_strategy steps \
|
| 277 |
--save_total_limit 1 \
|
| 278 |
--load_best_model_at_end \
|
|
@@ -319,7 +319,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 319 |
--logging_strategy steps \
|
| 320 |
--logging_steps 10 \
|
| 321 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 322 |
-
--
|
| 323 |
--save_strategy steps \
|
| 324 |
--save_total_limit 1 \
|
| 325 |
--load_best_model_at_end \
|
|
@@ -366,7 +366,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 366 |
--logging_strategy steps \
|
| 367 |
--logging_steps 10 \
|
| 368 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 369 |
-
--
|
| 370 |
--save_strategy steps \
|
| 371 |
--save_total_limit 1 \
|
| 372 |
--load_best_model_at_end \
|
|
@@ -413,7 +413,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 413 |
--logging_strategy steps \
|
| 414 |
--logging_steps 10 \
|
| 415 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 416 |
-
--
|
| 417 |
--save_strategy steps \
|
| 418 |
--save_total_limit 1 \
|
| 419 |
--load_best_model_at_end \
|
|
@@ -460,7 +460,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 460 |
--logging_strategy steps \
|
| 461 |
--logging_steps 10 \
|
| 462 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 463 |
-
--
|
| 464 |
--save_strategy steps \
|
| 465 |
--save_total_limit 1 \
|
| 466 |
--load_best_model_at_end \
|
|
@@ -507,7 +507,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 507 |
--logging_strategy steps \
|
| 508 |
--logging_steps 10 \
|
| 509 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 510 |
-
--
|
| 511 |
--save_strategy steps \
|
| 512 |
--save_total_limit 1 \
|
| 513 |
--load_best_model_at_end \
|
|
@@ -554,7 +554,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 554 |
--logging_strategy steps \
|
| 555 |
--logging_steps 10 \
|
| 556 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 557 |
-
--
|
| 558 |
--save_strategy steps \
|
| 559 |
--save_total_limit 1 \
|
| 560 |
--load_best_model_at_end \
|
|
@@ -601,7 +601,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 601 |
--logging_strategy steps \
|
| 602 |
--logging_steps 10 \
|
| 603 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 604 |
-
--
|
| 605 |
--save_strategy steps \
|
| 606 |
--save_total_limit 1 \
|
| 607 |
--load_best_model_at_end \
|
|
@@ -648,7 +648,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 648 |
--logging_strategy steps \
|
| 649 |
--logging_steps 10 \
|
| 650 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 651 |
-
--
|
| 652 |
--save_strategy steps \
|
| 653 |
--save_total_limit 1 \
|
| 654 |
--load_best_model_at_end \
|
|
@@ -695,7 +695,7 @@ CUDA_VISIBLE_DEVICES=$1 python src/run_t5.py \
|
|
| 695 |
--logging_strategy steps \
|
| 696 |
--logging_steps 10 \
|
| 697 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 698 |
-
--eval_strategy steps \
|
| 699 |
--save_strategy steps \
|
| 700 |
--save_total_limit 1 \
|
| 701 |
--load_best_model_at_end \
|
|
|
|
| 38 |
--logging_strategy steps \
|
| 39 |
--logging_steps 10 \
|
| 40 |
--metric_for_best_model eval_rougeL \
|
| 41 |
+
--evaluation_strategy steps \
|
| 42 |
--save_strategy steps \
|
| 43 |
--save_total_limit 1 \
|
| 44 |
--lora_r 4 \
|
|
|
|
| 84 |
--logging_strategy steps \
|
| 85 |
--logging_steps 10 \
|
| 86 |
--metric_for_best_model eval_rougeL_for_task073_commonsenseqa_answer_generation \
|
| 87 |
+
--evaluation_strategy steps \
|
| 88 |
--save_strategy steps \
|
| 89 |
--save_total_limit 1 \
|
| 90 |
--load_best_model_at_end \
|
|
|
|
| 131 |
--logging_strategy steps \
|
| 132 |
--logging_steps 10 \
|
| 133 |
--metric_for_best_model eval_rougeL_for_task1590_diplomacy_text_generation \
|
| 134 |
+
--evaluation_strategy steps \
|
| 135 |
--save_strategy steps \
|
| 136 |
--save_total_limit 1 \
|
| 137 |
--load_best_model_at_end \
|
|
|
|
| 178 |
--logging_strategy steps \
|
| 179 |
--logging_steps 10 \
|
| 180 |
--metric_for_best_model eval_rougeL_for_task639_multi_woz_user_utterance_generation \
|
| 181 |
+
--evaluation_strategy steps \
|
| 182 |
--save_strategy steps \
|
| 183 |
--save_total_limit 1 \
|
| 184 |
--load_best_model_at_end \
|
|
|
|
| 225 |
--logging_strategy steps \
|
| 226 |
--logging_steps 10 \
|
| 227 |
--metric_for_best_model eval_rougeL_for_task1572_samsum_summary \
|
| 228 |
+
--evaluation_strategy steps \
|
| 229 |
--save_strategy steps \
|
| 230 |
--save_total_limit 1 \
|
| 231 |
--load_best_model_at_end \
|
|
|
|
| 272 |
--logging_strategy steps \
|
| 273 |
--logging_steps 10 \
|
| 274 |
--metric_for_best_model eval_rougeL_for_task1687_sentiment140_classification \
|
| 275 |
+
--evaluation_strategy steps \
|
| 276 |
--save_strategy steps \
|
| 277 |
--save_total_limit 1 \
|
| 278 |
--load_best_model_at_end \
|
|
|
|
| 319 |
--logging_strategy steps \
|
| 320 |
--logging_steps 10 \
|
| 321 |
--metric_for_best_model eval_rougeL_for_task591_sciq_answer_generation \
|
| 322 |
+
--evaluation_strategy steps \
|
| 323 |
--save_strategy steps \
|
| 324 |
--save_total_limit 1 \
|
| 325 |
--load_best_model_at_end \
|
|
|
|
| 366 |
--logging_strategy steps \
|
| 367 |
--logging_steps 10 \
|
| 368 |
--metric_for_best_model eval_rougeL_for_task363_sst2_polarity_classification \
|
| 369 |
+
--evaluation_strategy steps \
|
| 370 |
--save_strategy steps \
|
| 371 |
--save_total_limit 1 \
|
| 372 |
--load_best_model_at_end \
|
|
|
|
| 413 |
--logging_strategy steps \
|
| 414 |
--logging_steps 10 \
|
| 415 |
--metric_for_best_model eval_rougeL_for_task1510_evalution_relation_extraction \
|
| 416 |
+
--evaluation_strategy steps \
|
| 417 |
--save_strategy steps \
|
| 418 |
--save_total_limit 1 \
|
| 419 |
--load_best_model_at_end \
|
|
|
|
| 460 |
--logging_strategy steps \
|
| 461 |
--logging_steps 10 \
|
| 462 |
--metric_for_best_model eval_rougeL_for_task1729_personachat_generate_next \
|
| 463 |
+
--evaluation_strategy steps \
|
| 464 |
--save_strategy steps \
|
| 465 |
--save_total_limit 1 \
|
| 466 |
--load_best_model_at_end \
|
|
|
|
| 507 |
--logging_strategy steps \
|
| 508 |
--logging_steps 10 \
|
| 509 |
--metric_for_best_model eval_rougeL_for_task181_outcome_extraction \
|
| 510 |
+
--evaluation_strategy steps \
|
| 511 |
--save_strategy steps \
|
| 512 |
--save_total_limit 1 \
|
| 513 |
--load_best_model_at_end \
|
|
|
|
| 554 |
--logging_strategy steps \
|
| 555 |
--logging_steps 10 \
|
| 556 |
--metric_for_best_model eval_rougeL_for_task511_reddit_tifu_long_text_summarization \
|
| 557 |
+
--evaluation_strategy steps \
|
| 558 |
--save_strategy steps \
|
| 559 |
--save_total_limit 1 \
|
| 560 |
--load_best_model_at_end \
|
|
|
|
| 601 |
--logging_strategy steps \
|
| 602 |
--logging_steps 10 \
|
| 603 |
--metric_for_best_model eval_rougeL_for_task002_quoref_answer_generation \
|
| 604 |
+
--evaluation_strategy steps \
|
| 605 |
--save_strategy steps \
|
| 606 |
--save_total_limit 1 \
|
| 607 |
--load_best_model_at_end \
|
|
|
|
| 648 |
--logging_strategy steps \
|
| 649 |
--logging_steps 10 \
|
| 650 |
--metric_for_best_model eval_rougeL_for_task1290_xsum_summarization \
|
| 651 |
+
--evaluation_strategy steps \
|
| 652 |
--save_strategy steps \
|
| 653 |
--save_total_limit 1 \
|
| 654 |
--load_best_model_at_end \
|
|
|
|
| 695 |
--logging_strategy steps \
|
| 696 |
--logging_steps 10 \
|
| 697 |
--metric_for_best_model eval_rougeL_for_task875_emotion_classification \
|
| 698 |
+
--evaluation_strategy steps \
|
| 699 |
--save_strategy steps \
|
| 700 |
--save_total_limit 1 \
|
| 701 |
--load_best_model_at_end \
|