| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
|
|
| import argparse |
| import itertools |
| import operator |
| import sys |
| from collections import OrderedDict |
|
|
| from run_eval import datetime_now, run_generate |
|
|
| from utils import ROUGE_KEYS |
|
|
|
|
| |
| |
| task_score_names = { |
| "translation": ["bleu"], |
| "summarization": ROUGE_KEYS, |
| } |
|
|
|
|
| def parse_search_arg(search): |
| groups = search.split() |
| entries = dict(g.split("=") for g in groups) |
| entry_names = list(entries.keys()) |
| sets = [[f"--{k} {v}" for v in vs.split(":")] for k, vs in entries.items()] |
| matrix = [list(x) for x in itertools.product(*sets)] |
| return matrix, entry_names |
|
|
|
|
| def run_search(): |
| """ |
| Run parametric search over the desired hparam space with help of ``run_eval.py``. |
| |
| All the arguments except ``--search`` are passed to ``run_eval.py`` as is. The values inside of "--search" are parsed, reformatted and fed to ``run_eval.py`` as additional args. |
| |
| The format for the ``--search`` value is a simple string with hparams and colon separated values to try, e.g.: |
| ``` |
| --search "num_beams=5:10 length_penalty=0.8:1.0:1.2 early_stopping=true:false" |
| ``` |
| which will generate ``12`` ``(2*3*2)`` searches for a product of each hparam. For example the example that was just used will invoke ``run_eval.py`` repeatedly with: |
| |
| ``` |
| --num_beams 5 --length_penalty 0.8 --early_stopping true |
| --num_beams 5 --length_penalty 0.8 --early_stopping false |
| [...] |
| --num_beams 10 --length_penalty 1.2 --early_stopping false |
| ``` |
| |
| On completion, this function prints a markdown table of the results sorted by the best BLEU score and the winning arguments. |
| |
| |
| """ |
| prog = sys.argv[0] |
|
|
| parser = argparse.ArgumentParser( |
| usage=( |
| "\n\nImportant: this script accepts all arguments `run_eval.py` accepts and then a few extra, therefore" |
| " refer to `run_eval.py -h` for the complete list." |
| ) |
| ) |
| parser.add_argument( |
| "--search", |
| type=str, |
| required=False, |
| help='param space to search, e.g. "num_beams=5:10 length_penalty=0.8:1.0:1.2"', |
| ) |
| parser.add_argument( |
| "--bs", type=int, default=8, required=False, help="initial batch size (may get reduced if it's too big)" |
| ) |
| parser.add_argument("--task", type=str, help="used for task_specific_params + metrics") |
| parser.add_argument( |
| "--info", |
| nargs="?", |
| type=str, |
| const=datetime_now(), |
| help=( |
| "add custom notes to be printed before the results table. If no value is passed, the current datetime" |
| " string will be used." |
| ), |
| ) |
| args, args_main = parser.parse_known_args() |
| |
| args_main.extend(["--task", args.task]) |
| args_normal = [prog] + args_main |
|
|
| |
| task = "translation" if "translation" in args.task else "summarization" |
|
|
| matrix, col_names = parse_search_arg(args.search) |
| col_names[0:0] = task_score_names[task] |
| col_widths = {col: len(str(col)) for col in col_names} |
| results = [] |
| for r in matrix: |
| hparams = dict(x.replace("--", "").split() for x in r) |
| args_exp = " ".join(r).split() |
| args_exp.extend(["--bs", str(args.bs)]) |
| sys.argv = args_normal + args_exp |
|
|
| |
|
|
| scores = run_generate(verbose=False) |
| |
| result = OrderedDict() |
| for score in task_score_names[task]: |
| result[score] = scores[score] |
| result.update(hparams) |
| results.append(result) |
|
|
| |
| for k, v in result.items(): |
| l = len(str(v)) |
| if l > col_widths[k]: |
| col_widths[k] = l |
|
|
| results_sorted = sorted(results, key=operator.itemgetter(*task_score_names[task]), reverse=True) |
| print(" | ".join([f"{col:{col_widths[col]}}" for col in col_names])) |
| print(" | ".join([f"{'-' * col_widths[col]}" for col in col_names])) |
| for row in results_sorted: |
| print(" | ".join([f"{row[col]:{col_widths[col]}}" for col in col_names])) |
|
|
| best = results_sorted[0] |
| for score in task_score_names[task]: |
| del best[score] |
| best_args = [f"--{k} {v}" for k, v in best.items()] |
| dyn_args = ["--bs", str(args.bs)] |
| if args.info: |
| print(f"\nInfo: {args.info}") |
| print("\nBest score args:") |
| print(" ".join(args_main + best_args + dyn_args)) |
|
|
| return results_sorted |
|
|
|
|
| if __name__ == "__main__": |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| run_search() |
|
|