| | import argparse |
| | import os |
| | import sys |
| |
|
| | |
| | sys.path.insert(0, os.path.join(os.path.dirname(__file__), '..', '..')) |
| | from utils.benchmark_utils import get_benchmark_score |
| |
|
| | def main(): |
| | parser = argparse.ArgumentParser(description="Evaluate dialogue generation") |
| | parser.add_argument("model_path", type=str, help="Path to model checkpoint") |
| | args = parser.parse_args() |
| | |
| | if not os.path.isdir(args.model_path): |
| | print(f"Error: Directory not found at '{args.model_path}'", file=sys.stderr) |
| | sys.exit(1) |
| | |
| | checkpoint_name = os.path.basename(os.path.normpath(args.model_path)) |
| | try: |
| | step_number = int(checkpoint_name.split('_')[-1]) |
| | except (ValueError, IndexError): |
| | print(f"Error: Cannot parse step number from '{checkpoint_name}'", file=sys.stderr) |
| | sys.exit(1) |
| | |
| | config_data = config_init() |
| | |
| | result = get_benchmark_score("dialogue_generation", step_number) |
| | if result is None: |
| | print(f"Error: Invalid step number {step_number}", file=sys.stderr) |
| | sys.exit(1) |
| | |
| | print(result) |
| |
|
| | if __name__ == "__main__": |
| | main() |