| import os |
| import json |
| import glob |
| import traceback |
| from flask import Flask, render_template, jsonify, send_file, request |
| from flask_cors import CORS |
|
|
| app = Flask(__name__) |
| CORS(app) |
|
|
|
|
| |
| @app.route("/") |
| def index(): |
| return render_template("viewer.html") |
|
|
|
|
| |
| @app.route("/api/evals") |
| def list_evals(): |
| base_dir = request.args.get("path", "./eval_results") |
| if not os.path.exists(base_dir): |
| return jsonify({"error": f"Path {base_dir} does not exist"}), 404 |
|
|
| eval_dirs = [] |
| for item in os.listdir(base_dir): |
| full_path = os.path.join(base_dir, item) |
| if os.path.isdir(full_path) and item.startswith("eval_"): |
| eval_dirs.append(item) |
|
|
| return jsonify(eval_dirs) |
|
|
|
|
| |
| @app.route("/api/eval/<eval_id>/examples") |
| def get_examples(eval_id): |
| base_dir = request.args.get("path", "./eval_results") |
| eval_path = os.path.join(base_dir, eval_id) |
|
|
| |
| examples_json_path = os.path.join(eval_path, "examples.json") |
| examples = {} |
|
|
| if os.path.exists(examples_json_path): |
| try: |
| with open(examples_json_path, "r") as f: |
| examples = json.load(f) |
| except json.JSONDecodeError: |
| app.logger.error(f"Error parsing examples.json at {examples_json_path}") |
|
|
| |
| if not examples: |
| for item in os.listdir(eval_path): |
| if os.path.isdir(os.path.join(eval_path, item)) and item.startswith( |
| "example_" |
| ): |
| example_id = item.replace("example_", "") |
| example_dir = os.path.join(eval_path, item) |
|
|
| |
| run_dirs = [] |
| for run_item in os.listdir(example_dir): |
| run_path = os.path.join(example_dir, run_item) |
| if os.path.isdir(run_path) and run_item.startswith("run_"): |
| run_dirs.append(run_item) |
|
|
| if run_dirs: |
| task_path = os.path.join(example_dir, run_dirs[0], "task.txt") |
| if os.path.exists(task_path): |
| with open(task_path, "r") as f: |
| examples[example_id] = f.read().strip() |
| else: |
| |
| metadata_path = os.path.join( |
| example_dir, run_dirs[0], "metadata.json" |
| ) |
| if os.path.exists(metadata_path): |
| try: |
| with open(metadata_path, "r") as f: |
| metadata = json.load(f) |
| |
| if ( |
| "summary" in metadata |
| and metadata["summary"] |
| and "task" in metadata["summary"][0] |
| ): |
| examples[example_id] = metadata["summary"][0][ |
| "task" |
| ] |
| except: |
| |
| examples[example_id] = f"Task for {example_id}" |
| else: |
| examples[example_id] = f"Task for {example_id}" |
|
|
| return jsonify(examples) |
|
|
|
|
| |
| @app.route("/api/eval/<eval_id>/example/<example_id>/runs") |
| def get_runs(eval_id, example_id): |
| base_dir = request.args.get("path", "./eval_results") |
| example_dir = os.path.join(base_dir, eval_id, f"example_{example_id}") |
|
|
| if not os.path.exists(example_dir): |
| return jsonify({"error": f"Example directory not found: {example_dir}"}), 404 |
|
|
| runs = [] |
| for item in os.listdir(example_dir): |
| item_path = os.path.join(example_dir, item) |
| if os.path.isdir(item_path) and item.startswith("run_"): |
| run_id = item |
|
|
| |
| metadata_path = os.path.join(item_path, "metadata.json") |
| status = "unknown" |
|
|
| if os.path.exists(metadata_path): |
| try: |
| with open(metadata_path, "r") as f: |
| metadata = json.load(f) |
| status = metadata.get("status", "unknown") |
| except Exception as e: |
| app.logger.error( |
| f"Error reading metadata.json for {run_id}: {str(e)}" |
| ) |
|
|
| runs.append({"id": run_id, "status": status}) |
| app.logger.info(f"runs: {runs}") |
|
|
| return jsonify(runs) |
|
|
|
|
| |
| @app.route("/api/eval/<eval_id>/example/<example_id>/run/<run_id>/metadata") |
| def get_metadata(eval_id, example_id, run_id): |
| base_dir = request.args.get("path", "./eval_results") |
| run_dir = os.path.join(base_dir, eval_id, f"example_{example_id}", run_id) |
| metadata_path = os.path.join(run_dir, "metadata.json") |
| app.logger.info(f"metadata: {metadata_path}") |
|
|
| if not os.path.exists(metadata_path): |
| return jsonify({"error": "Metadata not found", "path": metadata_path}), 404 |
|
|
| try: |
| with open(metadata_path, "r") as f: |
| metadata_content = f.read() |
| if not metadata_content.strip(): |
| return jsonify({"error": "Metadata file is empty"}), 404 |
|
|
| metadata = json.loads(metadata_content) |
| return jsonify(metadata) |
| except json.JSONDecodeError as e: |
| error_info = { |
| "error": "Invalid JSON in metadata file", |
| "details": str(e), |
| "path": metadata_path, |
| } |
| app.logger.error(f"JSON error in {metadata_path}: {str(e)}") |
| return jsonify(error_info), 400 |
| except Exception as e: |
| error_info = { |
| "error": "Error reading metadata file", |
| "details": str(e), |
| "traceback": traceback.format_exc(), |
| "path": metadata_path, |
| } |
| app.logger.error(f"Error reading {metadata_path}: {str(e)}") |
| return jsonify(error_info), 500 |
|
|
|
|
| |
| @app.route("/api/eval/<eval_id>/example/<example_id>/run/<run_id>/screenshots") |
| def get_screenshots(eval_id, example_id, run_id): |
| base_dir = request.args.get("path", "./eval_results") |
| run_dir = os.path.join(base_dir, eval_id, f"example_{example_id}", run_id) |
|
|
| if not os.path.exists(run_dir): |
| return jsonify({"error": f"Run directory not found: {run_dir}"}), 404 |
|
|
| screenshots = [] |
| for ext in ["png", "jpg", "jpeg"]: |
| pattern = os.path.join(run_dir, f"*.{ext}") |
| for file_path in glob.glob(pattern): |
| filename = os.path.basename(file_path) |
| screenshots.append( |
| {"name": filename, "path": f"/api/image?path={file_path}"} |
| ) |
|
|
| |
| screenshots.sort(key=lambda x: x["name"]) |
|
|
| app.logger.info(f"screenshots: {screenshots}") |
|
|
| return jsonify(screenshots) |
|
|
|
|
| |
| @app.route("/api/image") |
| def get_image(): |
| path = request.args.get("path") |
| if not path: |
| return jsonify({"error": "No path provided"}), 400 |
|
|
| if not os.path.exists(path): |
| return jsonify({"error": f"Image not found at path: {path}"}), 404 |
|
|
| try: |
| return send_file(path) |
| except Exception as e: |
| return jsonify({"error": f"Error serving image: {str(e)}"}), 500 |
|
|
|
|
| if __name__ == "__main__": |
| print("Evaluation Server is running at http://localhost:8000") |
| print("Press Ctrl+C to stop the server") |
|
|
| app.run(debug=True, port=8000) |
|
|