# Markdown shown as the leaderboard introduction. Headings, list items and the
# image each start on their own line so that Markdown renderers recognise them.
AVBENCH_INTRODUCTION = """# AVBench Leaderboard

AVBench is a human-aligned and automated benchmark for evaluating text-to-audio-video (T2AV) generation. It reports **Normal** and **Hard** splits across cross-modal alignment and unimodal quality metrics.

## Links
- Code: https://github.com/YaJialiang/AVBench
- Models: https://huggingface.co/iiiiii123/AVBench_model
- Dataset: https://huggingface.co/datasets/iiiiii123/AVBench

## Metrics
- Cross-Modal Alignment & Sync: AV, AT, VT, SyncNet
- Unimodal Generation Quality: SC, DF-Arena, NISQA, Audiobox, DOVER++, Aesthetic
- All metrics are higher-is-better.

## Chart
![AVBench Radar Chart](https://raw.githubusercontent.com/YaJialiang/AVBench-site/main/static/images/avbench/radar_chart.png)
"""

# Metric names, grouped as in the introduction text above.
METRIC_COLUMNS = [
    # Cross-modal alignment & sync
    "AV",
    "AT",
    "VT",
    "SyncNet",
    # Unimodal generation quality
    "SC",
    "DF-Arena",
    "NISQA",
    "Audiobox",
    "DOVER++",
    "Aesthetic",
]

# Equal weight by default, can be adjusted later.
# Keys mirror METRIC_COLUMNS one-to-one; keep the two in sync when editing.
METRIC_WEIGHTS = {
    "AV": 1.0,
    "AT": 1.0,
    "VT": 1.0,
    "SyncNet": 1.0,
    "SC": 1.0,
    "DF-Arena": 1.0,
    "NISQA": 1.0,
    "Audiobox": 1.0,
    "DOVER++": 1.0,
    "Aesthetic": 1.0,
}

# Each row is [model name, followed by ten metric values].
# NOTE(review): the values are presumably in METRIC_COLUMNS order and
# NORMAL_ROWS / HARD_ROWS presumably hold the "Normal" / "Hard" split results
# mentioned in the introduction -- confirm against the code that consumes them.
NORMAL_ROWS = [
    ["Sora 2", 0.8713, 0.8675, 0.7599, 4.9057, 87.8391, 0.4328, 2.3784, 3.1759, 60.0125, 4.0704],
    ["Veo 3 Fast", 0.6924, 0.8300, 0.7235, 6.5943, 77.4950, 0.3043, 2.8191, 3.5877, 69.2275, 4.9967],
    ["Wan 2.6", 0.8207, 0.8227, 0.7556, 4.5016, 91.5568, 0.0441, 3.0289, 3.9271, 71.6473, 4.7790],
    ["Kling 2.6", 0.7626, 0.8061, 0.7501, 8.1027, 68.7844, 0.1665, 3.3141, 3.8082, 65.6786, 5.4885],
    ["Seedance 1.5 Pro", 0.6536, 0.8554, 0.7363, 5.0146, 84.9268, 0.1602, 3.6411, 4.1686, 71.7205, 4.7373],
]

# Same row layout and model order as NORMAL_ROWS.
HARD_ROWS = [
    ["Sora 2", 0.9320, 0.8575, 0.7190, 3.7932, 76.7905, 0.5498, 2.0564, 3.1339, 58.1538, 4.0434],
    ["Veo 3 Fast", 0.7766, 0.8117, 0.6943, 3.4535, 70.3144, 0.3827, 2.3321, 3.6113, 67.0833, 5.1438],
    ["Wan 2.6", 0.8780, 0.8418, 0.7482, 3.0488, 84.4512, 0.0498, 3.0726, 4.0924, 71.5229, 4.7721],
    ["Kling 2.6", 0.8813, 0.7602, 0.7105, 3.9844, 69.0691, 0.1469, 3.2425, 3.8912, 62.9994, 5.5033],
    ["Seedance 1.5 Pro", 0.7409, 0.8646, 0.7398, 3.3239, 80.8029, 0.2059, 3.4093, 4.1618, 69.4430, 4.7707],
]