| from mmengine.config import read_base | |
| with read_base(): | |
| from opencompass.configs.datasets.eese.eese_judge_gen import \ | |
| eese_datasets | |
| # 选择一个感兴趣的模型 | |
| from opencompass.configs.models.openai.gpt_4o_2024_05_13 import \ | |
| models as gpt4 | |
| from opencompass.models import OpenAISDK | |
| # 配置评判模型 | |
| api_meta_template = dict(round=[ | |
| dict(role='HUMAN', api_role='HUMAN'), | |
| dict(role='BOT', api_role='BOT', generate=True), | |
| ], ) | |
| judge_cfg = dict( | |
| abbr='model-judge', | |
| type=OpenAISDK, | |
| path='model-name', | |
| key='your-api-key', | |
| openai_api_base=['openai-url'], | |
| meta_template=api_meta_template, | |
| query_per_second=16, | |
| batch_size=1, | |
| temperature=0.001, | |
| tokenizer_path='gpt-4o', | |
| verbose=True, | |
| max_out_len=16384, | |
| max_seq_len=49152, | |
| ) | |
| datasets = eese_datasets | |
| models = gpt4 | |
| # 为每个数据集增加judge_cfg信息,而不是覆盖 | |
| for dataset in datasets: | |
| if 'eval_cfg' in dataset and 'evaluator' in dataset['eval_cfg']: | |
| # 获取现有的judge_cfg,如果不存在则创建空字典 | |
| existing_judge_cfg = dataset['eval_cfg']['evaluator'].get('judge_cfg', {}) | |
| # 更新现有的judge_cfg,保留原有配置并添加新配置 | |
| existing_judge_cfg.update(judge_cfg) | |
| # 将更新后的配置设置回去 | |
| dataset['eval_cfg']['evaluator']['judge_cfg'] = existing_judge_cfg | |