from __future__ import print_function import volcenginesdkcore import volcenginesdkmlplatform20240701 from volcenginesdkcore.rest import ApiException import datetime import os os.environ['no_proxy'] = 'volces.com,volcengineapi.com' if __name__ == '__main__': configuration = volcenginesdkcore.Configuration() configuration.ak = "AKLTN2FkNjljZTc5ZTc0NGExZGExZjMwNDMxNDdiYjQ3ZDY" configuration.sk = "T0dNeU9UUmpPRGcyWkRVM05HVXlOamxsTVdJeE1XVTJaalJoT1RaaU9HVQ==" configuration.region = "cn-beijing2" timestamp = datetime.datetime.now().strftime("%Y%m%d_%H%M%S") log_file_eval=f"/map-vepfs/haozhe/BiDIT/qqllm/dection_{timestamp}.log" bash_command = f''' # cd /map-vepfs/haozhe/BiDIT/qqllm/HBLLM && # source activate /map-vepfs/haozhe/BiDIT/qqllm/dataset_env && # sh /map-vepfs/haozhe/BiDIT/qqllm/HBLLM/run.sh # cd /map-vepfs/haozhe/BiDIT/qqllm/BiLLM && # source activate /map-vepfs/haozhe/BiDIT/qqllm/dataset_env && # bash /map-vepfs/haozhe/BiDIT/qqllm/OBR/FlatQuant/run_Qwen2.5-7B/run_obr_flatquant_qwen25_7b_w4a4kv4_s50.sh # cd /map-vepfs/haozhe/BiDIT/qqllm && # source activate /map-vepfs/haozhe/BiDIT/qqllm/dataset_env && # bash /map-vepfs/haozhe/BiDIT/qqllm/eval_scripts/eval_standard_qwen7b.sh cd /map-vepfs/haozhe/BiDIT/qqllm/WANDA_gptq_shift && source activate /map-vepfs/haozhe/BiDIT/qqllm/dataset_env && bash /map-vepfs/haozhe/BiDIT/qqllm/WANDA_gptq_shift/QuaRot/run_final_0406retry_llama31_70b_quarot_no_rot_sparsegpt_gptq_baseline_w4a16kv16_c4_s50_ns128_asym.sh ''' card_type = "ml.pni2l.7xlarge" jobname = f'TR-DQ_{timestamp}' resource_queue_id = "q-20241024095431-86z6j" vepfs_id = "vepfs-cnbj26c39866e9ec1" vepfs_host_path = f"/mnt/{vepfs_id}" volcenginesdkcore.Configuration.set_default(configuration) api_instance = volcenginesdkmlplatform20240701.MLPLATFORM20240701Api() def create_job(): req_resource = volcenginesdkmlplatform20240701.ResourceForCreateJobInput( instance_type_id=card_type, type="Preset", zone_id="cn-beijing2-a", ) req_roles = volcenginesdkmlplatform20240701.RoleForCreateJobInput( name="worker", replicas=1, resource=req_resource, ) req_resource_config = volcenginesdkmlplatform20240701.ResourceConfigForCreateJobInput( priority=2, resource_queue_id=resource_queue_id, roles=[req_roles], ) req_image = volcenginesdkmlplatform20240701.ImageForCreateJobInput( type="Prebuild", url="vemlp-cn-beijing2.cr.volces.com/preset-images/ray:2.12.0-cuda-121-py310", ) req_runtime_config = volcenginesdkmlplatform20240701.RuntimeConfigForCreateJobInput( command=bash_command, framework="PyTorch", image=req_image, ) req_vepfs = volcenginesdkmlplatform20240701.VepfsForCreateJobInput( host_path=vepfs_host_path, id=vepfs_id, ) req_config = volcenginesdkmlplatform20240701.ConfigForCreateJobInput( vepfs=req_vepfs, ) req_storages = volcenginesdkmlplatform20240701.StorageForCreateJobInput( config=req_config, mount_path="/map-vepfs", type="Vepfs", ) req_storage_config = volcenginesdkmlplatform20240701.StorageConfigForCreateJobInput( storages=[req_storages], ) create_job_request = volcenginesdkmlplatform20240701.CreateJobRequest( dry_run=False, name=jobname, resource_config=req_resource_config, runtime_config=req_runtime_config, storage_config=req_storage_config, ) try: response = api_instance.create_job(create_job_request) job_id = response.id print(f"✅ 作业提交成功") print(f" 作业ID: {job_id}") print(f" 作业名称: {jobname}") print(f" 等待5-10分钟启动...") return job_id except ApiException as e: print(f"❌ 提交失败: {e}") return None created_job_id = create_job()