text2text / verl /utils /ray_utils.py
braindeck
Initial commit
bcdf9fa
# Copyright 2024 Bytedance Ltd. and/or its affiliates
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""
Contains commonly used utilities for ray
"""
import concurrent.futures
import ray
def parallel_put(data_list, max_workers=None):
def put_data(index, data):
return index, ray.put(data)
if max_workers is None:
max_workers = min(len(data_list), 16)
with concurrent.futures.ThreadPoolExecutor(max_workers=max_workers) as executor:
data_list_f = [executor.submit(put_data, i, data) for i, data in enumerate(data_list)]
res_lst = []
for future in concurrent.futures.as_completed(data_list_f):
res_lst.append(future.result())
# reorder based on index
output = [None for _ in range(len(data_list))]
for res in res_lst:
index, data_ref = res
output[index] = data_ref
return output