| LICENSE |
| README.md |
| pyproject.toml |
| setup.py |
| ./search_r1/__init__.py |
| ./search_r1/llm_agent/__init__.py |
| ./search_r1/llm_agent/generation.py |
| ./search_r1/llm_agent/tensor_helper.py |
| ./verl/__init__.py |
| ./verl/protocol.py |
| ./verl/models/__init__.py |
| ./verl/models/registry.py |
| ./verl/models/weight_loader_registry.py |
| ./verl/models/llama/__init__.py |
| ./verl/models/llama/megatron/__init__.py |
| ./verl/models/llama/megatron/modeling_llama_megatron.py |
| ./verl/models/llama/megatron/checkpoint_utils/__init__.py |
| ./verl/models/llama/megatron/checkpoint_utils/llama_loader.py |
| ./verl/models/llama/megatron/checkpoint_utils/llama_saver.py |
| ./verl/models/llama/megatron/layers/__init__.py |
| ./verl/models/llama/megatron/layers/parallel_attention.py |
| ./verl/models/llama/megatron/layers/parallel_decoder.py |
| ./verl/models/llama/megatron/layers/parallel_linear.py |
| ./verl/models/llama/megatron/layers/parallel_mlp.py |
| ./verl/models/llama/megatron/layers/parallel_rmsnorm.py |
| ./verl/models/transformers/__init__.py |
| ./verl/models/transformers/llama.py |
| ./verl/models/transformers/monkey_patch.py |
| ./verl/models/transformers/qwen2.py |
| ./verl/single_controller/__init__.py |
| ./verl/single_controller/base/__init__.py |
| ./verl/single_controller/base/decorator.py |
| ./verl/single_controller/base/worker.py |
| ./verl/single_controller/base/worker_group.py |
| ./verl/single_controller/base/megatron/__init__.py |
| ./verl/single_controller/base/megatron/worker.py |
| ./verl/single_controller/base/megatron/worker_group.py |
| ./verl/single_controller/base/register_center/__init__.py |
| ./verl/single_controller/base/register_center/ray.py |
| ./verl/single_controller/ray/__init__.py |
| ./verl/single_controller/ray/base.py |
| ./verl/single_controller/ray/megatron.py |
| ./verl/third_party/__init__.py |
| ./verl/third_party/vllm/__init__.py |
| ./verl/third_party/vllm/vllm_v_0_3_1/__init__.py |
| ./verl/third_party/vllm/vllm_v_0_3_1/arg_utils.py |
| ./verl/third_party/vllm/vllm_v_0_3_1/config.py |
| ./verl/third_party/vllm/vllm_v_0_3_1/llm.py |
| ./verl/third_party/vllm/vllm_v_0_3_1/llm_engine_sp.py |
| ./verl/third_party/vllm/vllm_v_0_3_1/model_loader.py |
| ./verl/third_party/vllm/vllm_v_0_3_1/model_runner.py |
| ./verl/third_party/vllm/vllm_v_0_3_1/parallel_state.py |
| ./verl/third_party/vllm/vllm_v_0_3_1/tokenizer.py |
| ./verl/third_party/vllm/vllm_v_0_3_1/weight_loaders.py |
| ./verl/third_party/vllm/vllm_v_0_3_1/worker.py |
| ./verl/third_party/vllm/vllm_v_0_4_2/__init__.py |
| ./verl/third_party/vllm/vllm_v_0_4_2/arg_utils.py |
| ./verl/third_party/vllm/vllm_v_0_4_2/config.py |
| ./verl/third_party/vllm/vllm_v_0_4_2/dtensor_weight_loaders.py |
| ./verl/third_party/vllm/vllm_v_0_4_2/hf_weight_loader.py |
| ./verl/third_party/vllm/vllm_v_0_4_2/llm.py |
| ./verl/third_party/vllm/vllm_v_0_4_2/llm_engine_sp.py |
| ./verl/third_party/vllm/vllm_v_0_4_2/megatron_weight_loaders.py |
| ./verl/third_party/vllm/vllm_v_0_4_2/model_loader.py |
| ./verl/third_party/vllm/vllm_v_0_4_2/model_runner.py |
| ./verl/third_party/vllm/vllm_v_0_4_2/parallel_state.py |
| ./verl/third_party/vllm/vllm_v_0_4_2/spmd_gpu_executor.py |
| ./verl/third_party/vllm/vllm_v_0_4_2/tokenizer.py |
| ./verl/third_party/vllm/vllm_v_0_4_2/worker.py |
| ./verl/third_party/vllm/vllm_v_0_5_4/__init__.py |
| ./verl/third_party/vllm/vllm_v_0_5_4/arg_utils.py |
| ./verl/third_party/vllm/vllm_v_0_5_4/config.py |
| ./verl/third_party/vllm/vllm_v_0_5_4/dtensor_weight_loaders.py |
| ./verl/third_party/vllm/vllm_v_0_5_4/hf_weight_loader.py |
| ./verl/third_party/vllm/vllm_v_0_5_4/llm.py |
| ./verl/third_party/vllm/vllm_v_0_5_4/llm_engine_sp.py |
| ./verl/third_party/vllm/vllm_v_0_5_4/megatron_weight_loaders.py |
| ./verl/third_party/vllm/vllm_v_0_5_4/model_loader.py |
| ./verl/third_party/vllm/vllm_v_0_5_4/model_runner.py |
| ./verl/third_party/vllm/vllm_v_0_5_4/parallel_state.py |
| ./verl/third_party/vllm/vllm_v_0_5_4/spmd_gpu_executor.py |
| ./verl/third_party/vllm/vllm_v_0_5_4/tokenizer.py |
| ./verl/third_party/vllm/vllm_v_0_5_4/worker.py |
| ./verl/third_party/vllm/vllm_v_0_6_3/__init__.py |
| ./verl/third_party/vllm/vllm_v_0_6_3/arg_utils.py |
| ./verl/third_party/vllm/vllm_v_0_6_3/config.py |
| ./verl/third_party/vllm/vllm_v_0_6_3/dtensor_weight_loaders.py |
| ./verl/third_party/vllm/vllm_v_0_6_3/hf_weight_loader.py |
| ./verl/third_party/vllm/vllm_v_0_6_3/llm.py |
| ./verl/third_party/vllm/vllm_v_0_6_3/llm_engine_sp.py |
| ./verl/third_party/vllm/vllm_v_0_6_3/megatron_weight_loaders.py |
| ./verl/third_party/vllm/vllm_v_0_6_3/model_loader.py |
| ./verl/third_party/vllm/vllm_v_0_6_3/model_runner.py |
| ./verl/third_party/vllm/vllm_v_0_6_3/parallel_state.py |
| ./verl/third_party/vllm/vllm_v_0_6_3/spmd_gpu_executor.py |
| ./verl/third_party/vllm/vllm_v_0_6_3/tokenizer.py |
| ./verl/third_party/vllm/vllm_v_0_6_3/worker.py |
| ./verl/trainer/__init__.py |
| ./verl/trainer/fsdp_sft_trainer.py |
| ./verl/trainer/main_eval.py |
| ./verl/trainer/main_generation.py |
| ./verl/trainer/main_ppo.py |
| ./verl/trainer/main_ppo_format.py |
| ./verl/trainer/config/evaluation.yaml |
| ./verl/trainer/config/generation.yaml |
| ./verl/trainer/config/ppo_megatron_trainer.yaml |
| ./verl/trainer/config/ppo_trainer.yaml |
| ./verl/trainer/config/sft_trainer.yaml |
| ./verl/trainer/ppo/__init__.py |
| ./verl/trainer/ppo/core_algos.py |
| ./verl/trainer/ppo/ray_trainer.py |
| ./verl/utils/__init__.py |
| ./verl/utils/config.py |
| ./verl/utils/distributed.py |
| ./verl/utils/flops_counter.py |
| ./verl/utils/fs.py |
| ./verl/utils/fsdp_utils.py |
| ./verl/utils/hdfs_io.py |
| ./verl/utils/import_utils.py |
| ./verl/utils/logging_utils.py |
| ./verl/utils/megatron_utils.py |
| ./verl/utils/memory_buffer.py |
| ./verl/utils/model.py |
| ./verl/utils/py_functional.py |
| ./verl/utils/ray_utils.py |
| ./verl/utils/seqlen_balancing.py |
| ./verl/utils/tokenizer.py |
| ./verl/utils/torch_dtypes.py |
| ./verl/utils/torch_functional.py |
| ./verl/utils/tracking.py |
| ./verl/utils/ulysses.py |
| ./verl/utils/dataset/__init__.py |
| ./verl/utils/dataset/rl_dataset.py |
| ./verl/utils/dataset/rm_dataset.py |
| ./verl/utils/debug/__init__.py |
| ./verl/utils/debug/performance.py |
| ./verl/utils/debug/trajectory_tracker.py |
| ./verl/utils/logger/__init__.py |
| ./verl/utils/logger/aggregate_logger.py |
| ./verl/utils/megatron/__init__.py |
| ./verl/utils/megatron/memory.py |
| ./verl/utils/megatron/optimizer.py |
| ./verl/utils/megatron/optimizer_config.py |
| ./verl/utils/megatron/pipeline_parallel.py |
| ./verl/utils/megatron/sequence_parallel.py |
| ./verl/utils/megatron/tensor_parallel.py |
| ./verl/utils/rendezvous/__init__.py |
| ./verl/utils/rendezvous/ray_backend.py |
| ./verl/utils/reward_score/__init__.py |
| ./verl/utils/reward_score/countdown.py |
| ./verl/utils/reward_score/gsm8k.py |
| ./verl/utils/reward_score/math.py |
| ./verl/utils/reward_score/multiply.py |
| ./verl/utils/reward_score/qa_em.py |
| ./verl/utils/reward_score/qa_em_format.py |
| ./verl/version/version |
| ./verl/workers/__init__.py |
| ./verl/workers/fsdp_workers.py |
| ./verl/workers/megatron_workers.py |
| ./verl/workers/actor/__init__.py |
| ./verl/workers/actor/base.py |
| ./verl/workers/actor/dp_actor.py |
| ./verl/workers/actor/megatron_actor.py |
| ./verl/workers/critic/__init__.py |
| ./verl/workers/critic/base.py |
| ./verl/workers/critic/dp_critic.py |
| ./verl/workers/critic/megatron_critic.py |
| ./verl/workers/reward_model/__init__.py |
| ./verl/workers/reward_model/base.py |
| ./verl/workers/reward_model/megatron/__init__.py |
| ./verl/workers/reward_model/megatron/reward_model.py |
| ./verl/workers/rollout/__init__.py |
| ./verl/workers/rollout/base.py |
| ./verl/workers/rollout/hf_rollout.py |
| ./verl/workers/rollout/tokenizer.py |
| ./verl/workers/rollout/naive/__init__.py |
| ./verl/workers/rollout/naive/naive_rollout.py |
| ./verl/workers/rollout/vllm_rollout/__init__.py |
| ./verl/workers/rollout/vllm_rollout/vllm_rollout.py |
| ./verl/workers/sharding_manager/__init__.py |
| ./verl/workers/sharding_manager/base.py |
| ./verl/workers/sharding_manager/fsdp_ulysses.py |
| ./verl/workers/sharding_manager/fsdp_vllm.py |
| ./verl/workers/sharding_manager/megatron_vllm.py |
| verl.egg-info/PKG-INFO |
| verl.egg-info/SOURCES.txt |
| verl.egg-info/dependency_links.txt |
| verl.egg-info/requires.txt |
| verl.egg-info/top_level.txt |
| verl/version/version |