add reward_mapping into reward function and add permission
Showing
.github/dependabot.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/checkpoints.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/dataset.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/e2e_ascend.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/e2e_digit_completion.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/e2e_digit_completion_fire.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/e2e_eval_aime24.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/e2e_grpo.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/e2e_gsm8k.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/e2e_gsm8k_dapo.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/e2e_gsm8k_megatron.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/e2e_gsm8k_prime.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/e2e_lora.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/e2e_sft.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/e2e_sglang_gsm8k.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/e2e_vlm_geo3k.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/model.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/pylint.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/ray_test.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/sandbox.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/sanity.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/scorecard.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/secrets_scan.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/vllm.yml
100644 → 100755
File mode changed from 100644 to 100755
.github/workflows/yapf_format.yml
100644 → 100755
File mode changed from 100644 to 100755
.gitignore
100644 → 100755
File mode changed from 100644 to 100755
.readthedocs.yaml
100644 → 100755
File mode changed from 100644 to 100755
.style.yapf
100644 → 100755
File mode changed from 100644 to 100755
LICENSE
100644 → 100755
File mode changed from 100644 to 100755
Notice.txt
100644 → 100755
File mode changed from 100644 to 100755
README.md
100644 → 100755
File mode changed from 100644 to 100755
docker/Dockerfile.megatron
100644 → 100755
File mode changed from 100644 to 100755
docker/Dockerfile.ngc.vllm
100644 → 100755
File mode changed from 100644 to 100755
docker/Dockerfile.ngc.vllm0.8
100644 → 100755
File mode changed from 100644 to 100755
docker/Dockerfile.ngc.vllm0.8.sagemaker
100644 → 100755
File mode changed from 100644 to 100755
docker/Dockerfile.rocm
100644 → 100755
File mode changed from 100644 to 100755
docker/Dockerfile.vemlp.vllm.te
100644 → 100755
File mode changed from 100644 to 100755
docker/Dockfile.ngc.vllm0.8
100644 → 100755
File mode changed from 100644 to 100755
docs/Makefile
100644 → 100755
File mode changed from 100644 to 100755
docs/README.md
100644 → 100755
File mode changed from 100644 to 100755
docs/README_vllm0.7.md
100644 → 100755
File mode changed from 100644 to 100755
docs/README_vllm0.8.md
100644 → 100755
File mode changed from 100644 to 100755
docs/_static/logo.png
100644 → 100755
File mode changed from 100644 to 100755
docs/advance/checkpoint.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/advance/dpo_extension.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/advance/fsdp_extension.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/advance/megatron_extension.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/advance/placement.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/amd_tutorial/amd_build_dockerfile.md
100644 → 100755
File mode changed from 100644 to 100755
docs/amd_tutorial/amd_build_dockerfile_page.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/amd_tutorial/amd_existing_docker.md
100644 → 100755
File mode changed from 100644 to 100755
docs/conf.py
100644 → 100755
File mode changed from 100644 to 100755
docs/data.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/examples/config.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/examples/gsm8k_example.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/examples/ppo_code_architecture.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/experiment/ppo.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/faq/faq.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/hybrid_flow.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/index.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/perf/perf_tuning.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/preparation/prepare_data.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/preparation/reward_function.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/requirements-docs.txt
100644 → 100755
File mode changed from 100644 to 100755
docs/start/install.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/start/multinode.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/start/quickstart.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/workers/fsdp_workers.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/workers/megatron_workers.rst
100644 → 100755
File mode changed from 100644 to 100755
docs/workers/ray_trainer.rst
100644 → 100755
File mode changed from 100644 to 100755
examples/checkpoint/run_deepseek_megatron_ckpt.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/checkpoint/run_qwen_megatron_ckpt.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/data_preprocess/codev.py
100644 → 100755
File mode changed from 100644 to 100755
examples/data_preprocess/full_hh_rlhf.py
100644 → 100755
File mode changed from 100644 to 100755
examples/data_preprocess/geo3k.py
100644 → 100755
File mode changed from 100644 to 100755
examples/data_preprocess/gsm8k.py
100644 → 100755
File mode changed from 100644 to 100755
examples/data_preprocess/hellaswag.py
100644 → 100755
File mode changed from 100644 to 100755
examples/data_preprocess/kk.py
100644 → 100755
File mode changed from 100644 to 100755
examples/data_preprocess/math_dataset.py
100644 → 100755
File mode changed from 100644 to 100755
examples/generation/run_deepseek7b_mutli_node.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/generation/run_deepseek_v2_lite_math.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/grpo_trainer/run_deepseek7b_llm.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/grpo_trainer/run_deepseek7b_llm_math.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/grpo_trainer/run_deepseek7b_llm_math_megatron.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/grpo_trainer/run_deepseek7b_llm_megatron.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/grpo_trainer/run_deepseek7b_llm_seq_balance.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/grpo_trainer/run_qwen2-7b.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/grpo_trainer/run_qwen2-7b_math.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/grpo_trainer/run_qwen2-7b_math_megatron.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/grpo_trainer/run_qwen2-7b_megatron.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/grpo_trainer/run_qwen2-7b_seq_balance.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/grpo_trainer/run_qwen2_5_vl-7b.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/ppo_trainer/run_deepseek7b_llm.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/ppo_trainer/run_deepseek7b_llm_modelscope.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/ppo_trainer/run_deepseek7b_llm_sp2.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/ppo_trainer/run_deepseek_full_hh_rlhf.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/ppo_trainer/run_deepseek_math_gsm8k_megatron.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/ppo_trainer/run_deepseek_megatron.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/ppo_trainer/run_gemma.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/ppo_trainer/run_qwen2-7b_math_gsm8k_megatron.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/ppo_trainer/run_qwen2-7b_megatron.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/ppo_trainer/run_qwen2-7b_rm.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/ppo_trainer/run_qwen2-7b_rm_seq_balance.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/ppo_trainer/run_qwen2-7b_seq_balance.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/ppo_trainer/run_qwen2.5-32b.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/ppo_trainer/verl_getting_started.ipynb
100644 → 100755
File mode changed from 100644 to 100755
examples/ray/tutorial.ipynb
100644 → 100755
File mode changed from 100644 to 100755
examples/remax_trainer/run_qwen2.5-3b_seq_balance.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/remax_trainer/run_qwen2.5-7b_seq_balance.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/rloo_trainer/run_qwen2-7b.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/sft/gsm8k/run_deepseek_6b7.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/sft/gsm8k/run_gemma_2b.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/sft/gsm8k/run_gemma_7b.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/split_placement/README.md
100644 → 100755
File mode changed from 100644 to 100755
examples/split_placement/config/ppo_trainer_split.yaml
100644 → 100755
File mode changed from 100644 to 100755
examples/split_placement/main_ppo_split.py
100644 → 100755
File mode changed from 100644 to 100755
examples/split_placement/run_deepseek7b_llm.sh
100644 → 100755
File mode changed from 100644 to 100755
examples/split_placement/split_monkey_patch.py
100644 → 100755
File mode changed from 100644 to 100755
patches/megatron_v4.patch
100644 → 100755
File mode changed from 100644 to 100755
plot_and_analyze/extract_ve2_result.py
100644 → 100755
File mode changed from 100644 to 100755
plot_and_analyze/plot.py
100644 → 100755
File mode changed from 100644 to 100755
pyproject.toml
100644 → 100755
File mode changed from 100644 to 100755
recipe/dapo/README.md
100644 → 100755
File mode changed from 100644 to 100755
recipe/dapo/dapo_7b_test.sh
100644 → 100755
This diff is collapsed.
Click to expand it.
recipe/dapo/prepare_dapo_data.sh
100644 → 100755
File mode changed from 100644 to 100755
recipe/dapo/run_dapo_codev_7b_16k.sh
100644 → 100755
File mode changed from 100644 to 100755
This diff is collapsed.
Click to expand it.
This diff is collapsed.
Click to expand it.
recipe/dapo/run_dapo_codev_7b_16k_err_l1.0_continuous_reward.sh
100644 → 100755
This diff is collapsed.
Click to expand it.
File mode changed from 100644 to 100755
recipe/dapo/run_dapo_codev_7b_3.4k.sh
100644 → 100755
File mode changed from 100644 to 100755
recipe/dapo/run_dapo_codev_7b_8k.sh
100644 → 100755
File mode changed from 100644 to 100755
recipe/dapo/run_dapo_codev_7b_8k_terminal.sh
100644 → 100755
File mode changed from 100644 to 100755
recipe/dapo/run_dapo_early_qwen2.5_32b.sh
100644 → 100755
File mode changed from 100644 to 100755
recipe/dapo/run_dapo_qwen2.5_32b.sh
100644 → 100755
File mode changed from 100644 to 100755
recipe/dapo/src/config/dapo_trainer.yaml
100644 → 100755
File mode changed from 100644 to 100755
recipe/dapo/src/dapo_ray_trainer.py
100644 → 100755
File mode changed from 100644 to 100755
recipe/dapo/src/main_dapo.py
100644 → 100755
File mode changed from 100644 to 100755
recipe/dapo/test_dapo_7b.sh
100644 → 100755
File mode changed from 100644 to 100755
recipe/prime/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
recipe/prime/config/prime_trainer.yaml
100644 → 100755
File mode changed from 100644 to 100755
recipe/prime/main_prime.py
100644 → 100755
File mode changed from 100644 to 100755
recipe/prime/prime_core_algos.py
100644 → 100755
File mode changed from 100644 to 100755
recipe/prime/prime_dp_rm.py
100644 → 100755
File mode changed from 100644 to 100755
recipe/prime/prime_fsdp_workers.py
100644 → 100755
File mode changed from 100644 to 100755
recipe/prime/prime_ray_trainer.py
100644 → 100755
File mode changed from 100644 to 100755
recipe/prime/run_prime_qwen.sh
100644 → 100755
File mode changed from 100644 to 100755
recipe/r1/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
recipe/r1/config/evaluation.yaml
100644 → 100755
File mode changed from 100644 to 100755
recipe/r1/data_process.py
100644 → 100755
File mode changed from 100644 to 100755
recipe/r1/main_eval.py
100644 → 100755
File mode changed from 100644 to 100755
recipe/r1/reward_score.py
100644 → 100755
File mode changed from 100644 to 100755
recipe/r1/run_r1_distill_qwen.sh
100644 → 100755
File mode changed from 100644 to 100755
recipe/r1/tasks/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
recipe/r1/tasks/gpqa.py
100644 → 100755
File mode changed from 100644 to 100755
recipe/r1/tasks/livecodebench.py
100644 → 100755
File mode changed from 100644 to 100755
recipe/r1/tasks/math.py
100644 → 100755
File mode changed from 100644 to 100755
requirements.txt
100644 → 100755
File mode changed from 100644 to 100755
requirements_sglang.txt
100644 → 100755
File mode changed from 100644 to 100755
results/dapo_7b_test/dapo_7b_test.sh
0 → 100755
This diff is collapsed.
Click to expand it.
This diff is collapsed.
Click to expand it.
scripts/model_merger.py
100644 → 100755
File mode changed from 100644 to 100755
setup.py
100644 → 100755
File mode changed from 100644 to 100755
slurm_submit.py
100644 → 100755
This diff is collapsed.
Click to expand it.
tests/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
tests/checkpoint/run_deepseek_megatron_ckpt.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/checkpoint/run_qwen_megatron_ckpt.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/checkpoint/test_fsdp_ckpt.py
100644 → 100755
File mode changed from 100644 to 100755
tests/distributed/run_all.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/distributed/test_tensor_dict.py
100644 → 100755
File mode changed from 100644 to 100755
tests/distro/requirements.py
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/arithmetic_sequence/data/create_dataset.py
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/arithmetic_sequence/model/config.json
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/arithmetic_sequence/model/create_model_tokenizer.py
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/arithmetic_sequence/model/generation_config.json
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/arithmetic_sequence/model/model.safetensors
100644 → 100755
This diff is collapsed.
Click to expand it.
tests/e2e/arithmetic_sequence/model/tokenizer_config.json
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/arithmetic_sequence/rl/README.md
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/arithmetic_sequence/rl/main_trainer.py
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/check_custom_rwd_fn.py
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/check_results.py
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/envs/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/envs/digit_completion/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/envs/digit_completion/task.py
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/envs/digit_completion/tokenizer.py
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_deepseek_grpo.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_deepseek_grpo_megatron.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_deepseek_megatron.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_deepseek_megatron_parallelism.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_qwen2vl_geo3k_function_rm.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_qwen_grpo.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_qwen_grpo_megatron.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_qwen_gsm8k_custom_function_rm.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_qwen_gsm8k_dapo.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_qwen_gsm8k_function_rm.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_qwen_gsm8k_function_rm_both_kl.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_qwen_gsm8k_function_rm_grpo.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_qwen_gsm8k_function_rm_no_rmpad.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_qwen_gsm8k_function_rm_remax.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_qwen_gsm8k_model_rm.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_qwen_gsm8k_model_rm_liger_kernel.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_qwen_gsm8k_model_rm_no_rmpad.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_qwen_gsm8k_model_rm_seq_balance.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_qwen_gsm8k_model_rm_ulysses.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_qwen_gsm8k_prime.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_qwen_megatron.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_qwen_megatron_parallelism.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_r1_distill_qwen_aime24_eval.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_ray_trainer.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_ray_trainer_fire_sampling.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/e2e/run_ray_trainer_rmpad.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/gpu_utility/test_memory_buffers.py
100644 → 100755
File mode changed from 100644 to 100755
tests/gpu_utility/test_ops.py
100644 → 100755
File mode changed from 100644 to 100755
tests/gpu_utility/test_torch_functional.py
100644 → 100755
File mode changed from 100644 to 100755
tests/kill_github_tests.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/model/test_transformer.py
100644 → 100755
File mode changed from 100644 to 100755
tests/model/test_transformers_ulysses.py
100644 → 100755
File mode changed from 100644 to 100755
tests/my_test.py
100644 → 100755
File mode changed from 100644 to 100755
tests/ray/check_worker_alive/main.py
100644 → 100755
File mode changed from 100644 to 100755
tests/ray/detached_worker/README.md
100644 → 100755
File mode changed from 100644 to 100755
tests/ray/detached_worker/client.py
100644 → 100755
File mode changed from 100644 to 100755
tests/ray/detached_worker/run.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/ray/detached_worker/server.py
100644 → 100755
File mode changed from 100644 to 100755
tests/ray/test_check_worker_alive.py
100644 → 100755
File mode changed from 100644 to 100755
tests/ray/test_colocated_workers.py
100644 → 100755
File mode changed from 100644 to 100755
tests/ray/test_data_transfer.py
100644 → 100755
File mode changed from 100644 to 100755
tests/ray/test_driverfunc_to_worker.py
100644 → 100755
File mode changed from 100644 to 100755
tests/ray/test_high_level_scheduling_api.py
100644 → 100755
File mode changed from 100644 to 100755
tests/ray/test_ray_local_envs.py
100644 → 100755
File mode changed from 100644 to 100755
tests/ray/test_rvdz.py
100644 → 100755
File mode changed from 100644 to 100755
tests/ray/test_worker_group_basics.py
100644 → 100755
File mode changed from 100644 to 100755
tests/ray/test_worker_group_torch.py
100644 → 100755
File mode changed from 100644 to 100755
tests/rollout/run_fsdp_vllm.py
100644 → 100755
File mode changed from 100644 to 100755
tests/rollout/test_sglang_spmd.py
100644 → 100755
File mode changed from 100644 to 100755
tests/rollout/test_vllm_hf_loader.py
100644 → 100755
File mode changed from 100644 to 100755
tests/rollout/test_vllm_spmd.py
100644 → 100755
File mode changed from 100644 to 100755
tests/sandbox/test_sandbox.py
100644 → 100755
File mode changed from 100644 to 100755
tests/sanity/check_license.py
100644 → 100755
File mode changed from 100644 to 100755
tests/sanity/test_import.py
100644 → 100755
File mode changed from 100644 to 100755
tests/sft/run_sft.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/sft/run_sft_qwen05_peft.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/sft/run_sft_qwen05_sp2_liger.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/sft/run_sft_sp_loss_match.sh
100644 → 100755
File mode changed from 100644 to 100755
tests/sft/test_sp_loss_match.py
100644 → 100755
File mode changed from 100644 to 100755
tests/utility/test_tensor_dict_utilities.py
100644 → 100755
File mode changed from 100644 to 100755
tests/verl/utils/dataset/test_rl_dataset.py
100644 → 100755
File mode changed from 100644 to 100755
tests/verl/utils/dataset/test_rm_dataset.py
100644 → 100755
File mode changed from 100644 to 100755
tests/verl/utils/dataset/test_sft_dataset.py
100644 → 100755
File mode changed from 100644 to 100755
verl/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/README.md
100644 → 100755
File mode changed from 100644 to 100755
verl/models/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/llama/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/llama/megatron/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/llama/megatron/checkpoint_utils/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/llama/megatron/checkpoint_utils/llama_loader.py
100644 → 100755
File mode changed from 100644 to 100755
File mode changed from 100644 to 100755
verl/models/llama/megatron/checkpoint_utils/llama_saver.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/llama/megatron/layers/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/llama/megatron/layers/parallel_attention.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/llama/megatron/layers/parallel_decoder.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/llama/megatron/layers/parallel_linear.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/llama/megatron/layers/parallel_mlp.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/llama/megatron/layers/parallel_rmsnorm.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/llama/megatron/modeling_llama_megatron.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/qwen2/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/qwen2/megatron/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/qwen2/megatron/checkpoint_utils/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/qwen2/megatron/checkpoint_utils/qwen2_loader.py
100644 → 100755
File mode changed from 100644 to 100755
File mode changed from 100644 to 100755
verl/models/qwen2/megatron/checkpoint_utils/qwen2_saver.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/qwen2/megatron/layers/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/qwen2/megatron/layers/parallel_attention.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/qwen2/megatron/layers/parallel_decoder.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/qwen2/megatron/layers/parallel_linear.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/qwen2/megatron/layers/parallel_mlp.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/qwen2/megatron/layers/parallel_rmsnorm.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/qwen2/megatron/modeling_qwen2_megatron.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/registry.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/transformers/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/transformers/llama.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/transformers/monkey_patch.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/transformers/qwen2.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/transformers/qwen2_vl.py
100644 → 100755
File mode changed from 100644 to 100755
verl/models/weight_loader_registry.py
100644 → 100755
File mode changed from 100644 to 100755
verl/protocol.py
100644 → 100755
File mode changed from 100644 to 100755
verl/single_controller/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/single_controller/base/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/single_controller/base/decorator.py
100644 → 100755
File mode changed from 100644 to 100755
verl/single_controller/base/megatron/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/single_controller/base/megatron/worker.py
100644 → 100755
File mode changed from 100644 to 100755
verl/single_controller/base/megatron/worker_group.py
100644 → 100755
File mode changed from 100644 to 100755
verl/single_controller/base/register_center/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/single_controller/base/register_center/ray.py
100644 → 100755
File mode changed from 100644 to 100755
verl/single_controller/base/worker.py
100644 → 100755
File mode changed from 100644 to 100755
verl/single_controller/base/worker_group.py
100644 → 100755
File mode changed from 100644 to 100755
verl/single_controller/ray/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/single_controller/ray/base.py
100644 → 100755
File mode changed from 100644 to 100755
verl/single_controller/ray/megatron.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/sglang/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/sglang/parallel_state.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_3_1/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_3_1/arg_utils.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_3_1/config.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_3_1/llm.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_3_1/llm_engine_sp.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_3_1/model_loader.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_3_1/model_runner.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_3_1/parallel_state.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_3_1/tokenizer.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_3_1/weight_loaders.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_3_1/worker.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_4_2/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_4_2/arg_utils.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_4_2/config.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_4_2/dtensor_weight_loaders.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_4_2/hf_weight_loader.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_4_2/llm.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_4_2/llm_engine_sp.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_4_2/megatron_weight_loaders.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_4_2/model_loader.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_4_2/model_runner.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_4_2/parallel_state.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_4_2/spmd_gpu_executor.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_4_2/tokenizer.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_4_2/worker.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_5_4/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_5_4/arg_utils.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_5_4/config.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_5_4/dtensor_weight_loaders.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_5_4/hf_weight_loader.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_5_4/llm.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_5_4/llm_engine_sp.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_5_4/megatron_weight_loaders.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_5_4/model_loader.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_5_4/model_runner.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_5_4/parallel_state.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_5_4/spmd_gpu_executor.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_5_4/tokenizer.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_5_4/worker.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_6_3/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_6_3/arg_utils.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_6_3/config.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_6_3/dtensor_weight_loaders.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_6_3/hf_weight_loader.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_6_3/llm.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_6_3/llm_engine_sp.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_6_3/megatron_weight_loaders.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_6_3/model_loader.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_6_3/model_runner.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_6_3/parallel_state.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_6_3/spmd_gpu_executor.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_6_3/tokenizer.py
100644 → 100755
File mode changed from 100644 to 100755
verl/third_party/vllm/vllm_v_0_6_3/worker.py
100644 → 100755
File mode changed from 100644 to 100755
verl/trainer/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/trainer/config/evaluation.yaml
100644 → 100755
File mode changed from 100644 to 100755
verl/trainer/config/generation.yaml
100644 → 100755
File mode changed from 100644 to 100755
verl/trainer/config/ppo_megatron_trainer.yaml
100644 → 100755
File mode changed from 100644 to 100755
verl/trainer/config/ppo_trainer.yaml
100644 → 100755
This diff is collapsed.
Click to expand it.
verl/trainer/config/sft_trainer.yaml
100644 → 100755
File mode changed from 100644 to 100755
verl/trainer/fsdp_sft_trainer.py
100644 → 100755
File mode changed from 100644 to 100755
verl/trainer/main_eval.py
100644 → 100755
File mode changed from 100644 to 100755
verl/trainer/main_generation.py
100644 → 100755
File mode changed from 100644 to 100755
verl/trainer/main_ppo.py
100644 → 100755
This diff is collapsed.
Click to expand it.
verl/trainer/ppo/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/trainer/ppo/core_algos.py
100644 → 100755
File mode changed from 100644 to 100755
verl/trainer/ppo/metric_utils.py
100644 → 100755
File mode changed from 100644 to 100755
verl/trainer/ppo/ray_trainer.py
100644 → 100755
File mode changed from 100644 to 100755
verl/trainer/runtime_env.yaml
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/checkpoint/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/checkpoint/checkpoint_manager.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/checkpoint/fsdp_checkpoint_manager.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/checkpoint/megatron_checkpoint_manager.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/config.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/dataset/README.md
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/dataset/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/dataset/rl_dataset.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/dataset/rm_dataset.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/dataset/sft_dataset.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/debug/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/debug/performance.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/debug/trajectory_tracker.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/distributed.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/flops_counter.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/fs.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/fsdp_utils.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/hdfs_io.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/import_utils.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/logger/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/logger/aggregate_logger.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/logging_utils.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/megatron/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/megatron/memory.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/megatron/optimizer.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/megatron/pipeline_parallel.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/megatron/sequence_parallel.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/megatron/tensor_parallel.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/megatron_utils.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/memory_buffer.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/model.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/py_functional.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/ray_utils.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/rendezvous/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/rendezvous/ray_backend.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/reward_score/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/reward_score/codev.py
100644 → 100755
This diff is collapsed.
Click to expand it.
verl/utils/reward_score/codev_eval_toolkit/eval_codev.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/reward_score/codev_eval_toolkit/verify.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/reward_score/geo3k.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/reward_score/gsm8k.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/reward_score/math.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/reward_score/math_dapo.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/reward_score/math_verify.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/reward_score/prime_code/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/reward_score/prime_code/testing_util.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/reward_score/prime_code/utils.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/reward_score/prime_math/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/reward_score/prime_math/grader.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/reward_score/prime_math/math_normalize.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/seqlen_balancing.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/tokenizer.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/torch_dtypes.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/torch_functional.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/tracking.py
100644 → 100755
File mode changed from 100644 to 100755
verl/utils/ulysses.py
100644 → 100755
File mode changed from 100644 to 100755
verl/version/version
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/actor/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/actor/base.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/actor/dp_actor.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/actor/megatron_actor.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/critic/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/critic/base.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/critic/dp_critic.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/critic/megatron_critic.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/fsdp_workers.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/megatron_workers.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/reward_manager/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/reward_manager/dapo.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/reward_manager/naive.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/reward_manager/prime.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/reward_model/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/reward_model/base.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/reward_model/megatron/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/reward_model/megatron/reward_model.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/rollout/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/rollout/base.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/rollout/hf_rollout.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/rollout/naive/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/rollout/naive/naive_rollout.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/rollout/sglang_rollout/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/rollout/sglang_rollout/sglang_rollout.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/rollout/tokenizer.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/rollout/vllm_rollout/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/rollout/vllm_rollout/fire_vllm_rollout.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/rollout/vllm_rollout/vllm_rollout.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/rollout/vllm_rollout/vllm_rollout_spmd.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/sharding_manager/__init__.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/sharding_manager/base.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/sharding_manager/fsdp_sglang.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/sharding_manager/fsdp_ulysses.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/sharding_manager/fsdp_vllm.py
100644 → 100755
File mode changed from 100644 to 100755
verl/workers/sharding_manager/megatron_vllm.py
100644 → 100755
File mode changed from 100644 to 100755
Please
register
or
sign in
to comment