distro: bump version to 0.2.0.post2. restrict vllm to v0.6.3 instead of v0.6.3.post1 (#320)

distro: bump up version to v0.2.0.post1
example: fix remove padding flags for gemma example. update v0.2 install docs (#290)
2025-10-20 13:43:50 +08:00 · 2025-02-20 11:03:11 +08:00 · 2025-02-16 22:42:30 +08:00 · 2025-02-16 21:52:31 +08:00
18 changed files with 34 additions and 13 deletions
--- a/.github/workflows/dataset.yml
+++ b/.github/workflows/dataset.yml
@@ -6,12 +6,14 @@ on:
  push:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/dataset.yml
  pull_request:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/dataset.yml
@@ -35,4 +37,4 @@ jobs:
      - name: Running ray test using cupy (move it to L20 when dockerfile ready)
        run: |
          cd tests/ray
-          pytest -s -x test_rvdz.py
+          pytest -s -x test_rvdz.py
--- a/.github/workflows/e2e_digit_completion.yml
+++ b/.github/workflows/e2e_digit_completion.yml
@@ -6,12 +6,14 @@ on:
  push:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/e2e_digit_completion.yml
  pull_request:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/e2e_digit_completion.yml
--- a/.github/workflows/e2e_gsm8k.yml
+++ b/.github/workflows/e2e_gsm8k.yml
@@ -6,12 +6,14 @@ on:
  push:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/e2e_gsm8k.yml
  pull_request:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/e2e_gsm8k.yml
--- a/.github/workflows/e2e_gsm8k_megatron.yml
+++ b/.github/workflows/e2e_gsm8k_megatron.yml
@@ -6,12 +6,14 @@ on:
  push:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/e2e_gsm8k_megatron.yml
  pull_request:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/e2e_gsm8k_megatron.yml
--- a/.github/workflows/e2e_lora.yml
+++ b/.github/workflows/e2e_lora.yml
@@ -6,12 +6,14 @@ on:
  push:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/e2e_lora.yml
  pull_request:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/e2e_lora.yml
--- a/.github/workflows/e2e_sft.yml
+++ b/.github/workflows/e2e_sft.yml
@@ -6,12 +6,14 @@ on:
  push:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/e2e_sft.yml
  pull_request:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/e2e_sft.yml
--- a/.github/workflows/model.yml
+++ b/.github/workflows/model.yml
@@ -6,12 +6,14 @@ on:
  push:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/model.yml
  pull_request:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/model.yml
--- a/.github/workflows/ray_test.yml
+++ b/.github/workflows/ray_test.yml
@@ -6,12 +6,14 @@ on:
  push:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/ray_test.yml
  pull_request:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/ray_test.yml
--- a/.github/workflows/sandbox.yml
+++ b/.github/workflows/sandbox.yml
@@ -6,12 +6,14 @@ on:
  push:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/sandbox.yml
  pull_request:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/sandbox.yml
--- a/.github/workflows/sanity.yml
+++ b/.github/workflows/sanity.yml
@@ -6,12 +6,14 @@ on:
  push:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/sanity.yml
  pull_request:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/sanity.yml
--- a/.github/workflows/vllm.yml
+++ b/.github/workflows/vllm.yml
@@ -6,12 +6,14 @@ on:
  push:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/vllm.yml
  pull_request:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/vllm.yml
--- a/.github/workflows/yapf_format.yml
+++ b/.github/workflows/yapf_format.yml
@@ -6,12 +6,14 @@ on:
  push:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/yapf_format.yml
  pull_request:
    branches:
      - main
+      - v0.2.x
    paths:
      - "**/*.py"
      - .github/workflows/yapf_format.yml
--- a/docs/start/install.rst
+++ b/docs/start/install.rst
@@ -38,9 +38,8 @@ Image and tag: ``verlai/verl:vemlp-th2.4.0-cu124-vllm0.6.3-ray2.10-te1.7-v0.0.3`

 .. code:: bash

-    # install the nightly version (recommended)
-    git clone https://github.com/volcengine/verl && cd verl && pip3 install -e .
-    # or install from pypi via `pip3 install verl`
+    # install the stable version
+    pip3 install verl


 3. Setup Megatron (optional)
@@ -83,9 +82,7 @@ own post-training jobs.
   # install verl together with some lightweight dependencies in setup.py
   pip3 install torch==2.4.0 --index-url https://download.pytorch.org/whl/cu124
   pip3 install flash-attn --no-build-isolation
-   git clone https://github.com/volcengine/verl.git
-   cd verl
-   pip3 install -e .
+   pip3 install verl


 Megatron is optional. It's dependencies can be setup as below:
--- a/examples/ppo_trainer/run_gemma.sh
+++ b/examples/ppo_trainer/run_gemma.sh
@@ -9,7 +9,7 @@ python3 -m verl.trainer.main_ppo \
    data.max_response_length=512 \
    actor_rollout_ref.model.path=google/gemma-2-2b-it \
    actor_rollout_ref.actor.optim.lr=1e-6 \
-    actor_rollout_ref.model.use_remove_padding=True \
+    actor_rollout_ref.model.use_remove_padding=False \
    actor_rollout_ref.actor.ppo_mini_batch_size=128 \
    actor_rollout_ref.actor.ppo_micro_batch_size_per_gpu=4 \
    actor_rollout_ref.actor.fsdp_config.param_offload=False \
@@ -22,7 +22,7 @@ python3 -m verl.trainer.main_ppo \
    actor_rollout_ref.ref.log_prob_micro_batch_size_per_gpu=4 \
    actor_rollout_ref.ref.fsdp_config.param_offload=True \
    critic.optim.lr=1e-5 \
-    critic.model.use_remove_padding=True \
+    critic.model.use_remove_padding=False \
    critic.model.path=google/gemma-2-2b-it \
    critic.model.enable_gradient_checkpointing=False \
    critic.ppo_micro_batch_size_per_gpu=4 \
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -44,7 +44,7 @@ dependencies = [
    "ray>=2.10",
    "tensordict<0.6",
    "transformers",
-    "vllm<=0.6.3.post1",
+    "vllm<=0.6.3",
    'wandb',
 ]

--- a/requirements.txt
+++ b/requirements.txt
@@ -15,5 +15,5 @@ pylatexenc
 ray
 tensordict<0.6
 transformers
-vllm==0.6.3.post1
+vllm<=0.6.3
 wandb
--- a/setup.py
+++ b/setup.py
@@ -36,7 +36,7 @@ install_requires = [
  'ray>=2.10',
  'tensordict<0.6',
  'transformers',
-  'vllm<=0.6.3.post1',
+  'vllm<=0.6.3',
  'wandb',
 ]

--- a/verl/version/version
+++ b/verl/version/version
@ -1 +1 @@
-0.2
+0.2.0.post2
Author	SHA1	Message	Date
HL	fb532783ad	distro: bump version to 0.2.0.post2. restrict vllm to v0.6.3 instead of v0.6.3.post1 (#320)	2025-02-20 11:03:11 +08:00
HL	96f49818b8	distro: bump up version to v0.2.0.post1	2025-02-16 22:42:30 +08:00
HL	550938745f	example: fix remove padding flags for gemma example. update v0.2 install docs (#290)	2025-02-16 21:52:31 +08:00