Add verl as a submodule and update install instructions

kylemontgomery1 · kylemontgomery1 · commit 62cc8b927952 · 2025-08-20T16:57:17.000-07:00
diff --git a/.gitmodules b/.gitmodules
@@ -0,0 +1,4 @@
+[submodule "verl"]
+	path = verl
+	url = https://github.com/volcengine/verl.git
+	branch = main
diff --git a/Dockerfile b/Dockerfile
@@ -4,9 +4,13 @@ ENV DEBIAN_FRONTEND=noninteractive
 
 WORKDIR /workspace
 
-RUN git clone https://github.com/rllm-org/rllm.git rllm
+RUN pip uninstall verl -y || true
 
-RUN cd rllm && pip install -e .
+RUN git clone --recurse-submodules https://github.com/rllm-org/rllm.git rllm
+
+RUN cd rllm && \
+    pip install --no-deps -e ./verl && \
+    pip install -e .
 
 RUN pip install playwright && \
     playwright install chromium && \
diff --git a/README.md b/README.md
@@ -44,15 +44,16 @@ rLLM is an open-source framework for post-training language agents via reinforce
 
 ```bash
 # Clone the repository
-git clone https://github.com/rllm-org/rllm.git
+git clone --recurse-submodules https://github.com/rllm-org/rllm.git
 cd rllm
 
 # Create a conda environment
 conda create -n rllm python=3.10
 conda activate rllm
 
-# Install verl v0.5.0
-bash scripts/install_verl.sh # (or follow the instructions at https://verl.readthedocs.io/en/v0.5.x/start/install.html)
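+# Install verl from the bundled submodule: run its vllm/sglang/mcore install script, then install verl itself (editable, --no-deps)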
+bash verl/scripts/install_vllm_sglang_mcore.sh
+pip install --no-deps -e ./verl
 
 # Install rllm
 pip install -e .
@@ -77,7 +78,7 @@ docker exec -it rllm-container bash
 
 ## Acknowledgements
 
-- Our training experiments are powered by our heavily modified fork of [verl](https://github.com/volcengine/verl), an open-source RLHF library.
+- Our training experiments are powered by [verl](https://github.com/volcengine/verl), an open-source RLHF library.
 - Our models are trained on top of [`DeepSeek-R1-Distill-Qwen-1.5B`](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B), [`DeepSeek-R1-Distill-Qwen-14B`](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-14B), and [`Qwen3-32B`](https://huggingface.co/Qwen/Qwen3-32b).
 - Our work is done as part of [Berkeley Sky Computing Lab](https://skycomputing.berkeley.edu/), [Berkeley AI Research](https://bair.berkeley.edu/), and a successful collaboration with Together AI.
 
diff --git a/verl b/verl
@@ -0,0 +1 @@
+Subproject commit 8fdc4d3f202f41461f4de9f42a637228e342668b