Skip to content

Commit cdb6a20

Browse files
update dependencies
1 parent 3b598c9 commit cdb6a20

File tree

4 files changed

+97
-26
lines changed

4 files changed

+97
-26
lines changed

.gitignore

Lines changed: 10 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -24,6 +24,7 @@ share/python-wheels/
2424
*.egg-info/
2525
.installed.cfg
2626
*.egg
27+
*.whl
2728
MANIFEST
2829

2930
# PyInstaller
@@ -173,28 +174,22 @@ cython_debug/
173174
# DS_Store
174175
.DS_Store
175176

177+
# Ignore parquet files.
178+
data/*
179+
176180
# Ignore verl script outputs.
177181
**/outputs/
178182
**/wandb/
179183
**/checkpoints/
180-
181-
# Ignore parquet files.
182-
data/*
183-
184-
rllm/data/preprocess/*.json
185-
rllm/data/preprocess/code/*.json
186-
rllm/data/preprocess/math/*.json
187184
tmp/
188185

189186
# Ignore debug logs and run result logs
190187
logs/
188+
rllm/*.json
191189

192190
# Ignore the big datasets
193-
rllm/data/test/code/taco.json
194-
rllm/data/train/code/taco.json
195-
rllm/data/train/math/olympiad.json
196-
rllm/data/test/code/livecodebench.json
197-
rllm/data/train/code/livecodebench.json
198-
rllm/data/train/code/kodcode.json
199-
rllm/data/train/code/primeintellect.json
200-
rllm/data/train/code/primeintellect_dedupe.json
191+
rllm/data/test/
192+
rllm/data/train/
193+
194+
rllm/data/datasets/
195+
rllm/registry/

README.md

Lines changed: 9 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -44,15 +44,21 @@ rLLM is an open-source framework for post-training language agents via reinforce
4444

4545
```bash
4646
# Clone the repository
47+
<<<<<<< HEAD
4748
git clone --recurse-submodules https://github.com/rllm-org/rllm.git
49+
=======
50+
git clone https://github.com/rllm-org/rllm.git
51+
>>>>>>> private/v0.2-verl-stable
4852
cd rllm
4953

50-
# create a conda environment
54+
# Create a conda environment
5155
conda create -n rllm python=3.10
5256
conda activate rllm
5357

54-
# Install all dependencies
55-
pip install -e ./verl
58+
# Install verl v0.5.0
59+
bash scripts/install_verl.sh # (or follow the instructions at https://verl.readthedocs.io/en/v0.5.x/start/install.html)
60+
61+
# Install rllm
5662
pip install -e .
5763

5864
**Note:** On macOS, GPU features (flash-attn, deepspeed, vllm) are automatically excluded for compatibility. For GPU support on macOS, you can install with: `pip install -e .[gpu]`

pyproject.toml

Lines changed: 41 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -19,16 +19,30 @@ classifiers = [
1919
license = {file = "LICENSE"}
2020
dependencies = [
2121
# Core ML/AI packages
22+
<<<<<<< HEAD
2223
"torch>=2.7",
2324
"transformers",
2425
"openai",
26+
=======
27+
"torch>=2.6",
28+
"transformers>=4.5",
29+
"sentence-transformers",
30+
>>>>>>> private/v0.2-verl-stable
2531

2632
# Data processing
2733
"datasets",
34+
"pandas",
2835
"polars",
29-
"dm-tree",
36+
"pillow",
3037

3138
# Cloud and infrastructure
39+
<<<<<<< HEAD
40+
=======
41+
"google-cloud-aiplatform",
42+
"vertexai",
43+
"docker",
44+
"kubernetes",
45+
>>>>>>> private/v0.2-verl-stable
3246
"ray",
3347

3448
# Web and automation
@@ -38,26 +52,45 @@ dependencies = [
3852
"firecrawl",
3953

4054
# Math and science
41-
"latex2sympy2",
55+
"numpy",
56+
"sympy",
4257
"pylatexenc",
58+
<<<<<<< HEAD
4359
"nltk",
4460
"sympy",
4561
"scipy",
62+
=======
63+
"antlr4-python3-runtime==4.9.3",
64+
>>>>>>> private/v0.2-verl-stable
4665

4766
# Code evaluation
4867
"swebench",
4968
"e2b_code_interpreter",
5069

70+
# Tools
71+
"mcp",
72+
"camel-ai",
73+
74+
# DB
75+
"supabase",
76+
5177
# Utilities
78+
"hydra-core",
79+
"openai",
5280
"fire",
5381
"gdown",
54-
"tabulate",
55-
"sortedcontainers",
56-
"PyMuPDF",
57-
"together",
82+
"together>=1.4",
5883
"wandb",
59-
"pybind11",
60-
"gym",
84+
"gymnasium",
85+
"click",
86+
"fastapi",
87+
"uvicorn",
88+
"httpx",
89+
"jupyter",
90+
"tqdm",
91+
"rich",
92+
"PyYAML",
93+
"pydantic",
6194

6295
# Development and testing
6396
"pytest",

scripts/install_verl.sh

Lines changed: 37 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,37 @@
1+
#!/bin/bash
2+
# Adapted from https://github.com/volcengine/verl/blob/v0.5.0/scripts/install_vllm_sglang_mcore.sh
3+
4+
echo "1. install inference frameworks and pytorch they need"
5+
pip install "sglang[all]==0.4.6.post1" --no-cache-dir --find-links https://flashinfer.ai/whl/cu124/torch2.6/flashinfer-python && pip install torch-memory-saver --no-cache-dir
6+
pip install --no-cache-dir "vllm==0.8.5.post1" "torch==2.6.0" "torchvision==0.21.0" "torchaudio==2.6.0" "tensordict==0.6.2" torchdata
7+
8+
9+
echo "2. install basic packages"
10+
pip install "transformers[hf_xet]>=4.51.0" accelerate datasets peft hf-transfer \
11+
"numpy<2.0.0" "pyarrow>=15.0.0" pandas \
12+
ray[default] codetiming hydra-core pylatexenc qwen-vl-utils wandb dill pybind11 liger-kernel mathruler \
13+
pytest py-spy pyext pre-commit ruff tensorboard
14+
15+
pip install "nvidia-ml-py>=12.560.30" "fastapi[standard]>=0.115.0" "optree>=0.13.0" "pydantic>=2.9" "grpcio>=1.62.1"
16+
17+
18+
echo "3. install FlashAttention and FlashInfer"
19+
# Install flash-attn-2.7.4.post1 (cxx11abi=False)
20+
wget -nv https://github.com/Dao-AILab/flash-attention/releases/download/v2.7.4.post1/flash_attn-2.7.4.post1+cu12torch2.6cxx11abiFALSE-cp310-cp310-linux_x86_64.whl && \
21+
pip install --no-cache-dir flash_attn-2.7.4.post1+cu12torch2.6cxx11abiFALSE-cp310-cp310-linux_x86_64.whl
22+
23+
# Install flashinfer-0.2.2.post1+cu124 (cxx11abi=False)
24+
# vllm-0.8.3 does not support flashinfer>=0.2.3
25+
# see https://github.com/vllm-project/vllm/pull/15777
26+
wget -nv https://github.com/flashinfer-ai/flashinfer/releases/download/v0.2.2.post1/flashinfer_python-0.2.2.post1+cu124torch2.6-cp38-abi3-linux_x86_64.whl && \
27+
pip install --no-cache-dir flashinfer_python-0.2.2.post1+cu124torch2.6-cp38-abi3-linux_x86_64.whl
28+
29+
30+
echo "4. May need to fix opencv"
31+
pip install opencv-python
32+
pip install opencv-fixer && \
33+
python -c "from opencv_fixer import AutoFix; AutoFix()"
34+
35+
36+
echo "5. Install verl"
37+
pip install --no-deps --no-cache-dir git+https://github.com/volcengine/verl.git@v0.5.0

0 commit comments

Comments
 (0)