
[CI/Build] Update causal-conv1d and lm-eval #22141

Status: Closed · wants to merge 2 commits
6 changes: 0 additions & 6 deletions .buildkite/test-pipeline.yaml
@@ -535,8 +535,6 @@ steps:
- vllm/
- tests/models/language
commands:
# Install causal-conv1d for plamo2 models here, as it is not compatible with pip-compile.
- pip install 'git+https://github.com/Dao-AILab/causal-conv1d@v1.5.0.post8'
- pip freeze | grep -E 'torch'
- pytest -v -s models/language -m core_model

@@ -547,8 +545,6 @@ steps:
- vllm/
- tests/models/language/generation
commands:
# Install causal-conv1d for plamo2 models here, as it is not compatible with pip-compile.
- pip install 'git+https://github.com/Dao-AILab/causal-conv1d@v1.5.0.post8'
- pytest -v -s models/language/generation -m hybrid_model

- label: Language Models Test (Extended Generation) # 1hr20min
@@ -558,8 +554,6 @@ steps:
- vllm/
- tests/models/language/generation
commands:
# Install causal-conv1d for plamo2 models here, as it is not compatible with pip-compile.
- pip install 'git+https://github.com/Dao-AILab/causal-conv1d@v1.5.0.post8'
- pytest -v -s models/language/generation -m '(not core_model) and (not hybrid_model)'

- label: Language Models Test (Extended Pooling) # 36min
1 change: 1 addition & 0 deletions docker/Dockerfile.cpu
@@ -113,6 +113,7 @@ WORKDIR /workspace/vllm

RUN --mount=type=bind,src=requirements/test.in,target=requirements/test.in \
cp requirements/test.in requirements/cpu-test.in && \
+ sed -i '/causal_conv1d/d' requirements/cpu-test.in && \
sed -i '/mamba_ssm/d' requirements/cpu-test.in && \
sed -i 's/^torch==.*/torch==2.6.0/g' requirements/cpu-test.in && \
sed -i 's/torchaudio.*/torchaudio/g' requirements/cpu-test.in && \
2 changes: 1 addition & 1 deletion docker/Dockerfile.rocm
@@ -71,7 +71,7 @@ COPY --from=build_vllm ${COMMON_WORKDIR}/vllm /vllm-workspace
RUN cd /vllm-workspace \
&& rm -rf vllm \
&& python3 -m pip install -e tests/vllm_test_utils \
- && python3 -m pip install lm-eval[api]==0.4.4 \
+ && python3 -m pip install git+https://github.com/EleutherAI/lm-evaluation-harness.git@bc811365ef3917a15da6aac9b7feafb4ba0fb42f#egg=lm-eval[api] \
Review comment (Contributor, severity: high):
Pinning a dependency to a specific commit hash can introduce maintenance and security risks. It makes the build less reproducible if the commit history is changed (e.g., force-push) and bypasses the security vetting of official releases. If this specific commit is necessary to unblock a temporary issue, please add a comment explaining the reason for this pin and which issue/PR it relates to. This will help with future maintenance and make it clear when this can be reverted to a stable, versioned release.
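As an illustration of the annotation the comment asks for, a minimal sketch; the tracking-issue reference and the target release number are placeholders, not details taken from this PR:

```bash
# Sketch only: pin lm-eval to a specific lm-evaluation-harness commit and
# record why the pin exists and when it can be dropped.
# TODO(<tracking issue>): revert to a tagged release (e.g. lm-eval[api]==0.4.x)
# once the required change ships in a PyPI release.
python3 -m pip install \
    "git+https://github.com/EleutherAI/lm-evaluation-harness.git@bc811365ef3917a15da6aac9b7feafb4ba0fb42f#egg=lm-eval[api]"
```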

&& python3 -m pip install pytest-shard

# -----------------------
2 changes: 1 addition & 1 deletion docs/contributing/ci/update_pytorch_version.md
@@ -141,7 +141,7 @@ uv pip install --system \
### causal-conv1d

```bash
- uv pip install 'git+https://github.com/Dao-AILab/causal-conv1d@v1.5.0.post8'
+ uv pip install 'git+https://github.com/Dao-AILab/causal-conv1d@v1.5.2'
```

## Update all the different vLLM platforms
3 changes: 2 additions & 1 deletion requirements/test.in
@@ -26,14 +26,15 @@ torch==2.7.1
torchaudio==2.7.1
torchvision==0.22.1
transformers_stream_generator # required for qwen-vl test
+ causal_conv1d==1.5.2 # required for plamo2 test
mamba_ssm==2.2.5 # required for plamo2 test
matplotlib # required for qwen-vl test
mistral_common[image,audio] >= 1.8.2 # required for voxtral test
num2words # required for smolvlm test
open_clip_torch==2.32.0 # Required for nemotron_vl test
opencv-python-headless >= 4.11.0 # required for video test
datamodel_code_generator # required for minicpm3 test
- lm-eval[api]==0.4.8 # required for model evaluation test
+ lm-eval[api] @ git+https://github.com/EleutherAI/lm-evaluation-harness.git@bc811365ef3917a15da6aac9b7feafb4ba0fb42f # required for model evaluation test
Review comment (Contributor, severity: high):
Pinning a dependency to a specific commit hash, as done here for lm-eval, can be risky for long-term maintenance and security. It makes it difficult to track updates and can lead to build instability if the commit is ever removed or the repository history is altered. It's generally better to use a versioned release. If this pin is a temporary measure to resolve a specific compatibility issue, it would be very helpful to add a comment here explaining the context, linking to the relevant issue or PR, and outlining the conditions under which this can be updated to a released version.
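For local verification, a hedged sketch of how the resolved pins could be checked once the lock file is regenerated; the commands are illustrative and not part of this PR:

```bash
# Illustrative only: install the compiled test requirements, then confirm which
# lm-eval revision and causal-conv1d version were actually resolved.
uv pip install -r requirements/test.txt
uv pip freeze | grep -E 'lm[_-]eval|causal[_-]conv1d'
```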

mteb[bm25s]>=1.38.11, <2 # required for mteb test
transformers==4.53.2
tokenizers==0.21.1
10 changes: 8 additions & 2 deletions requirements/test.txt
@@ -85,6 +85,8 @@ cachetools==5.5.2
# via
# google-auth
# mlflow-skinny
+ causal-conv1d==1.5.2
+ # via -r requirements/test.in
certifi==2024.8.30
# via
# fiona
@@ -410,7 +412,7 @@ lightning-utilities==0.14.3
# torchmetrics
llvmlite==0.44.0
# via numba
- lm-eval==0.4.8
+ lm-eval @ git+https://github.com/EleutherAI/lm-evaluation-harness.git@bc811365ef3917a15da6aac9b7feafb4ba0fb42f
# via -r requirements/test.in
lxml==5.3.0
# via
@@ -477,7 +479,9 @@ networkx==3.2.1
# scikit-image
# torch
ninja==1.11.1.3
- # via mamba-ssm
+ # via
+ # causal-conv1d
+ # mamba-ssm
nltk==3.9.1
# via rouge-score
num2words==0.5.14
@@ -618,6 +622,7 @@ packaging==24.2
# via
# accelerate
# black
+ # causal-conv1d
# datamodel-code-generator
# datasets
# evaluate
@@ -1079,6 +1084,7 @@ torch==2.7.1+cu128
# -r requirements/test.in
# accelerate
# bitsandbytes
+ # causal-conv1d
# efficientnet-pytorch
# encodec
# fastsafetensors
3 changes: 0 additions & 3 deletions tests/models/language/generation/test_hybrid.py
@@ -25,9 +25,6 @@

HYBRID_MODELS = [
"ai21labs/Jamba-tiny-dev",
- # NOTE: Running Plamo2 in transformers implementation requires to install
- # causal-conv1d package, which is not listed as a test dependency as it's
- # not compatible with pip-compile.
"pfnet/plamo-2-1b",
"Zyphra/Zamba2-1.2B-instruct",
"hmellor/tiny-random-BambaForCausalLM",