From c41ea52634d82b552b8f00a889e0d1f5070b7ed4 Mon Sep 17 00:00:00 2001 From: Tyler Michael Smith Date: Wed, 6 Aug 2025 16:40:26 -0700 Subject: [PATCH 1/2] Remove mamba-ssm package Signed-off-by: Tyler Michael Smith --- docker/Dockerfile.cpu | 1 - docs/contributing/ci/update_pytorch_version.md | 13 ------------- requirements/test.in | 3 +-- tests/models/language/generation/test_hybrid.py | 8 ++++---- 4 files changed, 5 insertions(+), 20 deletions(-) diff --git a/docker/Dockerfile.cpu b/docker/Dockerfile.cpu index 1a0981f8ea6d..36dd72c5f3a6 100644 --- a/docker/Dockerfile.cpu +++ b/docker/Dockerfile.cpu @@ -113,7 +113,6 @@ WORKDIR /workspace/vllm RUN --mount=type=bind,src=requirements/test.in,target=requirements/test.in \ cp requirements/test.in requirements/cpu-test.in && \ - sed -i '/mamba_ssm/d' requirements/cpu-test.in && \ sed -i 's/^torch==.*/torch==2.6.0/g' requirements/cpu-test.in && \ sed -i 's/torchaudio.*/torchaudio/g' requirements/cpu-test.in && \ sed -i 's/torchvision.*/torchvision/g' requirements/cpu-test.in && \ diff --git a/docs/contributing/ci/update_pytorch_version.md b/docs/contributing/ci/update_pytorch_version.md index 3a6026d450a6..7ef22d6f8c3f 100644 --- a/docs/contributing/ci/update_pytorch_version.md +++ b/docs/contributing/ci/update_pytorch_version.md @@ -131,19 +131,6 @@ MAX_JOBS=16 uv pip install --system \ --no-build-isolation "git+https://github.com/facebookresearch/xformers@v0.0.30" ``` -### Mamba - -```bash -uv pip install --system \ - --no-build-isolation "git+https://github.com/state-spaces/mamba@v2.2.5" -``` - -### causal-conv1d - -```bash -uv pip install 'git+https://github.com/Dao-AILab/causal-conv1d@v1.5.0.post8' -``` - ## Update all the different vLLM platforms Rather than attempting to update all vLLM platforms in a single pull request, it's more manageable diff --git a/requirements/test.in b/requirements/test.in index 9c8c75dd6f70..ddedefa2e68c 100644 --- a/requirements/test.in +++ b/requirements/test.in @@ -26,7 +26,6 @@ torch==2.7.1 torchaudio==2.7.1 torchvision==0.22.1 transformers_stream_generator # required for qwen-vl test -mamba_ssm==2.2.5 # required for plamo2 test matplotlib # required for qwen-vl test mistral_common[image,audio] >= 1.8.2 # required for voxtral test num2words # required for smolvlm test @@ -54,4 +53,4 @@ runai-model-streamer==0.11.0 runai-model-streamer-s3==0.11.0 fastsafetensors>=0.1.10 pydantic>=2.10 # 2.9 leads to error on python 3.10 -terratorch==1.1rc2 # required for PrithviMAE test \ No newline at end of file +terratorch==1.1rc2 # required for PrithviMAE test diff --git a/tests/models/language/generation/test_hybrid.py b/tests/models/language/generation/test_hybrid.py index 2238924c1b50..78d23c609fbe 100644 --- a/tests/models/language/generation/test_hybrid.py +++ b/tests/models/language/generation/test_hybrid.py @@ -25,10 +25,6 @@ HYBRID_MODELS = [ "ai21labs/Jamba-tiny-dev", - # NOTE: Running Plamo2 in transformers implementation requires to install - # causal-conv1d package, which is not listed as a test dependency as it's - # not compatible with pip-compile. - "pfnet/plamo-2-1b", "Zyphra/Zamba2-1.2B-instruct", "hmellor/tiny-random-BambaForCausalLM", "ibm-ai-platform/Bamba-9B-v1", @@ -50,6 +46,10 @@ # https://github.com/huggingface/transformers/pull/39033 # We will enable vLLM test for Granite after next HF transformers release. "ibm-granite/granite-4.0-tiny-preview", + # NOTE: Plamo2 requires both mamba_ssm and causal-conv1d libraries + # (see https://huggingface.co/pfnet/plamo-2-1b/blob/main/modeling_plamo.py), + # Don't compare it to HF, to avoid managing the dependency. + "pfnet/plamo-2-1b", ] V1_SUPPORTED_MODELS = [ From ddb65dad96c39c82e4a0c25ea215831e1e2c76bb Mon Sep 17 00:00:00 2001 From: Tyler Michael Smith Date: Wed, 6 Aug 2025 23:53:32 +0000 Subject: [PATCH 2/2] fix Signed-off-by: Tyler Michael Smith --- requirements/test.txt | 13 +------------ tests/models/language/generation/test_hybrid.py | 1 + 2 files changed, 2 insertions(+), 12 deletions(-) diff --git a/requirements/test.txt b/requirements/test.txt index 08ba964f22a4..93f00da1f101 100644 --- a/requirements/test.txt +++ b/requirements/test.txt @@ -178,7 +178,6 @@ einops==0.8.1 # via # -r requirements/test.in # encodec - # mamba-ssm # terratorch # torchgeo # vector-quantize-pytorch @@ -418,8 +417,6 @@ lxml==5.3.0 # sacrebleu mako==1.3.10 # via alembic -mamba-ssm==2.2.5 - # via -r requirements/test.in markdown==3.8.2 # via mlflow markdown-it-py==3.0.0 @@ -476,8 +473,6 @@ networkx==3.2.1 # via # scikit-image # torch -ninja==1.11.1.3 - # via mamba-ssm nltk==3.9.1 # via rouge-score num2words==0.5.14 @@ -630,7 +625,6 @@ packaging==24.2 # lazy-loader # lightning # lightning-utilities - # mamba-ssm # matplotlib # mlflow-skinny # peft @@ -974,7 +968,6 @@ sentencepiece==0.2.0 setuptools==77.0.3 # via # lightning-utilities - # mamba-ssm # pytablewriter # torch # triton @@ -1086,7 +1079,6 @@ torch==2.7.1+cu128 # lightly # lightning # lm-eval - # mamba-ssm # mteb # open-clip-torch # peft @@ -1153,16 +1145,13 @@ transformers==4.55.0 # -r requirements/test.in # genai-perf # lm-eval - # mamba-ssm # peft # sentence-transformers # transformers-stream-generator transformers-stream-generator==0.0.5 # via -r requirements/test.in triton==3.3.1 - # via - # mamba-ssm - # torch + # via torch tritonclient==2.51.0 # via # -r requirements/test.in diff --git a/tests/models/language/generation/test_hybrid.py b/tests/models/language/generation/test_hybrid.py index 78d23c609fbe..584a3640eb92 100644 --- a/tests/models/language/generation/test_hybrid.py +++ b/tests/models/language/generation/test_hybrid.py @@ -25,6 +25,7 @@ HYBRID_MODELS = [ "ai21labs/Jamba-tiny-dev", + "pfnet/plamo-2-1b", "Zyphra/Zamba2-1.2B-instruct", "hmellor/tiny-random-BambaForCausalLM", "ibm-ai-platform/Bamba-9B-v1",