Skip to content

Commit dc82925

Browse files
committed
Updates artifacts for v1.0.0-rc.1 release
Signed-off-by: Kellen Swain <[email protected]>
1 parent 7c84b2f commit dc82925

File tree

11 files changed

+24
-24
lines changed

11 files changed

+24
-24
lines changed

config/charts/body-based-routing/values.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -3,8 +3,8 @@ bbr:
33
replicas: 1
44
image:
55
name: bbr
6-
hub: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension
7-
tag: main
6+
hub: registry.k8s.io/gateway-api-inference-extension
7+
tag: v1.0.0-rc.1
88
pullPolicy: Always
99
port: 9004
1010
healthCheckPort: 9005

config/charts/inferencepool/values.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -2,8 +2,8 @@ inferenceExtension:
22
replicas: 1
33
image:
44
name: epp
5-
hub: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension
6-
tag: main
5+
hub: registry.k8s.io/gateway-api-inference-extension
6+
tag: v1.0.0-rc.1
77
pullPolicy: Always
88
extProcPort: 9002
99
env: []

config/crd/bases/inference.networking.k8s.io_inferencepools.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,7 @@ kind: CustomResourceDefinition
33
metadata:
44
annotations:
55
api-approved.kubernetes.io: https://github.com/kubernetes-sigs/gateway-api-inference-extension/pull/1173
6-
inference.networking.k8s.io/bundle-version: main-dev
6+
inference.networking.k8s.io/bundle-version: v1.0.0-rc.1
77
creationTimestamp: null
88
name: inferencepools.inference.networking.k8s.io
99
spec:

config/crd/bases/inference.networking.x-k8s.io_inferenceobjectives.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@ apiVersion: apiextensions.k8s.io/v1
22
kind: CustomResourceDefinition
33
metadata:
44
annotations:
5-
inference.networking.k8s.io/bundle-version: main-dev
5+
inference.networking.k8s.io/bundle-version: v1.0.0-rc.1
66
creationTimestamp: null
77
name: inferenceobjectives.inference.networking.x-k8s.io
88
spec:

config/crd/bases/inference.networking.x-k8s.io_inferencepools.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,7 @@ kind: CustomResourceDefinition
33
metadata:
44
annotations:
55
api-approved.kubernetes.io: unapproved, experimental-only
6-
inference.networking.k8s.io/bundle-version: main-dev
6+
inference.networking.k8s.io/bundle-version: v1.0.0-rc.1
77
creationTimestamp: null
88
name: inferencepools.inference.networking.x-k8s.io
99
spec:

config/manifests/inferencepool-resources.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -59,8 +59,8 @@ spec:
5959
terminationGracePeriodSeconds: 130
6060
containers:
6161
- name: epp
62-
image: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/epp:main
63-
imagePullPolicy: Always
62+
image: registry.k8s.io/gateway-api-inference-extension/epp:v1.0.0-rc.1
63+
imagePullPolicy: IfNotPresent
6464
args:
6565
- --pool-name
6666
- "vllm-llama3-8b-instruct"

config/manifests/vllm/cpu-deployment.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -14,8 +14,8 @@ spec:
1414
spec:
1515
containers:
1616
- name: lora
17-
image: "public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:latest" # formal images can be found in https://gallery.ecr.aws/q9t5s3a7/vllm-cpu-release-repo
18-
imagePullPolicy: Always
17+
image: "public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1" # formal images can be found in https://gallery.ecr.aws/q9t5s3a7/vllm-cpu-release-repo
18+
imagePullPolicy: IfNotPresent
1919
command: ["python3", "-m", "vllm.entrypoints.openai.api_server"]
2020
args:
2121
- "--model"
@@ -77,8 +77,8 @@ spec:
7777
- name: lora-adapter-syncer
7878
tty: true
7979
stdin: true
80-
image: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/lora-syncer:main
81-
restartPolicy: Always
80+
image: registry.k8s.io/gateway-api-inference-extension/lora-syncer:v1.0.0-rc.1
81+
restartPolicy: Always  # IfNotPresent is an imagePullPolicy value, not a valid restartPolicy; keep the pre-release value
8282
imagePullPolicy: Always
8383
env:
8484
- name: DYNAMIC_LORA_ROLLOUT_CONFIG

config/manifests/vllm/gpu-deployment.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -14,8 +14,8 @@ spec:
1414
spec:
1515
containers:
1616
- name: vllm
17-
image: "vllm/vllm-openai:latest"
18-
imagePullPolicy: Always
17+
image: "vllm/vllm-openai:v0.10.1.1"
18+
imagePullPolicy: IfNotPresent
1919
command: ["python3", "-m", "vllm.entrypoints.openai.api_server"]
2020
args:
2121
- "--model"
@@ -155,8 +155,8 @@ spec:
155155
- name: lora-adapter-syncer
156156
tty: true
157157
stdin: true
158-
image: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/lora-syncer:main
159-
restartPolicy: Always
158+
image: registry.k8s.io/gateway-api-inference-extension/lora-syncer:v1.0.0-rc.1
159+
restartPolicy: Always  # IfNotPresent is an imagePullPolicy value, not a valid restartPolicy; keep the pre-release value
160160
imagePullPolicy: Always
161161
env:
162162
- name: DYNAMIC_LORA_ROLLOUT_CONFIG

config/manifests/vllm/sim-deployment.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -14,8 +14,8 @@ spec:
1414
spec:
1515
containers:
1616
- name: vllm-sim
17-
image: ghcr.io/llm-d/llm-d-inference-sim:v0.3.0
18-
imagePullPolicy: Always
17+
image: ghcr.io/llm-d/llm-d-inference-sim:v0.4.0
18+
imagePullPolicy: IfNotPresent
1919
args:
2020
- --model
2121
- meta-llama/Llama-3.1-8B-Instruct

conformance/resources/base.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -198,8 +198,8 @@ spec:
198198
terminationGracePeriodSeconds: 130
199199
containers:
200200
- name: epp
201-
image: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/epp:main
202-
imagePullPolicy: Always
201+
image: registry.k8s.io/gateway-api-inference-extension/epp:v1.0.0-rc.1
202+
imagePullPolicy: IfNotPresent
203203
args:
204204
- --pool-name
205205
- "primary-inference-pool"
@@ -294,8 +294,8 @@ spec:
294294
terminationGracePeriodSeconds: 130
295295
containers:
296296
- name: epp
297-
image: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/epp:main
298-
imagePullPolicy: Always
297+
image: registry.k8s.io/gateway-api-inference-extension/epp:v1.0.0-rc.1
298+
imagePullPolicy: IfNotPresent
299299
args:
300300
- --pool-name
301301
- "secondary-inference-pool"

0 commit comments

Comments
 (0)