Skip to content

Commit 770e39d

Browse files
authored
Merge pull request #108 from stackhpc/update/vllm-v0.9.0.1
Update vLLM to v0.9.0.1
2 parents 36c80cf + d932127 commit 770e39d

File tree

5 files changed: +25 -2 lines changed

.gitignore

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -20,3 +20,4 @@ charts/*/charts
20 | 20 | **/*.egg-info/
21 | 21 | **/flagged/
22 | 22 | web-apps/**/overrides.yml
   | 23 | + **/.env

charts/azimuth-chat/values.schema.json

Lines changed: 11 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -128,6 +128,17 @@
128 | 128 | }
129 | 129 | }
130 | 130 | }
    | 131 | + },
    | 132 | + "api": {
    | 133 | + "properties": {
    | 134 | + "image": {
    | 135 | + "properties": {
    | 136 | + "version": {
    | 137 | + "default": "v0.9.0.1"
    | 138 | + }
    | 139 | + }
    | 140 | + }
    | 141 | + }
131 | 142 | }
132 | 143 | }
133 | 144 | }

charts/azimuth-image-analysis/values.schema.json

Lines changed: 11 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -115,6 +115,17 @@
115 | 115 | }
116 | 116 | }
117 | 117 | }
    | 118 | + },
    | 119 | + "api": {
    | 120 | + "properties": {
    | 121 | + "image": {
    | 122 | + "properties": {
    | 123 | + "version": {
    | 124 | + "default": "v0.9.0.1"
    | 125 | + }
    | 126 | + }
    | 127 | + }
    | 128 | + }
118 | 129 | }
119 | 130 | }
120 | 131 | }

charts/azimuth-llm/values.schema.json

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -37,7 +37,7 @@
37 | 37 | "type": "string",
38 | 38 | "title": "Backend vLLM version",
39 | 39 | "description": "The vLLM version to use as a backend. Must be a version tag from [this list](https://github.com/vllm-project/vllm/tags)",
40 |    | - "default": "v0.8.5.post1"
   | 40 | + "default": "v0.9.0.1"
41 | 41 | }
42 | 42 | }
43 | 43 | }

charts/azimuth-llm/values.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -37,7 +37,7 @@ api:
37 | 37 | # ghcr.io/stackhpc/vllm-xpu when api.gpus > 0 and intelXPUsEnabled is true,
38 | 38 | # or ghcr.io/stackhpc/vllm-cpu when api.gpus == 0
39 | 39 | repository:
40 |    | - version: v0.8.5.post1
   | 40 | + version: v0.9.0.1
41 | 41 | monitoring:
42 | 42 | enabled: true
43 | 43 | # The number of replicas for the backend deployment

0 commit comments

Comments
 (0)