Skip to content

Commit 77c5acb

Browse files
authored
Revert "feat(nvidia-gpu): bump images to cuda 12.8" (#6303)
Revert "feat(nvidia-gpu): bump images to cuda 12.8 (#6239)"

This reverts commit d9e25af.
1 parent 44bbf4d commit 77c5acb

File tree

6 files changed: 25 additions (+25) and 25 deletions (-25)

6 files changed: 25 additions (+25) and 25 deletions (-25)

.github/workflows/backend.yml

Lines changed: 19 additions & 19 deletions
Original file line number | Diff line number | Diff line change
@@ -89,7 +89,7 @@ jobs:
8989
context: "./backend"
9090
- build-type: 'l4t'
9191
cuda-major-version: "12"
92-
cuda-minor-version: "8"
92+
cuda-minor-version: "0"
9393
platforms: 'linux/arm64'
9494
tag-latest: 'auto'
9595
tag-suffix: '-gpu-nvidia-l4t-diffusers'
@@ -187,7 +187,7 @@ jobs:
187187
# CUDA 12 builds
188188
- build-type: 'cublas'
189189
cuda-major-version: "12"
190-
cuda-minor-version: "8"
190+
cuda-minor-version: "0"
191191
platforms: 'linux/amd64'
192192
tag-latest: 'auto'
193193
tag-suffix: '-gpu-nvidia-cuda-12-rerankers'
@@ -199,7 +199,7 @@ jobs:
199199
context: "./backend"
200200
- build-type: 'cublas'
201201
cuda-major-version: "12"
202-
cuda-minor-version: "8"
202+
cuda-minor-version: "0"
203203
platforms: 'linux/amd64'
204204
tag-latest: 'auto'
205205
tag-suffix: '-gpu-nvidia-cuda-12-llama-cpp'
@@ -211,7 +211,7 @@ jobs:
211211
context: "./"
212212
- build-type: 'cublas'
213213
cuda-major-version: "12"
214-
cuda-minor-version: "8"
214+
cuda-minor-version: "0"
215215
platforms: 'linux/amd64'
216216
tag-latest: 'auto'
217217
tag-suffix: '-gpu-nvidia-cuda-12-vllm'
@@ -223,7 +223,7 @@ jobs:
223223
context: "./backend"
224224
- build-type: 'cublas'
225225
cuda-major-version: "12"
226-
cuda-minor-version: "8"
226+
cuda-minor-version: "0"
227227
platforms: 'linux/amd64'
228228
tag-latest: 'auto'
229229
tag-suffix: '-gpu-nvidia-cuda-12-transformers'
@@ -235,7 +235,7 @@ jobs:
235235
context: "./backend"
236236
- build-type: 'cublas'
237237
cuda-major-version: "12"
238-
cuda-minor-version: "8"
238+
cuda-minor-version: "0"
239239
platforms: 'linux/amd64'
240240
tag-latest: 'auto'
241241
tag-suffix: '-gpu-nvidia-cuda-12-diffusers'
@@ -248,7 +248,7 @@ jobs:
248248
# CUDA 12 additional backends
249249
- build-type: 'cublas'
250250
cuda-major-version: "12"
251-
cuda-minor-version: "8"
251+
cuda-minor-version: "0"
252252
platforms: 'linux/amd64'
253253
tag-latest: 'auto'
254254
tag-suffix: '-gpu-nvidia-cuda-12-kokoro'
@@ -260,7 +260,7 @@ jobs:
260260
context: "./backend"
261261
- build-type: 'cublas'
262262
cuda-major-version: "12"
263-
cuda-minor-version: "8"
263+
cuda-minor-version: "0"
264264
platforms: 'linux/amd64'
265265
tag-latest: 'auto'
266266
tag-suffix: '-gpu-nvidia-cuda-12-faster-whisper'
@@ -272,7 +272,7 @@ jobs:
272272
context: "./backend"
273273
- build-type: 'cublas'
274274
cuda-major-version: "12"
275-
cuda-minor-version: "8"
275+
cuda-minor-version: "0"
276276
platforms: 'linux/amd64'
277277
tag-latest: 'auto'
278278
tag-suffix: '-gpu-nvidia-cuda-12-coqui'
@@ -284,7 +284,7 @@ jobs:
284284
context: "./backend"
285285
- build-type: 'cublas'
286286
cuda-major-version: "12"
287-
cuda-minor-version: "8"
287+
cuda-minor-version: "0"
288288
platforms: 'linux/amd64'
289289
tag-latest: 'auto'
290290
tag-suffix: '-gpu-nvidia-cuda-12-bark'
@@ -296,7 +296,7 @@ jobs:
296296
context: "./backend"
297297
- build-type: 'cublas'
298298
cuda-major-version: "12"
299-
cuda-minor-version: "8"
299+
cuda-minor-version: "0"
300300
platforms: 'linux/amd64'
301301
tag-latest: 'auto'
302302
tag-suffix: '-gpu-nvidia-cuda-12-chatterbox'
@@ -578,7 +578,7 @@ jobs:
578578
context: "./"
579579
- build-type: 'cublas'
580580
cuda-major-version: "12"
581-
cuda-minor-version: "8"
581+
cuda-minor-version: "0"
582582
platforms: 'linux/arm64'
583583
skip-drivers: 'true'
584584
tag-latest: 'auto'
@@ -615,7 +615,7 @@ jobs:
615615
context: "./"
616616
- build-type: 'cublas'
617617
cuda-major-version: "12"
618-
cuda-minor-version: "8"
618+
cuda-minor-version: "0"
619619
platforms: 'linux/amd64'
620620
tag-latest: 'auto'
621621
tag-suffix: '-gpu-nvidia-cuda-12-stablediffusion-ggml'
@@ -675,7 +675,7 @@ jobs:
675675
context: "./"
676676
- build-type: 'cublas'
677677
cuda-major-version: "12"
678-
cuda-minor-version: "8"
678+
cuda-minor-version: "0"
679679
platforms: 'linux/arm64'
680680
skip-drivers: 'true'
681681
tag-latest: 'auto'
@@ -700,7 +700,7 @@ jobs:
700700
context: "./"
701701
- build-type: 'cublas'
702702
cuda-major-version: "12"
703-
cuda-minor-version: "8"
703+
cuda-minor-version: "0"
704704
platforms: 'linux/amd64'
705705
tag-latest: 'auto'
706706
tag-suffix: '-gpu-nvidia-cuda-12-whisper'
@@ -760,7 +760,7 @@ jobs:
760760
context: "./"
761761
- build-type: 'cublas'
762762
cuda-major-version: "12"
763-
cuda-minor-version: "8"
763+
cuda-minor-version: "0"
764764
platforms: 'linux/arm64'
765765
skip-drivers: 'true'
766766
tag-latest: 'auto'
@@ -836,7 +836,7 @@ jobs:
836836
context: "./backend"
837837
- build-type: 'cublas'
838838
cuda-major-version: "12"
839-
cuda-minor-version: "8"
839+
cuda-minor-version: "0"
840840
platforms: 'linux/amd64'
841841
tag-latest: 'auto'
842842
tag-suffix: '-gpu-nvidia-cuda-12-rfdetr'
@@ -872,7 +872,7 @@ jobs:
872872
context: "./backend"
873873
- build-type: 'cublas'
874874
cuda-major-version: "12"
875-
cuda-minor-version: "8"
875+
cuda-minor-version: "0"
876876
platforms: 'linux/arm64'
877877
skip-drivers: 'true'
878878
tag-latest: 'auto'
@@ -897,7 +897,7 @@ jobs:
897897
context: "./backend"
898898
- build-type: 'cublas'
899899
cuda-major-version: "12"
900-
cuda-minor-version: "8"
900+
cuda-minor-version: "0"
901901
platforms: 'linux/amd64'
902902
tag-latest: 'auto'
903903
tag-suffix: '-gpu-nvidia-cuda-12-exllama2'

.github/workflows/image-pr.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -36,7 +36,7 @@ jobs:
3636
include:
3737
- build-type: 'cublas'
3838
cuda-major-version: "12"
39-
cuda-minor-version: "8"
39+
cuda-minor-version: "0"
4040
platforms: 'linux/amd64'
4141
tag-latest: 'false'
4242
tag-suffix: '-gpu-nvidia-cuda-12'

.github/workflows/image.yml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -91,7 +91,7 @@ jobs:
9191
aio: "-aio-gpu-nvidia-cuda-11"
9292
- build-type: 'cublas'
9393
cuda-major-version: "12"
94-
cuda-minor-version: "8"
94+
cuda-minor-version: "0"
9595
platforms: 'linux/amd64'
9696
tag-latest: 'auto'
9797
tag-suffix: '-gpu-nvidia-cuda-12'
@@ -144,7 +144,7 @@ jobs:
144144
include:
145145
- build-type: 'cublas'
146146
cuda-major-version: "12"
147-
cuda-minor-version: "8"
147+
cuda-minor-version: "0"
148148
platforms: 'linux/arm64'
149149
tag-latest: 'auto'
150150
tag-suffix: '-nvidia-l4t-arm64'

Dockerfile

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -18,7 +18,7 @@ FROM requirements AS requirements-drivers
1818

1919
ARG BUILD_TYPE
2020
ARG CUDA_MAJOR_VERSION=12
21-
ARG CUDA_MINOR_VERSION=8
21+
ARG CUDA_MINOR_VERSION=0
2222
ARG SKIP_DRIVERS=false
2323
ARG TARGETARCH
2424
ARG TARGETVARIANT

Makefile

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -170,7 +170,7 @@ prepare-e2e:
170170
mkdir -p $(TEST_DIR)
171171
cp -rfv $(abspath ./tests/e2e-fixtures)/gpu.yaml $(TEST_DIR)/gpu.yaml
172172
test -e $(TEST_DIR)/ggllm-test-model.bin || wget -q https://huggingface.co/TheBloke/CodeLlama-7B-Instruct-GGUF/resolve/main/codellama-7b-instruct.Q2_K.gguf -O $(TEST_DIR)/ggllm-test-model.bin
173-
docker build --build-arg IMAGE_TYPE=core --build-arg BUILD_TYPE=$(BUILD_TYPE) --build-arg CUDA_MAJOR_VERSION=12 --build-arg CUDA_MINOR_VERSION=8 -t localai-tests .
173+
docker build --build-arg IMAGE_TYPE=core --build-arg BUILD_TYPE=$(BUILD_TYPE) --build-arg CUDA_MAJOR_VERSION=12 --build-arg CUDA_MINOR_VERSION=0 -t localai-tests .
174174

175175
run-e2e-image:
176176
ls -liah $(abspath ./tests/e2e-fixtures)

backend/README.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -111,7 +111,7 @@ docker build -f backend/Dockerfile.python \
111111
--build-arg BACKEND=transformers \
112112
--build-arg BUILD_TYPE=cublas12 \
113113
--build-arg CUDA_MAJOR_VERSION=12 \
114-
--build-arg CUDA_MINOR_VERSION=8 \
114+
--build-arg CUDA_MINOR_VERSION=0 \
115115
-t localai-backend-transformers .
116116

117117
# Build Go backend

0 commit comments

Comments
 (0)