Skip to content

Commit 9352107

Browse files
committed
WIP
1 parent 77c5acb commit 9352107

File tree

3 files changed

+189
-1
lines changed

3 files changed

+189
-1
lines changed

.github/workflows/backend.yml

Lines changed: 169 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -197,6 +197,18 @@ jobs:
197197
backend: "rerankers"
198198
dockerfile: "./backend/Dockerfile.python"
199199
context: "./backend"
200+
- build-type: 'cublas'
201+
cuda-major-version: "13"
202+
cuda-minor-version: "0"
203+
platforms: 'linux/amd64'
204+
tag-latest: 'auto'
205+
tag-suffix: '-gpu-nvidia-cuda-13-rerankers'
206+
runs-on: 'ubuntu-latest'
207+
base-image: "ubuntu:22.04"
208+
skip-drivers: 'false'
209+
backend: "rerankers"
210+
dockerfile: "./backend/Dockerfile.python"
211+
context: "./backend"
200212
- build-type: 'cublas'
201213
cuda-major-version: "12"
202214
cuda-minor-version: "0"
@@ -209,6 +221,18 @@ jobs:
209221
backend: "llama-cpp"
210222
dockerfile: "./backend/Dockerfile.llama-cpp"
211223
context: "./"
224+
- build-type: 'cublas'
225+
cuda-major-version: "13"
226+
cuda-minor-version: "0"
227+
platforms: 'linux/amd64'
228+
tag-latest: 'auto'
229+
tag-suffix: '-gpu-nvidia-cuda-13-llama-cpp'
230+
runs-on: 'ubuntu-latest'
231+
base-image: "ubuntu:22.04"
232+
skip-drivers: 'false'
233+
backend: "llama-cpp"
234+
dockerfile: "./backend/Dockerfile.llama-cpp"
235+
context: "./"
212236
- build-type: 'cublas'
213237
cuda-major-version: "12"
214238
cuda-minor-version: "0"
@@ -221,6 +245,18 @@ jobs:
221245
backend: "vllm"
222246
dockerfile: "./backend/Dockerfile.python"
223247
context: "./backend"
248+
- build-type: 'cublas'
249+
cuda-major-version: "13"
250+
cuda-minor-version: "0"
251+
platforms: 'linux/amd64'
252+
tag-latest: 'auto'
253+
tag-suffix: '-gpu-nvidia-cuda-13-vllm'
254+
runs-on: 'arc-runner-set'
255+
base-image: "ubuntu:22.04"
256+
skip-drivers: 'false'
257+
backend: "vllm"
258+
dockerfile: "./backend/Dockerfile.python"
259+
context: "./backend"
224260
- build-type: 'cublas'
225261
cuda-major-version: "12"
226262
cuda-minor-version: "0"
@@ -233,6 +269,18 @@ jobs:
233269
backend: "transformers"
234270
dockerfile: "./backend/Dockerfile.python"
235271
context: "./backend"
272+
- build-type: 'cublas'
273+
cuda-major-version: "13"
274+
cuda-minor-version: "0"
275+
platforms: 'linux/amd64'
276+
tag-latest: 'auto'
277+
tag-suffix: '-gpu-nvidia-cuda-13-transformers'
278+
runs-on: 'ubuntu-latest'
279+
base-image: "ubuntu:22.04"
280+
skip-drivers: 'false'
281+
backend: "transformers"
282+
dockerfile: "./backend/Dockerfile.python"
283+
context: "./backend"
236284
- build-type: 'cublas'
237285
cuda-major-version: "12"
238286
cuda-minor-version: "0"
@@ -245,7 +293,19 @@ jobs:
245293
backend: "diffusers"
246294
dockerfile: "./backend/Dockerfile.python"
247295
context: "./backend"
248-
# CUDA 12 additional backends
296+
- build-type: 'cublas'
297+
cuda-major-version: "13"
298+
cuda-minor-version: "0"
299+
platforms: 'linux/amd64'
300+
tag-latest: 'auto'
301+
tag-suffix: '-gpu-nvidia-cuda-13-diffusers'
302+
runs-on: 'ubuntu-latest'
303+
base-image: "ubuntu:22.04"
304+
skip-drivers: 'false'
305+
backend: "diffusers"
306+
dockerfile: "./backend/Dockerfile.python"
307+
context: "./backend"
308+
# CUDA additional backends
249309
- build-type: 'cublas'
250310
cuda-major-version: "12"
251311
cuda-minor-version: "0"
@@ -258,6 +318,18 @@ jobs:
258318
backend: "kokoro"
259319
dockerfile: "./backend/Dockerfile.python"
260320
context: "./backend"
321+
- build-type: 'cublas'
322+
cuda-major-version: "13"
323+
cuda-minor-version: "0"
324+
platforms: 'linux/amd64'
325+
tag-latest: 'auto'
326+
tag-suffix: '-gpu-nvidia-cuda-13-kokoro'
327+
runs-on: 'ubuntu-latest'
328+
base-image: "ubuntu:22.04"
329+
skip-drivers: 'false'
330+
backend: "kokoro"
331+
dockerfile: "./backend/Dockerfile.python"
332+
context: "./backend"
261333
- build-type: 'cublas'
262334
cuda-major-version: "12"
263335
cuda-minor-version: "0"
@@ -270,6 +342,18 @@ jobs:
270342
backend: "faster-whisper"
271343
dockerfile: "./backend/Dockerfile.python"
272344
context: "./backend"
345+
- build-type: 'cublas'
346+
cuda-major-version: "13"
347+
cuda-minor-version: "0"
348+
platforms: 'linux/amd64'
349+
tag-latest: 'auto'
350+
tag-suffix: '-gpu-nvidia-cuda-13-faster-whisper'
351+
runs-on: 'ubuntu-latest'
352+
base-image: "ubuntu:22.04"
353+
skip-drivers: 'false'
354+
backend: "faster-whisper"
355+
dockerfile: "./backend/Dockerfile.python"
356+
context: "./backend"
273357
- build-type: 'cublas'
274358
cuda-major-version: "12"
275359
cuda-minor-version: "0"
@@ -282,6 +366,18 @@ jobs:
282366
backend: "coqui"
283367
dockerfile: "./backend/Dockerfile.python"
284368
context: "./backend"
369+
- build-type: 'cublas'
370+
cuda-major-version: "13"
371+
cuda-minor-version: "0"
372+
platforms: 'linux/amd64'
373+
tag-latest: 'auto'
374+
tag-suffix: '-gpu-nvidia-cuda-13-coqui'
375+
runs-on: 'ubuntu-latest'
376+
base-image: "ubuntu:22.04"
377+
skip-drivers: 'false'
378+
backend: "coqui"
379+
dockerfile: "./backend/Dockerfile.python"
380+
context: "./backend"
285381
- build-type: 'cublas'
286382
cuda-major-version: "12"
287383
cuda-minor-version: "0"
@@ -294,6 +390,18 @@ jobs:
294390
backend: "bark"
295391
dockerfile: "./backend/Dockerfile.python"
296392
context: "./backend"
393+
- build-type: 'cublas'
394+
cuda-major-version: "13"
395+
cuda-minor-version: "0"
396+
platforms: 'linux/amd64'
397+
tag-latest: 'auto'
398+
tag-suffix: '-gpu-nvidia-cuda-13-bark'
399+
runs-on: 'ubuntu-latest'
400+
base-image: "ubuntu:22.04"
401+
skip-drivers: 'false'
402+
backend: "bark"
403+
dockerfile: "./backend/Dockerfile.python"
404+
context: "./backend"
297405
- build-type: 'cublas'
298406
cuda-major-version: "12"
299407
cuda-minor-version: "0"
@@ -306,6 +414,18 @@ jobs:
306414
backend: "chatterbox"
307415
dockerfile: "./backend/Dockerfile.python"
308416
context: "./backend"
417+
- build-type: 'cublas'
418+
cuda-major-version: "13"
419+
cuda-minor-version: "0"
420+
platforms: 'linux/amd64'
421+
tag-latest: 'auto'
422+
tag-suffix: '-gpu-nvidia-cuda-13-chatterbox'
423+
runs-on: 'ubuntu-latest'
424+
base-image: "ubuntu:22.04"
425+
skip-drivers: 'false'
426+
backend: "chatterbox"
427+
dockerfile: "./backend/Dockerfile.python"
428+
context: "./backend"
309429
# hipblas builds
310430
- build-type: 'hipblas'
311431
cuda-major-version: ""
@@ -625,6 +745,18 @@ jobs:
625745
backend: "stablediffusion-ggml"
626746
dockerfile: "./backend/Dockerfile.golang"
627747
context: "./"
748+
- build-type: 'cublas'
749+
cuda-major-version: "13"
750+
cuda-minor-version: "0"
751+
platforms: 'linux/amd64'
752+
tag-latest: 'auto'
753+
tag-suffix: '-gpu-nvidia-cuda-13-stablediffusion-ggml'
754+
runs-on: 'ubuntu-latest'
755+
base-image: "ubuntu:22.04"
756+
skip-drivers: 'false'
757+
backend: "stablediffusion-ggml"
758+
dockerfile: "./backend/Dockerfile.golang"
759+
context: "./"
628760
- build-type: 'cublas'
629761
cuda-major-version: "11"
630762
cuda-minor-version: "7"
@@ -710,6 +842,18 @@ jobs:
710842
backend: "whisper"
711843
dockerfile: "./backend/Dockerfile.golang"
712844
context: "./"
845+
- build-type: 'cublas'
846+
cuda-major-version: "13"
847+
cuda-minor-version: "0"
848+
platforms: 'linux/amd64'
849+
tag-latest: 'auto'
850+
tag-suffix: '-gpu-nvidia-cuda-13-whisper'
851+
runs-on: 'ubuntu-latest'
852+
base-image: "ubuntu:22.04"
853+
skip-drivers: 'false'
854+
backend: "whisper"
855+
dockerfile: "./backend/Dockerfile.golang"
856+
context: "./"
713857
- build-type: 'cublas'
714858
cuda-major-version: "11"
715859
cuda-minor-version: "7"
@@ -846,6 +990,18 @@ jobs:
846990
backend: "rfdetr"
847991
dockerfile: "./backend/Dockerfile.python"
848992
context: "./backend"
993+
- build-type: 'cublas'
994+
cuda-major-version: "13"
995+
cuda-minor-version: "0"
996+
platforms: 'linux/amd64'
997+
tag-latest: 'auto'
998+
tag-suffix: '-gpu-nvidia-cuda-13-rfdetr'
999+
runs-on: 'ubuntu-latest'
1000+
base-image: "ubuntu:22.04"
1001+
skip-drivers: 'false'
1002+
backend: "rfdetr"
1003+
dockerfile: "./backend/Dockerfile.python"
1004+
context: "./backend"
8491005
- build-type: 'cublas'
8501006
cuda-major-version: "11"
8511007
cuda-minor-version: "7"
@@ -907,6 +1063,18 @@ jobs:
9071063
backend: "exllama2"
9081064
dockerfile: "./backend/Dockerfile.python"
9091065
context: "./backend"
1066+
- build-type: 'cublas'
1067+
cuda-major-version: "13"
1068+
cuda-minor-version: "0"
1069+
platforms: 'linux/amd64'
1070+
tag-latest: 'auto'
1071+
tag-suffix: '-gpu-nvidia-cuda-13-exllama2'
1072+
runs-on: 'ubuntu-latest'
1073+
base-image: "ubuntu:22.04"
1074+
skip-drivers: 'false'
1075+
backend: "exllama2"
1076+
dockerfile: "./backend/Dockerfile.python"
1077+
context: "./backend"
9101078
- build-type: 'cublas'
9111079
cuda-major-version: "11"
9121080
cuda-minor-version: "7"

.github/workflows/image-pr.yml

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -34,6 +34,15 @@ jobs:
3434
fail-fast: false
3535
matrix:
3636
include:
37+
- build-type: 'cublas'
38+
cuda-major-version: "13"
39+
cuda-minor-version: "0"
40+
platforms: 'linux/amd64'
41+
tag-latest: 'false'
42+
tag-suffix: '-gpu-nvidia-cuda-13'
43+
runs-on: 'ubuntu-latest'
44+
base-image: "ubuntu:22.04"
45+
makeflags: "--jobs=3 --output-sync=target"
3746
- build-type: 'cublas'
3847
cuda-major-version: "12"
3948
cuda-minor-version: "0"

.github/workflows/image.yml

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -100,6 +100,17 @@ jobs:
100100
skip-drivers: 'false'
101101
makeflags: "--jobs=4 --output-sync=target"
102102
aio: "-aio-gpu-nvidia-cuda-12"
103+
- build-type: 'cublas'
104+
cuda-major-version: "13"
105+
cuda-minor-version: "0"
106+
platforms: 'linux/amd64'
107+
tag-latest: 'auto'
108+
tag-suffix: '-gpu-nvidia-cuda-13'
109+
runs-on: 'ubuntu-latest'
110+
base-image: "ubuntu:22.04"
111+
skip-drivers: 'false'
112+
makeflags: "--jobs=4 --output-sync=target"
113+
aio: "-aio-gpu-nvidia-cuda-13"
103114
- build-type: 'vulkan'
104115
platforms: 'linux/amd64'
105116
tag-latest: 'auto'

0 commit comments

Comments
 (0)