@@ -381,24 +381,12 @@ jobs:
381381 dockerfile : " ./backend/Dockerfile.python"
382382 context : " ./backend"
383383 # sycl builds
384- - build-type : ' sycl_f32'
385- cuda-major-version : " "
386- cuda-minor-version : " "
387- platforms : ' linux/amd64'
388- tag-latest : ' auto'
389- tag-suffix : ' -gpu-intel-sycl-f32-rerankers'
390- runs-on : ' ubuntu-latest'
391- base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
392- skip-drivers : ' false'
393- backend : " rerankers"
394- dockerfile : " ./backend/Dockerfile.python"
395- context : " ./backend"
396- - build-type : ' sycl_f16'
384+ - build-type : ' intel'
397385 cuda-major-version : " "
398386 cuda-minor-version : " "
399387 platforms : ' linux/amd64'
400388 tag-latest : ' auto'
401- tag-suffix : ' -gpu-intel-sycl-f16- rerankers'
389+ tag-suffix : ' -gpu-intel-rerankers'
402390 runs-on : ' ubuntu-latest'
403391 base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
404392 skip-drivers : ' false'
@@ -429,157 +417,85 @@ jobs:
429417 backend : " llama-cpp"
430418 dockerfile : " ./backend/Dockerfile.llama-cpp"
431419 context : " ./"
432- - build-type : ' sycl_f32'
433- cuda-major-version : " "
434- cuda-minor-version : " "
435- platforms : ' linux/amd64'
436- tag-latest : ' auto'
437- tag-suffix : ' -gpu-intel-sycl-f32-vllm'
438- runs-on : ' ubuntu-latest'
439- base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
440- skip-drivers : ' false'
441- backend : " vllm"
442- dockerfile : " ./backend/Dockerfile.python"
443- context : " ./backend"
444- - build-type : ' sycl_f16'
420+ - build-type : ' intel'
445421 cuda-major-version : " "
446422 cuda-minor-version : " "
447423 platforms : ' linux/amd64'
448424 tag-latest : ' auto'
449- tag-suffix : ' -gpu-intel-sycl-f16- vllm'
425+ tag-suffix : ' -gpu-intel-vllm'
450426 runs-on : ' ubuntu-latest'
451427 base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
452428 skip-drivers : ' false'
453429 backend : " vllm"
454430 dockerfile : " ./backend/Dockerfile.python"
455431 context : " ./backend"
456- - build-type : ' sycl_f32'
457- cuda-major-version : " "
458- cuda-minor-version : " "
459- platforms : ' linux/amd64'
460- tag-latest : ' auto'
461- tag-suffix : ' -gpu-intel-sycl-f32-transformers'
462- runs-on : ' ubuntu-latest'
463- base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
464- skip-drivers : ' false'
465- backend : " transformers"
466- dockerfile : " ./backend/Dockerfile.python"
467- context : " ./backend"
468- - build-type : ' sycl_f16'
432+ - build-type : ' intel'
469433 cuda-major-version : " "
470434 cuda-minor-version : " "
471435 platforms : ' linux/amd64'
472436 tag-latest : ' auto'
473- tag-suffix : ' -gpu-intel-sycl-f16- transformers'
437+ tag-suffix : ' -gpu-intel-transformers'
474438 runs-on : ' ubuntu-latest'
475439 base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
476440 skip-drivers : ' false'
477441 backend : " transformers"
478442 dockerfile : " ./backend/Dockerfile.python"
479443 context : " ./backend"
480- - build-type : ' sycl_f32 '
444+ - build-type : ' intel'
481445 cuda-major-version : " "
482446 cuda-minor-version : " "
483447 platforms : ' linux/amd64'
484448 tag-latest : ' auto'
485- tag-suffix : ' -gpu-intel-sycl-f32- diffusers'
449+ tag-suffix : ' -gpu-intel-diffusers'
486450 runs-on : ' ubuntu-latest'
487451 base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
488452 skip-drivers : ' false'
489453 backend : " diffusers"
490454 dockerfile : " ./backend/Dockerfile.python"
491455 context : " ./backend"
492456 # SYCL additional backends
493- - build-type : ' sycl_f32'
494- cuda-major-version : " "
495- cuda-minor-version : " "
496- platforms : ' linux/amd64'
497- tag-latest : ' auto'
498- tag-suffix : ' -gpu-intel-sycl-f32-kokoro'
499- runs-on : ' ubuntu-latest'
500- base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
501- skip-drivers : ' false'
502- backend : " kokoro"
503- dockerfile : " ./backend/Dockerfile.python"
504- context : " ./backend"
505- - build-type : ' sycl_f16'
457+ - build-type : ' intel'
506458 cuda-major-version : " "
507459 cuda-minor-version : " "
508460 platforms : ' linux/amd64'
509461 tag-latest : ' auto'
510- tag-suffix : ' -gpu-intel-sycl-f16- kokoro'
462+ tag-suffix : ' -gpu-intel-kokoro'
511463 runs-on : ' ubuntu-latest'
512464 base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
513465 skip-drivers : ' false'
514466 backend : " kokoro"
515467 dockerfile : " ./backend/Dockerfile.python"
516468 context : " ./backend"
517- - build-type : ' sycl_f32'
518- cuda-major-version : " "
519- cuda-minor-version : " "
520- platforms : ' linux/amd64'
521- tag-latest : ' auto'
522- tag-suffix : ' -gpu-intel-sycl-f32-faster-whisper'
523- runs-on : ' ubuntu-latest'
524- base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
525- skip-drivers : ' false'
526- backend : " faster-whisper"
527- dockerfile : " ./backend/Dockerfile.python"
528- context : " ./backend"
529- - build-type : ' sycl_f16'
469+ - build-type : ' intel'
530470 cuda-major-version : " "
531471 cuda-minor-version : " "
532472 platforms : ' linux/amd64'
533473 tag-latest : ' auto'
534- tag-suffix : ' -gpu-intel-sycl-f16- faster-whisper'
474+ tag-suffix : ' -gpu-intel-faster-whisper'
535475 runs-on : ' ubuntu-latest'
536476 base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
537477 skip-drivers : ' false'
538478 backend : " faster-whisper"
539479 dockerfile : " ./backend/Dockerfile.python"
540480 context : " ./backend"
541- - build-type : ' sycl_f32'
542- cuda-major-version : " "
543- cuda-minor-version : " "
544- platforms : ' linux/amd64'
545- tag-latest : ' auto'
546- tag-suffix : ' -gpu-intel-sycl-f32-coqui'
547- runs-on : ' ubuntu-latest'
548- base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
549- skip-drivers : ' false'
550- backend : " coqui"
551- dockerfile : " ./backend/Dockerfile.python"
552- context : " ./backend"
553- - build-type : ' sycl_f16'
481+ - build-type : ' intel'
554482 cuda-major-version : " "
555483 cuda-minor-version : " "
556484 platforms : ' linux/amd64'
557485 tag-latest : ' auto'
558- tag-suffix : ' -gpu-intel-sycl-f16- coqui'
486+ tag-suffix : ' -gpu-intel-coqui'
559487 runs-on : ' ubuntu-latest'
560488 base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
561489 skip-drivers : ' false'
562490 backend : " coqui"
563491 dockerfile : " ./backend/Dockerfile.python"
564492 context : " ./backend"
565- - build-type : ' sycl_f32'
566- cuda-major-version : " "
567- cuda-minor-version : " "
568- platforms : ' linux/amd64'
569- tag-latest : ' auto'
570- tag-suffix : ' -gpu-intel-sycl-f32-bark'
571- runs-on : ' ubuntu-latest'
572- base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
573- skip-drivers : ' false'
574- backend : " bark"
575- dockerfile : " ./backend/Dockerfile.python"
576- context : " ./backend"
577- - build-type : ' sycl_f16'
493+ - build-type : ' intel'
578494 cuda-major-version : " "
579495 cuda-minor-version : " "
580496 platforms : ' linux/amd64'
581497 tag-latest : ' auto'
582- tag-suffix : ' -gpu-intel-sycl-f16- bark'
498+ tag-suffix : ' -gpu-intel-bark'
583499 runs-on : ' ubuntu-latest'
584500 base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
585501 skip-drivers : ' false'
@@ -930,6 +846,67 @@ jobs:
930846 backend : " rfdetr"
931847 dockerfile : " ./backend/Dockerfile.python"
932848 context : " ./backend"
849+ # exllama2
850+ - build-type : ' '
851+ cuda-major-version : " "
852+ cuda-minor-version : " "
853+ platforms : ' linux/amd64'
854+ tag-latest : ' auto'
855+ tag-suffix : ' -cpu-exllama2'
856+ runs-on : ' ubuntu-latest'
857+ base-image : " ubuntu:22.04"
858+ skip-drivers : ' false'
859+ backend : " exllama2"
860+ dockerfile : " ./backend/Dockerfile.python"
861+ context : " ./backend"
862+ - build-type : ' cublas'
863+ cuda-major-version : " 12"
864+ cuda-minor-version : " 0"
865+ platforms : ' linux/amd64'
866+ tag-latest : ' auto'
867+ tag-suffix : ' -gpu-nvidia-cuda-12-exllama2'
868+ runs-on : ' ubuntu-latest'
869+ base-image : " ubuntu:22.04"
870+ skip-drivers : ' false'
871+ backend : " exllama2"
872+ dockerfile : " ./backend/Dockerfile.python"
873+ context : " ./backend"
874+ - build-type : ' cublas'
875+ cuda-major-version : " 11"
876+ cuda-minor-version : " 7"
877+ platforms : ' linux/amd64'
878+ tag-latest : ' auto'
879+ tag-suffix : ' -gpu-nvidia-cuda-11-exllama2'
880+ runs-on : ' ubuntu-latest'
881+ base-image : " ubuntu:22.04"
882+ skip-drivers : ' false'
883+ backend : " exllama2"
884+ dockerfile : " ./backend/Dockerfile.python"
885+ context : " ./backend"
886+ - build-type : ' intel'
887+ cuda-major-version : " "
888+ cuda-minor-version : " "
889+ platforms : ' linux/amd64'
890+ tag-latest : ' auto'
891+ tag-suffix : ' -gpu-intel-exllama2'
892+ runs-on : ' ubuntu-latest'
893+ base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
894+ skip-drivers : ' false'
895+ backend : " exllama2"
896+ dockerfile : " ./backend/Dockerfile.python"
897+ context : " ./backend"
898+ - build-type : ' hipblas'
899+ cuda-major-version : " "
900+ cuda-minor-version : " "
901+ platforms : ' linux/amd64'
902+ skip-drivers : ' true'
903+ tag-latest : ' auto'
904+ tag-suffix : ' -gpu-hipblas-exllama2'
905+ base-image : " rocm/dev-ubuntu-22.04:6.1"
906+ runs-on : ' ubuntu-latest'
907+ backend : " exllama2"
908+ dockerfile : " ./backend/Dockerfile.python"
909+ context : " ./backend"
933910 # runs out of space on the runner
934911 # - build-type: 'hipblas'
935912 # cuda-major-version: ""
0 commit comments