@@ -381,24 +381,12 @@ jobs:
381
381
dockerfile : " ./backend/Dockerfile.python"
382
382
context : " ./backend"
383
383
# sycl builds
384
- - build-type : ' sycl_f32'
385
- cuda-major-version : " "
386
- cuda-minor-version : " "
387
- platforms : ' linux/amd64'
388
- tag-latest : ' auto'
389
- tag-suffix : ' -gpu-intel-sycl-f32-rerankers'
390
- runs-on : ' ubuntu-latest'
391
- base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
392
- skip-drivers : ' false'
393
- backend : " rerankers"
394
- dockerfile : " ./backend/Dockerfile.python"
395
- context : " ./backend"
396
- - build-type : ' sycl_f16'
384
+ - build-type : ' intel'
397
385
cuda-major-version : " "
398
386
cuda-minor-version : " "
399
387
platforms : ' linux/amd64'
400
388
tag-latest : ' auto'
401
- tag-suffix : ' -gpu-intel-sycl-f16- rerankers'
389
+ tag-suffix : ' -gpu-intel-rerankers'
402
390
runs-on : ' ubuntu-latest'
403
391
base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
404
392
skip-drivers : ' false'
@@ -429,157 +417,85 @@ jobs:
429
417
backend : " llama-cpp"
430
418
dockerfile : " ./backend/Dockerfile.llama-cpp"
431
419
context : " ./"
432
- - build-type : ' sycl_f32'
433
- cuda-major-version : " "
434
- cuda-minor-version : " "
435
- platforms : ' linux/amd64'
436
- tag-latest : ' auto'
437
- tag-suffix : ' -gpu-intel-sycl-f32-vllm'
438
- runs-on : ' ubuntu-latest'
439
- base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
440
- skip-drivers : ' false'
441
- backend : " vllm"
442
- dockerfile : " ./backend/Dockerfile.python"
443
- context : " ./backend"
444
- - build-type : ' sycl_f16'
420
+ - build-type : ' intel'
445
421
cuda-major-version : " "
446
422
cuda-minor-version : " "
447
423
platforms : ' linux/amd64'
448
424
tag-latest : ' auto'
449
- tag-suffix : ' -gpu-intel-sycl-f16- vllm'
425
+ tag-suffix : ' -gpu-intel-vllm'
450
426
runs-on : ' ubuntu-latest'
451
427
base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
452
428
skip-drivers : ' false'
453
429
backend : " vllm"
454
430
dockerfile : " ./backend/Dockerfile.python"
455
431
context : " ./backend"
456
- - build-type : ' sycl_f32'
457
- cuda-major-version : " "
458
- cuda-minor-version : " "
459
- platforms : ' linux/amd64'
460
- tag-latest : ' auto'
461
- tag-suffix : ' -gpu-intel-sycl-f32-transformers'
462
- runs-on : ' ubuntu-latest'
463
- base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
464
- skip-drivers : ' false'
465
- backend : " transformers"
466
- dockerfile : " ./backend/Dockerfile.python"
467
- context : " ./backend"
468
- - build-type : ' sycl_f16'
432
+ - build-type : ' intel'
469
433
cuda-major-version : " "
470
434
cuda-minor-version : " "
471
435
platforms : ' linux/amd64'
472
436
tag-latest : ' auto'
473
- tag-suffix : ' -gpu-intel-sycl-f16- transformers'
437
+ tag-suffix : ' -gpu-intel-transformers'
474
438
runs-on : ' ubuntu-latest'
475
439
base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
476
440
skip-drivers : ' false'
477
441
backend : " transformers"
478
442
dockerfile : " ./backend/Dockerfile.python"
479
443
context : " ./backend"
480
- - build-type : ' sycl_f32 '
444
+ - build-type : ' intel '
481
445
cuda-major-version : " "
482
446
cuda-minor-version : " "
483
447
platforms : ' linux/amd64'
484
448
tag-latest : ' auto'
485
- tag-suffix : ' -gpu-intel-sycl-f32- diffusers'
449
+ tag-suffix : ' -gpu-intel-diffusers'
486
450
runs-on : ' ubuntu-latest'
487
451
base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
488
452
skip-drivers : ' false'
489
453
backend : " diffusers"
490
454
dockerfile : " ./backend/Dockerfile.python"
491
455
context : " ./backend"
492
456
# SYCL additional backends
493
- - build-type : ' sycl_f32'
494
- cuda-major-version : " "
495
- cuda-minor-version : " "
496
- platforms : ' linux/amd64'
497
- tag-latest : ' auto'
498
- tag-suffix : ' -gpu-intel-sycl-f32-kokoro'
499
- runs-on : ' ubuntu-latest'
500
- base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
501
- skip-drivers : ' false'
502
- backend : " kokoro"
503
- dockerfile : " ./backend/Dockerfile.python"
504
- context : " ./backend"
505
- - build-type : ' sycl_f16'
457
+ - build-type : ' intel'
506
458
cuda-major-version : " "
507
459
cuda-minor-version : " "
508
460
platforms : ' linux/amd64'
509
461
tag-latest : ' auto'
510
- tag-suffix : ' -gpu-intel-sycl-f16- kokoro'
462
+ tag-suffix : ' -gpu-intel-kokoro'
511
463
runs-on : ' ubuntu-latest'
512
464
base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
513
465
skip-drivers : ' false'
514
466
backend : " kokoro"
515
467
dockerfile : " ./backend/Dockerfile.python"
516
468
context : " ./backend"
517
- - build-type : ' sycl_f32'
518
- cuda-major-version : " "
519
- cuda-minor-version : " "
520
- platforms : ' linux/amd64'
521
- tag-latest : ' auto'
522
- tag-suffix : ' -gpu-intel-sycl-f32-faster-whisper'
523
- runs-on : ' ubuntu-latest'
524
- base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
525
- skip-drivers : ' false'
526
- backend : " faster-whisper"
527
- dockerfile : " ./backend/Dockerfile.python"
528
- context : " ./backend"
529
- - build-type : ' sycl_f16'
469
+ - build-type : ' intel'
530
470
cuda-major-version : " "
531
471
cuda-minor-version : " "
532
472
platforms : ' linux/amd64'
533
473
tag-latest : ' auto'
534
- tag-suffix : ' -gpu-intel-sycl-f16- faster-whisper'
474
+ tag-suffix : ' -gpu-intel-faster-whisper'
535
475
runs-on : ' ubuntu-latest'
536
476
base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
537
477
skip-drivers : ' false'
538
478
backend : " faster-whisper"
539
479
dockerfile : " ./backend/Dockerfile.python"
540
480
context : " ./backend"
541
- - build-type : ' sycl_f32'
542
- cuda-major-version : " "
543
- cuda-minor-version : " "
544
- platforms : ' linux/amd64'
545
- tag-latest : ' auto'
546
- tag-suffix : ' -gpu-intel-sycl-f32-coqui'
547
- runs-on : ' ubuntu-latest'
548
- base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
549
- skip-drivers : ' false'
550
- backend : " coqui"
551
- dockerfile : " ./backend/Dockerfile.python"
552
- context : " ./backend"
553
- - build-type : ' sycl_f16'
481
+ - build-type : ' intel'
554
482
cuda-major-version : " "
555
483
cuda-minor-version : " "
556
484
platforms : ' linux/amd64'
557
485
tag-latest : ' auto'
558
- tag-suffix : ' -gpu-intel-sycl-f16- coqui'
486
+ tag-suffix : ' -gpu-intel-coqui'
559
487
runs-on : ' ubuntu-latest'
560
488
base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
561
489
skip-drivers : ' false'
562
490
backend : " coqui"
563
491
dockerfile : " ./backend/Dockerfile.python"
564
492
context : " ./backend"
565
- - build-type : ' sycl_f32'
566
- cuda-major-version : " "
567
- cuda-minor-version : " "
568
- platforms : ' linux/amd64'
569
- tag-latest : ' auto'
570
- tag-suffix : ' -gpu-intel-sycl-f32-bark'
571
- runs-on : ' ubuntu-latest'
572
- base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
573
- skip-drivers : ' false'
574
- backend : " bark"
575
- dockerfile : " ./backend/Dockerfile.python"
576
- context : " ./backend"
577
- - build-type : ' sycl_f16'
493
+ - build-type : ' intel'
578
494
cuda-major-version : " "
579
495
cuda-minor-version : " "
580
496
platforms : ' linux/amd64'
581
497
tag-latest : ' auto'
582
- tag-suffix : ' -gpu-intel-sycl-f16- bark'
498
+ tag-suffix : ' -gpu-intel-bark'
583
499
runs-on : ' ubuntu-latest'
584
500
base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
585
501
skip-drivers : ' false'
@@ -930,6 +846,67 @@ jobs:
930
846
backend : " rfdetr"
931
847
dockerfile : " ./backend/Dockerfile.python"
932
848
context : " ./backend"
849
+ # exllama2
850
+ - build-type : ' '
851
+ cuda-major-version : " "
852
+ cuda-minor-version : " "
853
+ platforms : ' linux/amd64'
854
+ tag-latest : ' auto'
855
+ tag-suffix : ' -cpu-exllama2'
856
+ runs-on : ' ubuntu-latest'
857
+ base-image : " ubuntu:22.04"
858
+ skip-drivers : ' false'
859
+ backend : " exllama2"
860
+ dockerfile : " ./backend/Dockerfile.python"
861
+ context : " ./backend"
862
+ - build-type : ' cublas'
863
+ cuda-major-version : " 12"
864
+ cuda-minor-version : " 0"
865
+ platforms : ' linux/amd64'
866
+ tag-latest : ' auto'
867
+ tag-suffix : ' -gpu-nvidia-cuda-12-exllama2'
868
+ runs-on : ' ubuntu-latest'
869
+ base-image : " ubuntu:22.04"
870
+ skip-drivers : ' false'
871
+ backend : " exllama2"
872
+ dockerfile : " ./backend/Dockerfile.python"
873
+ context : " ./backend"
874
+ - build-type : ' cublas'
875
+ cuda-major-version : " 11"
876
+ cuda-minor-version : " 7"
877
+ platforms : ' linux/amd64'
878
+ tag-latest : ' auto'
879
+ tag-suffix : ' -gpu-nvidia-cuda-11-exllama2'
880
+ runs-on : ' ubuntu-latest'
881
+ base-image : " ubuntu:22.04"
882
+ skip-drivers : ' false'
883
+ backend : " exllama2"
884
+ dockerfile : " ./backend/Dockerfile.python"
885
+ context : " ./backend"
886
+ - build-type : ' intel'
887
+ cuda-major-version : " "
888
+ cuda-minor-version : " "
889
+ platforms : ' linux/amd64'
890
+ tag-latest : ' auto'
891
+ tag-suffix : ' -gpu-intel-exllama2'
892
+ runs-on : ' ubuntu-latest'
893
+ base-image : " quay.io/go-skynet/intel-oneapi-base:latest"
894
+ skip-drivers : ' false'
895
+ backend : " exllama2"
896
+ dockerfile : " ./backend/Dockerfile.python"
897
+ context : " ./backend"
898
+ - build-type : ' hipblas'
899
+ cuda-major-version : " "
900
+ cuda-minor-version : " "
901
+ platforms : ' linux/amd64'
902
+ skip-drivers : ' true'
903
+ tag-latest : ' auto'
904
+ tag-suffix : ' -gpu-hipblas-exllama2'
905
+ base-image : " rocm/dev-ubuntu-22.04:6.1"
906
+ runs-on : ' ubuntu-latest'
907
+ backend : " exllama2"
908
+ dockerfile : " ./backend/Dockerfile.python"
909
+ context : " ./backend"
933
910
# runs out of space on the runner
934
911
# - build-type: 'hipblas'
935
912
# cuda-major-version: ""
0 commit comments