@@ -544,8 +544,8 @@ static void reorder_mul_mat_vec_q4_0_q8_1_sycl(const void * vx, const void * vy,
544
544
const sycl::range<3 > global_size (1 , GGML_SYCL_MMV_Y, (block_num_y * WARP_SIZE));
545
545
const sycl::range<3 > workgroup_size (1 , GGML_SYCL_MMV_Y, num_subgroups * WARP_SIZE);
546
546
547
- stream-> submit ([&](sycl::handler & cgh) {
548
- cgh. parallel_for ( sycl::nd_range<3 >(global_size, workgroup_size),
547
+ syclex:: submit (*stream, [&](sycl::handler & cgh) {
548
+ syclex::nd_launch (cgh, sycl::nd_range<3 >(global_size, workgroup_size),
549
549
[=](sycl::nd_item<3 > nd_item) [[sycl::reqd_sub_group_size (WARP_SIZE)]] {
550
550
mul_mat_vec_q_reorder<reorder_vec_dot_q_sycl<GGML_TYPE_Q4_0>>(vx, vy, dst, ncols, nrows,
551
551
nd_item);
@@ -561,8 +561,8 @@ static void mul_mat_vec_q4_0_q8_1_sycl(const void * vx, const void * vy, float *
561
561
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
562
562
563
563
{
564
- stream-> submit ([&](sycl::handler & cgh) {
565
- cgh. parallel_for ( sycl::nd_range<3 >(block_nums * block_dims, block_dims),
564
+ syclex:: submit (*stream, [&](sycl::handler & cgh) {
565
+ syclex::nd_launch (cgh, sycl::nd_range<3 >(block_nums * block_dims, block_dims),
566
566
[=](sycl::nd_item<3 > item_ct1) [[sycl::reqd_sub_group_size (WARP_SIZE)]] {
567
567
mul_mat_vec_q<QK4_0, QI4_0, block_q4_0, VDR_Q4_0_Q8_1_MMVQ, vec_dot_q4_0_q8_1>(
568
568
vx, vy, dst, ncols, nrows, item_ct1);
@@ -581,9 +581,9 @@ static void mul_mat_vec_q4_1_q8_1_sycl(const void *vx, const void *vy,
581
581
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
582
582
{
583
583
584
- stream-> submit ([&](sycl::handler &cgh) {
584
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
585
585
586
- cgh. parallel_for (
586
+ syclex::nd_launch (cgh,
587
587
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
588
588
[=](sycl::nd_item<3 > item_ct1)
589
589
[[sycl::reqd_sub_group_size (WARP_SIZE)]] {
@@ -605,9 +605,9 @@ static void mul_mat_vec_q5_0_q8_1_sycl(const void *vx, const void *vy,
605
605
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
606
606
{
607
607
608
- stream-> submit ([&](sycl::handler &cgh) {
608
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
609
609
610
- cgh. parallel_for (
610
+ syclex::nd_launch (cgh,
611
611
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
612
612
[=](sycl::nd_item<3 > item_ct1)
613
613
[[sycl::reqd_sub_group_size (WARP_SIZE)]] {
@@ -629,9 +629,9 @@ static void mul_mat_vec_q5_1_q8_1_sycl(const void *vx, const void *vy,
629
629
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
630
630
{
631
631
632
- stream-> submit ([&](sycl::handler &cgh) {
632
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
633
633
634
- cgh. parallel_for (
634
+ syclex::nd_launch (cgh,
635
635
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
636
636
[=](sycl::nd_item<3 > item_ct1)
637
637
[[sycl::reqd_sub_group_size (WARP_SIZE)]] {
@@ -653,9 +653,9 @@ static void mul_mat_vec_q8_0_q8_1_sycl(const void *vx, const void *vy,
653
653
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
654
654
{
655
655
656
- stream-> submit ([&](sycl::handler &cgh) {
656
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
657
657
658
- cgh. parallel_for (
658
+ syclex::nd_launch (cgh,
659
659
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
660
660
[=](sycl::nd_item<3 > item_ct1)
661
661
[[sycl::reqd_sub_group_size (WARP_SIZE)]] {
@@ -677,9 +677,9 @@ static void mul_mat_vec_q2_K_q8_1_sycl(const void *vx, const void *vy,
677
677
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
678
678
{
679
679
680
- stream-> submit ([&](sycl::handler &cgh) {
680
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
681
681
682
- cgh. parallel_for (
682
+ syclex::nd_launch (cgh,
683
683
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
684
684
[=](sycl::nd_item<3 > item_ct1)
685
685
[[sycl::reqd_sub_group_size (WARP_SIZE)]] {
@@ -701,9 +701,9 @@ static void mul_mat_vec_q3_K_q8_1_sycl(const void *vx, const void *vy,
701
701
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
702
702
{
703
703
704
- stream-> submit ([&](sycl::handler &cgh) {
704
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
705
705
706
- cgh. parallel_for (
706
+ syclex::nd_launch (cgh,
707
707
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
708
708
[=](sycl::nd_item<3 > item_ct1)
709
709
[[sycl::reqd_sub_group_size (WARP_SIZE)]] {
@@ -725,9 +725,9 @@ static void mul_mat_vec_q4_K_q8_1_sycl(const void *vx, const void *vy,
725
725
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
726
726
{
727
727
728
- stream-> submit ([&](sycl::handler &cgh) {
728
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
729
729
730
- cgh. parallel_for (
730
+ syclex::nd_launch (cgh,
731
731
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
732
732
[=](sycl::nd_item<3 > item_ct1)
733
733
[[sycl::reqd_sub_group_size (WARP_SIZE)]] {
@@ -750,8 +750,8 @@ static void reorder_mul_mat_vec_q4_k_q8_1_sycl(const void * vx, const void * vy,
750
750
const sycl::range<3 > global_size (1 , GGML_SYCL_MMV_Y, block_num_y * WARP_SIZE);
751
751
const sycl::range<3 > workgroup_size (1 , GGML_SYCL_MMV_Y, num_subgroups * WARP_SIZE);
752
752
753
- stream-> submit ([&](sycl::handler & cgh) {
754
- cgh. parallel_for ( sycl::nd_range<3 >(global_size, workgroup_size),
753
+ syclex:: submit (*stream, [&](sycl::handler & cgh) {
754
+ syclex::nd_launch (cgh, sycl::nd_range<3 >(global_size, workgroup_size),
755
755
[=](sycl::nd_item<3 > nd_item) [[sycl::reqd_sub_group_size (WARP_SIZE)]] {
756
756
mul_mat_vec_q_reorder<reorder_vec_dot_q_sycl<GGML_TYPE_Q4_K>>(vx, vy, dst, ncols,
757
757
nrows, nd_item);
@@ -770,9 +770,9 @@ static void mul_mat_vec_q5_K_q8_1_sycl(const void *vx, const void *vy,
770
770
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
771
771
{
772
772
773
- stream-> submit ([&](sycl::handler &cgh) {
773
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
774
774
775
- cgh. parallel_for (
775
+ syclex::nd_launch (cgh,
776
776
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
777
777
[=](sycl::nd_item<3 > item_ct1)
778
778
[[sycl::reqd_sub_group_size (WARP_SIZE)]] {
@@ -794,8 +794,8 @@ static void reorder_mul_mat_vec_q6_k_q8_1_sycl(const void * vx, const void * vy,
794
794
const sycl::range<3 > global_size (1 , GGML_SYCL_MMV_Y, block_num_y * WARP_SIZE);
795
795
const sycl::range<3 > workgroup_size (1 , GGML_SYCL_MMV_Y, num_subgroups * WARP_SIZE);
796
796
797
- stream-> submit ([&](sycl::handler & cgh) {
798
- cgh. parallel_for ( sycl::nd_range<3 >(global_size, workgroup_size),
797
+ syclex:: submit (*stream, [&](sycl::handler & cgh) {
798
+ syclex::nd_launch (cgh, sycl::nd_range<3 >(global_size, workgroup_size),
799
799
[=](sycl::nd_item<3 > nd_item) [[sycl::reqd_sub_group_size (WARP_SIZE)]] {
800
800
mul_mat_vec_q_reorder<reorder_vec_dot_q_sycl<GGML_TYPE_Q6_K>>(vx, vy, dst, ncols, nrows,
801
801
nd_item);
@@ -812,9 +812,9 @@ static void mul_mat_vec_q6_K_q8_1_sycl(const void *vx, const void *vy,
812
812
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
813
813
{
814
814
815
- stream-> submit ([&](sycl::handler &cgh) {
815
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
816
816
817
- cgh. parallel_for (
817
+ syclex::nd_launch (cgh,
818
818
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
819
819
[=](sycl::nd_item<3 > item_ct1)
820
820
[[sycl::reqd_sub_group_size (WARP_SIZE)]] {
@@ -836,8 +836,8 @@ static void mul_mat_vec_iq2_xxs_q8_1_sycl(const void *vx, const void *vy,
836
836
const sycl::range<3 > block_nums (1 , 1 , block_num_y);
837
837
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
838
838
{
839
- stream-> submit ([&](sycl::handler &cgh) {
840
- cgh. parallel_for (
839
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
840
+ syclex::nd_launch (cgh,
841
841
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
842
842
[=](sycl::nd_item<3 > item_ct1)
843
843
[[sycl::reqd_sub_group_size (WARP_SIZE)]] {
@@ -857,8 +857,8 @@ static void mul_mat_vec_iq2_xs_q8_1_sycl(const void *vx, const void *vy,
857
857
const sycl::range<3 > block_nums (1 , 1 , block_num_y);
858
858
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
859
859
{
860
- stream-> submit ([&](sycl::handler & cgh) {
861
- cgh. parallel_for (
860
+ syclex:: submit (*stream, [&](sycl::handler & cgh) {
861
+ syclex::nd_launch (cgh,
862
862
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
863
863
[=](sycl::nd_item<3 > item_ct1)
864
864
[[sycl::reqd_sub_group_size (WARP_SIZE)]] {
@@ -879,8 +879,8 @@ static void mul_mat_vec_iq2_s_q8_1_sycl(const void *vx, const void *vy,
879
879
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
880
880
{
881
881
882
- stream-> submit ([&](sycl::handler &cgh) {
883
- cgh. parallel_for (
882
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
883
+ syclex::nd_launch (cgh,
884
884
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
885
885
[=](sycl::nd_item<3 > item_ct1)
886
886
[[sycl::reqd_sub_group_size (WARP_SIZE)]] {
@@ -901,8 +901,8 @@ static void mul_mat_vec_iq3_xxs_q8_1_sycl(const void *vx, const void *vy,
901
901
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
902
902
{
903
903
904
- stream-> submit ([&](sycl::handler &cgh) {
905
- cgh. parallel_for (
904
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
905
+ syclex::nd_launch (cgh,
906
906
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
907
907
[=](sycl::nd_item<3 > item_ct1)
908
908
[[sycl::reqd_sub_group_size (WARP_SIZE)]] {
@@ -923,8 +923,8 @@ static void mul_mat_vec_iq3_s_q8_1_sycl(const void *vx, const void *vy,
923
923
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
924
924
{
925
925
926
- stream-> submit ([&](sycl::handler &cgh) {
927
- cgh. parallel_for (
926
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
927
+ syclex::nd_launch (cgh,
928
928
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
929
929
[=](sycl::nd_item<3 > item_ct1)
930
930
[[sycl::reqd_sub_group_size (WARP_SIZE)]] {
@@ -945,8 +945,8 @@ static void mul_mat_vec_iq1_s_q8_1_sycl(const void *vx, const void *vy,
945
945
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
946
946
{
947
947
948
- stream-> submit ([&](sycl::handler &cgh) {
949
- cgh. parallel_for (
948
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
949
+ syclex::nd_launch (cgh,
950
950
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
951
951
[=](sycl::nd_item<3 > item_ct1)
952
952
[[sycl::reqd_sub_group_size (WARP_SIZE)]] {
@@ -966,8 +966,8 @@ static void mul_mat_vec_iq1_m_q8_1_sycl(const void *vx, const void *vy,
966
966
const sycl::range<3 > block_nums (1 , 1 , block_num_y);
967
967
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
968
968
{
969
- stream-> submit ([&](sycl::handler &cgh) {
970
- cgh. parallel_for (
969
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
970
+ syclex::nd_launch (cgh,
971
971
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
972
972
[=](sycl::nd_item<3 > item_ct1)
973
973
[[sycl::reqd_sub_group_size (WARP_SIZE)]] {
@@ -988,8 +988,8 @@ static void mul_mat_vec_iq4_nl_q8_1_sycl(const void *vx, const void *vy,
988
988
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
989
989
{
990
990
991
- stream-> submit ([&](sycl::handler &cgh) {
992
- cgh. parallel_for (
991
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
992
+ syclex::nd_launch (cgh,
993
993
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
994
994
[=](sycl::nd_item<3 > item_ct1)
995
995
[[sycl::reqd_sub_group_size (WARP_SIZE)]] {
@@ -1010,8 +1010,8 @@ static void mul_mat_vec_iq4_xs_q8_1_sycl(const void *vx, const void *vy,
1010
1010
const sycl::range<3 > block_dims (1 , GGML_SYCL_MMV_Y, WARP_SIZE);
1011
1011
{
1012
1012
1013
- stream-> submit ([&](sycl::handler &cgh) {
1014
- cgh. parallel_for (
1013
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
1014
+ syclex::nd_launch (cgh,
1015
1015
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
1016
1016
[=](sycl::nd_item<3 > item_ct1)
1017
1017
[[sycl::reqd_sub_group_size (WARP_SIZE)]] {
0 commit comments