@@ -1887,11 +1887,11 @@ static void argsort_f32_i32_sycl(const float *x, int *dst, const int ncols,
1887
1887
const size_t shared_mem = ncols_pad * sizeof (int );
1888
1888
1889
1889
if (order == GGML_SORT_ORDER_ASC) {
1890
- stream-> submit ([&](sycl::handler &cgh) {
1890
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
1891
1891
sycl::local_accessor<uint8_t , 1 > dpct_local_acc_ct1 (
1892
1892
sycl::range<1 >(shared_mem), cgh);
1893
1893
1894
- cgh. parallel_for (
1894
+ syclex::nd_launch (cgh,
1895
1895
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
1896
1896
[=](sycl::nd_item<3 > item_ct1) {
1897
1897
k_argsort_f32_i32<GGML_SORT_ORDER_ASC>(
@@ -1901,11 +1901,11 @@ static void argsort_f32_i32_sycl(const float *x, int *dst, const int ncols,
1901
1901
});
1902
1902
});
1903
1903
} else if (order == GGML_SORT_ORDER_DESC) {
1904
- stream-> submit ([&](sycl::handler &cgh) {
1904
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
1905
1905
sycl::local_accessor<uint8_t , 1 > dpct_local_acc_ct1 (
1906
1906
sycl::range<1 >(shared_mem), cgh);
1907
1907
1908
- cgh. parallel_for (
1908
+ syclex::nd_launch (cgh,
1909
1909
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
1910
1910
[=](sycl::nd_item<3 > item_ct1) {
1911
1911
k_argsort_f32_i32<GGML_SORT_ORDER_DESC>(
@@ -1925,13 +1925,13 @@ static void argmax_f32_i32_sycl(const float *x, int *dst, const int ncols,
1925
1925
const sycl::range<3 > block_nums (1 , nrows, 1 );
1926
1926
const size_t shared_mem = 256 * sizeof (float );
1927
1927
1928
- stream-> submit ([&](sycl::handler &cgh) {
1928
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
1929
1929
sycl::local_accessor<float , 1 > shared_data (
1930
1930
sycl::range<1 >(shared_mem/sizeof (float )), cgh);
1931
1931
sycl::local_accessor<int , 1 > shared_indices (
1932
1932
sycl::range<1 >(shared_mem/sizeof (float )), cgh);
1933
1933
1934
- cgh. parallel_for (
1934
+ syclex::nd_launch (cgh,
1935
1935
sycl::nd_range<3 >(block_nums * block_dims, block_dims),
1936
1936
[=](sycl::nd_item<3 > item_ct1) {
1937
1937
const int tid = item_ct1.get_local_id (2 );
@@ -2952,7 +2952,7 @@ static void ggml_sycl_mul_mat_batched_sycl(ggml_backend_sycl_context & ctx, cons
2952
2952
void ** ptrs_dst_get = ptrs_dst.get ();
2953
2953
size_t nb12_scaled = src1->type == GGML_TYPE_F16 ? nb12 : s12 * sizeof (sycl::half);
2954
2954
size_t nb13_scaled = src1->type == GGML_TYPE_F16 ? nb13 : s13 * sizeof (sycl::half);
2955
- cgh. parallel_for ( sycl::nd_range<3 >(block_dims, block_dims), [=](sycl::nd_item<3 > item_ct1) {
2955
+ syclex::nd_launch (cgh, sycl::nd_range<3 >(block_dims, block_dims), [=](sycl::nd_item<3 > item_ct1) {
2956
2956
k_compute_batched_ptrs (src0_f16, src1_f16, dst_ddf, ptrs_src_get, ptrs_dst_get, ne12, ne13, ne23, nb02,
2957
2957
nb03, nb12_scaled, nb13_scaled, nbd2, nbd3, r2, r3, item_ct1);
2958
2958
});
@@ -3456,7 +3456,7 @@ static void ggml_sycl_mul_mat_id(ggml_backend_sycl_context & ctx,
3456
3456
{
3457
3457
sycl::range<3 > block_dims (1 , 1 , std::min ((unsigned int )ne10, 768u ));
3458
3458
sycl::range<3 > grid_dims (1 , n_ids, ids->ne [1 ]);
3459
- stream-> submit ([&](sycl::handler &cgh) {
3459
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
3460
3460
sycl::local_accessor<int , 0 > src1_row_acc (cgh);
3461
3461
3462
3462
char *__restrict src1_contiguous_get =
@@ -3468,7 +3468,7 @@ static void ggml_sycl_mul_mat_id(ggml_backend_sycl_context & ctx,
3468
3468
size_t ids_nb_ct6 = ids->nb [1 ];
3469
3469
size_t ids_nb_ct7 = ids->nb [0 ];
3470
3470
3471
- cgh. parallel_for (
3471
+ syclex::nd_launch (cgh,
3472
3472
sycl::nd_range<3 >(grid_dims * block_dims, block_dims),
3473
3473
[=](sycl::nd_item<3 > item_ct1) {
3474
3474
k_copy_src1_to_contiguous (
@@ -3501,13 +3501,13 @@ static void ggml_sycl_mul_mat_id(ggml_backend_sycl_context & ctx,
3501
3501
{
3502
3502
sycl::range<3 > block_dims (1 , 1 , std::min ((unsigned int )ne0, 768u ));
3503
3503
sycl::range<3 > grid_dims (1 , 1 , num_src1_rows);
3504
- stream-> submit ([&](sycl::handler &cgh) {
3504
+ syclex:: submit (*stream, [&](sycl::handler &cgh) {
3505
3505
const char *__restrict dst_contiguous_get =
3506
3506
dst_contiguous.get ();
3507
3507
const mmid_row_mapping *__restrict dev_row_mapping_get =
3508
3508
dev_row_mapping.get ();
3509
3509
3510
- cgh. parallel_for (
3510
+ syclex::nd_launch (cgh,
3511
3511
sycl::nd_range<3 >(grid_dims * block_dims, block_dims),
3512
3512
[=](sycl::nd_item<3 > item_ct1) {
3513
3513
k_copy_dst_from_contiguous (dst_original,
0 commit comments