@@ -1071,10 +1071,9 @@ sycl::event gemm_impl(sycl::queue &exec_q,
1071
1071
size_t delta_n (16 );
1072
1072
1073
1073
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
1074
- local_mem_size, reserved_slm_size,
1075
- delta_k, // modified by reference
1076
- n_wi, // modified by reference
1077
- delta_n // modified by reference
1074
+ local_mem_size, reserved_slm_size, delta_k,
1075
+ n_wi, // modified by reference
1076
+ delta_n // modified by reference
1078
1077
);
1079
1078
1080
1079
size_t n_blocks = (n + delta_n - 1 ) / delta_n;
@@ -1108,10 +1107,9 @@ sycl::event gemm_impl(sycl::queue &exec_q,
1108
1107
size_t delta_n (16 );
1109
1108
1110
1109
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
1111
- local_mem_size, reserved_slm_size,
1112
- delta_k, // modified by reference
1113
- n_wi, // modified by reference
1114
- delta_n // modified by reference
1110
+ local_mem_size, reserved_slm_size, delta_k,
1111
+ n_wi, // modified by reference
1112
+ delta_n // modified by reference
1115
1113
);
1116
1114
1117
1115
size_t n_blocks = (n + delta_n - 1 ) / delta_n;
@@ -1239,10 +1237,9 @@ sycl::event gemm_contig_impl(sycl::queue &exec_q,
1239
1237
size_t delta_n (16 );
1240
1238
1241
1239
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
1242
- local_mem_size, reserved_slm_size,
1243
- delta_k, // modified by reference
1244
- n_wi, // modified by reference
1245
- delta_n // modified by reference
1240
+ local_mem_size, reserved_slm_size, delta_k,
1241
+ n_wi, // modified by reference
1242
+ delta_n // modified by reference
1246
1243
);
1247
1244
1248
1245
size_t n_blocks = (n + delta_n - 1 ) / delta_n;
@@ -1276,10 +1273,9 @@ sycl::event gemm_contig_impl(sycl::queue &exec_q,
1276
1273
size_t delta_n (16 );
1277
1274
1278
1275
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
1279
- local_mem_size, reserved_slm_size,
1280
- delta_k, // modified by reference
1281
- n_wi, // modified by reference
1282
- delta_n // modified by reference
1276
+ local_mem_size, reserved_slm_size, delta_k,
1277
+ n_wi, // modified by reference
1278
+ delta_n // modified by reference
1283
1279
);
1284
1280
1285
1281
size_t n_blocks = (n + delta_n - 1 ) / delta_n;
@@ -1976,10 +1972,9 @@ sycl::event gemm_tree_impl(sycl::queue &exec_q,
1976
1972
constexpr int m_groups = 1 ;
1977
1973
1978
1974
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
1979
- local_mem_size, reserved_slm_size,
1980
- delta_k, // modified by reference
1981
- n_wi, // modified by reference
1982
- delta_n // modified by reference
1975
+ local_mem_size, reserved_slm_size, delta_k,
1976
+ n_wi, // modified by reference
1977
+ delta_n // modified by reference
1983
1978
);
1984
1979
1985
1980
sycl::event gemm_ev;
@@ -2250,10 +2245,9 @@ sycl::event gemm_tree_impl(sycl::queue &exec_q,
2250
2245
else {
2251
2246
constexpr int m_groups = 2 ;
2252
2247
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
2253
- local_mem_size, reserved_slm_size,
2254
- delta_k, // modified by reference
2255
- n_wi, // modified by reference
2256
- delta_n // modified by reference
2248
+ local_mem_size, reserved_slm_size, delta_k,
2249
+ n_wi, // modified by reference
2250
+ delta_n // modified by reference
2257
2251
);
2258
2252
2259
2253
sycl::event gemm_ev;
@@ -2529,10 +2523,9 @@ sycl::event gemm_tree_impl(sycl::queue &exec_q,
2529
2523
constexpr int m_groups = 1 ;
2530
2524
2531
2525
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
2532
- local_mem_size, reserved_slm_size,
2533
- delta_k, // modified by reference
2534
- n_wi, // modified by reference
2535
- delta_n // modified by reference
2526
+ local_mem_size, reserved_slm_size, delta_k,
2527
+ n_wi, // modified by reference
2528
+ delta_n // modified by reference
2536
2529
);
2537
2530
2538
2531
sycl::event gemm_ev;
@@ -3410,10 +3403,9 @@ sycl::event gemm_contig_tree_impl(sycl::queue &exec_q,
3410
3403
constexpr int m_groups = 1 ;
3411
3404
3412
3405
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
3413
- local_mem_size, reserved_slm_size,
3414
- delta_k, // modified by reference
3415
- n_wi, // modified by reference
3416
- delta_n // modified by reference
3406
+ local_mem_size, reserved_slm_size, delta_k,
3407
+ n_wi, // modified by reference
3408
+ delta_n // modified by reference
3417
3409
);
3418
3410
3419
3411
sycl::event gemm_ev;
@@ -3663,10 +3655,9 @@ sycl::event gemm_contig_tree_impl(sycl::queue &exec_q,
3663
3655
else {
3664
3656
constexpr int m_groups = 2 ;
3665
3657
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
3666
- local_mem_size, reserved_slm_size,
3667
- delta_k, // modified by reference
3668
- n_wi, // modified by reference
3669
- delta_n // modified by reference
3658
+ local_mem_size, reserved_slm_size, delta_k,
3659
+ n_wi, // modified by reference
3660
+ delta_n // modified by reference
3670
3661
);
3671
3662
3672
3663
sycl::event gemm_ev;
@@ -3920,10 +3911,9 @@ sycl::event gemm_contig_tree_impl(sycl::queue &exec_q,
3920
3911
constexpr int m_groups = 1 ;
3921
3912
3922
3913
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
3923
- local_mem_size, reserved_slm_size,
3924
- delta_k, // modified by reference
3925
- n_wi, // modified by reference
3926
- delta_n // modified by reference
3914
+ local_mem_size, reserved_slm_size, delta_k,
3915
+ n_wi, // modified by reference
3916
+ delta_n // modified by reference
3927
3917
);
3928
3918
3929
3919
sycl::event gemm_ev;
@@ -5476,10 +5466,9 @@ sycl::event gemm_batch_impl(sycl::queue &exec_q,
5476
5466
size_t delta_n (16 );
5477
5467
5478
5468
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
5479
- local_mem_size, reserved_slm_size,
5480
- delta_k, // modified by reference
5481
- n_wi, // modified by reference
5482
- delta_n // modified by reference
5469
+ local_mem_size, reserved_slm_size, delta_k,
5470
+ n_wi, // modified by reference
5471
+ delta_n // modified by reference
5483
5472
);
5484
5473
5485
5474
size_t n_blocks = (n + delta_n - 1 ) / delta_n;
@@ -5518,10 +5507,9 @@ sycl::event gemm_batch_impl(sycl::queue &exec_q,
5518
5507
size_t delta_n (16 );
5519
5508
5520
5509
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
5521
- local_mem_size, reserved_slm_size,
5522
- delta_k, // modified by reference
5523
- n_wi, // modified by reference
5524
- delta_n // modified by reference
5510
+ local_mem_size, reserved_slm_size, delta_k,
5511
+ n_wi, // modified by reference
5512
+ delta_n // modified by reference
5525
5513
);
5526
5514
5527
5515
size_t n_blocks = (n + delta_n - 1 ) / delta_n;
@@ -5680,10 +5668,9 @@ sycl::event gemm_batch_contig_impl(sycl::queue &exec_q,
5680
5668
size_t delta_n (16 );
5681
5669
5682
5670
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
5683
- local_mem_size, reserved_slm_size,
5684
- delta_k, // modified by reference
5685
- n_wi, // modified by reference
5686
- delta_n // modified by reference
5671
+ local_mem_size, reserved_slm_size, delta_k,
5672
+ n_wi, // modified by reference
5673
+ delta_n // modified by reference
5687
5674
);
5688
5675
5689
5676
size_t n_blocks = (n + delta_n - 1 ) / delta_n;
@@ -5722,10 +5709,9 @@ sycl::event gemm_batch_contig_impl(sycl::queue &exec_q,
5722
5709
size_t delta_n (16 );
5723
5710
5724
5711
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
5725
- local_mem_size, reserved_slm_size,
5726
- delta_k, // modified by reference
5727
- n_wi, // modified by reference
5728
- delta_n // modified by reference
5712
+ local_mem_size, reserved_slm_size, delta_k,
5713
+ n_wi, // modified by reference
5714
+ delta_n // modified by reference
5729
5715
);
5730
5716
5731
5717
size_t n_blocks = (n + delta_n - 1 ) / delta_n;
@@ -6506,10 +6492,9 @@ gemm_batch_tree_impl(sycl::queue &exec_q,
6506
6492
if (m == 1 ) {
6507
6493
constexpr int m_groups = 1 ;
6508
6494
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
6509
- local_mem_size, reserved_slm_size,
6510
- delta_k, // modified by reference
6511
- n_wi, // modified by reference
6512
- delta_n // modified by reference
6495
+ local_mem_size, reserved_slm_size, delta_k,
6496
+ n_wi, // modified by reference
6497
+ delta_n // modified by reference
6513
6498
);
6514
6499
6515
6500
if (k <= (delta_k * n_wi)) {
@@ -6836,10 +6821,9 @@ gemm_batch_tree_impl(sycl::queue &exec_q,
6836
6821
constexpr int m_groups = 2 ;
6837
6822
6838
6823
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
6839
- local_mem_size, reserved_slm_size,
6840
- delta_k, // modified by reference
6841
- n_wi, // modified by reference
6842
- delta_n // modified by reference
6824
+ local_mem_size, reserved_slm_size, delta_k,
6825
+ n_wi, // modified by reference
6826
+ delta_n // modified by reference
6843
6827
);
6844
6828
6845
6829
if (k <= (delta_k * n_wi)) {
@@ -7174,10 +7158,9 @@ gemm_batch_tree_impl(sycl::queue &exec_q,
7174
7158
constexpr int m_groups = 1 ;
7175
7159
7176
7160
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
7177
- local_mem_size, reserved_slm_size,
7178
- delta_k, // modified by reference
7179
- n_wi, // modified by reference
7180
- delta_n // modified by reference
7161
+ local_mem_size, reserved_slm_size, delta_k,
7162
+ n_wi, // modified by reference
7163
+ delta_n // modified by reference
7181
7164
);
7182
7165
7183
7166
// each group processes delta_k * n_wi
@@ -8212,10 +8195,9 @@ gemm_batch_contig_tree_impl(sycl::queue &exec_q,
8212
8195
if (m == 1 ) {
8213
8196
constexpr int m_groups = 1 ;
8214
8197
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
8215
- local_mem_size, reserved_slm_size,
8216
- delta_k, // modified by reference
8217
- n_wi, // modified by reference
8218
- delta_n // modified by reference
8198
+ local_mem_size, reserved_slm_size, delta_k,
8199
+ n_wi, // modified by reference
8200
+ delta_n // modified by reference
8219
8201
);
8220
8202
8221
8203
if (k <= (delta_k * n_wi)) {
@@ -8533,10 +8515,9 @@ gemm_batch_contig_tree_impl(sycl::queue &exec_q,
8533
8515
constexpr int m_groups = 2 ;
8534
8516
8535
8517
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
8536
- local_mem_size, reserved_slm_size,
8537
- delta_k, // modified by reference
8538
- n_wi, // modified by reference
8539
- delta_n // modified by reference
8518
+ local_mem_size, reserved_slm_size, delta_k,
8519
+ n_wi, // modified by reference
8520
+ delta_n // modified by reference
8540
8521
);
8541
8522
8542
8523
if (k <= (delta_k * n_wi)) {
@@ -8857,10 +8838,9 @@ gemm_batch_contig_tree_impl(sycl::queue &exec_q,
8857
8838
constexpr int m_groups = 1 ;
8858
8839
8859
8840
gemm_detail::scale_gemm_k_parameters<resTy, m_groups>(
8860
- local_mem_size, reserved_slm_size,
8861
- delta_k, // modified by reference
8862
- n_wi, // modified by reference
8863
- delta_n // modified by reference
8841
+ local_mem_size, reserved_slm_size, delta_k,
8842
+ n_wi, // modified by reference
8843
+ delta_n // modified by reference
8864
8844
);
8865
8845
8866
8846
// each group processes delta_k * n_wi
0 commit comments