@@ -1691,12 +1691,11 @@ namespace dpct
1691
1691
auto data_c = get_memory<Tc>(c);
1692
1692
oneapi::mkl::blas::column_major::gemm (
1693
1693
#ifdef GGML_SYCL_NVIDIA
1694
- oneapi::mkl::backend_selector<oneapi::mkl::backend::cublas>{q },
1694
+ oneapi::mkl::backend_selector<oneapi::mkl::backend::cublas>{ q },
1695
1695
#else
1696
- q,
1696
+ q,
1697
1697
#endif
1698
- a_trans, b_trans, m, n, k, alpha_value, data_a, lda,
1699
- data_b, ldb, beta_value, data_c, ldc);
1698
+ a_trans, b_trans, m, n, k, alpha_value, data_a, lda, data_b, ldb, beta_value, data_c, ldc);
1700
1699
}
1701
1700
1702
1701
template <typename VecT, class BinaryOperation , class = void >
@@ -1761,16 +1760,14 @@ namespace dpct
1761
1760
1762
1761
sycl::event e = oneapi::mkl::blas::column_major::gemm_batch (
1763
1762
#ifdef GGML_SYCL_NVIDIA
1764
- oneapi::mkl::backend_selector<oneapi::mkl::backend::cublas>{q },
1763
+ oneapi::mkl::backend_selector<oneapi::mkl::backend::cublas>{ q },
1765
1764
#else
1766
- q,
1765
+ q,
1767
1766
#endif
1768
- matrix_info->transpose_info , matrix_info->transpose_info + 1 ,
1769
- matrix_info->size_info , matrix_info->size_info + 1 ,
1770
- matrix_info->size_info + 2 , matrix_info->value_info ,
1771
- reinterpret_cast <const Ta **>(a), matrix_info->ld_info ,
1772
- reinterpret_cast <const Tb **>(b), matrix_info->ld_info + 1 ,
1773
- matrix_info->value_info + 1 , reinterpret_cast <Tc **>(c),
1767
+ matrix_info->transpose_info , matrix_info->transpose_info + 1 , matrix_info->size_info ,
1768
+ matrix_info->size_info + 1 , matrix_info->size_info + 2 , matrix_info->value_info ,
1769
+ reinterpret_cast <const Ta **>(a), matrix_info->ld_info , reinterpret_cast <const Tb **>(b),
1770
+ matrix_info->ld_info + 1 , matrix_info->value_info + 1 , reinterpret_cast <Tc **>(c),
1774
1771
matrix_info->ld_info + 2 , 1 , &(matrix_info->groupsize_info ));
1775
1772
1776
1773
q.submit ([&](sycl::handler &cgh)
@@ -1795,12 +1792,11 @@ namespace dpct
1795
1792
auto data_c = get_memory<Tc>(c);
1796
1793
oneapi::mkl::blas::column_major::gemm_batch (
1797
1794
#ifdef GGML_SYCL_NVIDIA
1798
- oneapi::mkl::backend_selector<oneapi::mkl::backend::cublas>{q },
1795
+ oneapi::mkl::backend_selector<oneapi::mkl::backend::cublas>{ q },
1799
1796
#else
1800
- q,
1797
+ q,
1801
1798
#endif
1802
- a_trans, b_trans, m, n, k, alpha_value, data_a, lda,
1803
- stride_a, data_b, ldb, stride_b, beta_value,
1799
+ a_trans, b_trans, m, n, k, alpha_value, data_a, lda, stride_a, data_b, ldb, stride_b, beta_value,
1804
1800
data_c, ldc, stride_c, batch_size);
1805
1801
}
1806
1802
0 commit comments