@@ -24,8 +24,8 @@ static void acc_f32(const float * x, const float * y, float * dst, const int ne,
24
24
template <typename T>
25
25
static void gelu (const T * x, T * dst, const int k,
26
26
const sycl::nd_item<3 > &item_ct1) {
27
- const T GELU_COEF_A = to_T <T>(0 .044715f );
28
- const T SQRT_2_OVER_PI = to_T <T>(0 .79788456080286535587989211986876f );
27
+ const T GELU_COEF_A = static_cast <T>(0 .044715f );
28
+ const T SQRT_2_OVER_PI = static_cast <T>(0 .79788456080286535587989211986876f );
29
29
const int i = item_ct1.get_local_range (2 ) * item_ct1.get_group (2 ) +
30
30
item_ct1.get_local_id (2 );
31
31
@@ -34,9 +34,9 @@ static void gelu(const T * x, T * dst, const int k,
34
34
}
35
35
36
36
float xi = x[i];
37
- dst[i] = to_T <T>(0 .5f ) * xi *
38
- (to_T <T>(1 .0f ) +
39
- sycl::tanh (SQRT_2_OVER_PI * xi * (to_T <T>(1 .0f ) + GELU_COEF_A * xi * xi)));
37
+ dst[i] = static_cast <T>(0 .5f ) * xi *
38
+ (static_cast <T>(1 .0f ) +
39
+ sycl::tanh (SQRT_2_OVER_PI * xi * (static_cast <T>(1 .0f ) + GELU_COEF_A * xi * xi)));
40
40
}
41
41
42
42
template <typename T>
@@ -48,7 +48,7 @@ static void silu(const T * x, T * dst, const int k,
48
48
if (i >= k) {
49
49
return ;
50
50
}
51
- dst[i] = x[i] / (to_T <T>(1 .0f ) + sycl::native::exp (-x[i]));
51
+ dst[i] = x[i] / (static_cast <T>(1 .0f ) + sycl::native::exp (-x[i]));
52
52
}
53
53
54
54
template <typename T>
@@ -60,7 +60,7 @@ static void gelu_quick(const T *x, T *dst, int k,
60
60
if (i >= k) {
61
61
return ;
62
62
}
63
- dst[i] = x[i] * (to_T <T>(1 .0f ) / (to_T <T>(1 .0f ) + sycl::native::exp (GELU_QUICK_COEF * x[i])));
63
+ dst[i] = x[i] * (static_cast <T>(1 .0f ) / (static_cast <T>(1 .0f ) + sycl::native::exp (GELU_QUICK_COEF * x[i])));
64
64
}
65
65
66
66
template <typename T>
@@ -95,7 +95,7 @@ static void sigmoid(const T * x, T * dst, const int k,
95
95
if (i >= k) {
96
96
return ;
97
97
}
98
- dst[i] = 1 .0f / (to_T <T>(1 .0f ) + sycl::native::exp (-x[i]));
98
+ dst[i] = 1 .0f / (static_cast <T>(1 .0f ) + sycl::native::exp (-x[i]));
99
99
}
100
100
101
101
template <typename T>
@@ -143,7 +143,7 @@ static void hardsigmoid(const T * x, T * dst, const int k,
143
143
if (i >= k) {
144
144
return ;
145
145
}
146
- dst[i] = sycl::fmin (to_T <T>(1 .0f ), sycl::fmax (to_T <T>(0 .0f ), (x[i] + to_T <T>(3 .0f )) / to_T <T>(6 .0f )));
146
+ dst[i] = sycl::fmin (static_cast <T>(1 .0f ), sycl::fmax (static_cast <T>(0 .0f ), (x[i] + static_cast <T>(3 .0f )) / static_cast <T>(6 .0f )));
147
147
}
148
148
149
149
template <typename T>
@@ -155,7 +155,7 @@ static void hardswish(const T * x, T * dst, const int k,
155
155
if (i >= k) {
156
156
return ;
157
157
}
158
- dst[i] = x[i] * sycl::fmin (to_T <T>(1 .0f ), sycl::fmax (to_T <T>(0 .0f ), (x[i] + to_T <T>(3 .0f )) / to_T <T>(6 .0f )));
158
+ dst[i] = x[i] * sycl::fmin (static_cast <T>(1 .0f ), sycl::fmax (static_cast <T>(0 .0f ), (x[i] + static_cast <T>(3 .0f )) / static_cast <T>(6 .0f )));
159
159
}
160
160
161
161
template <typename T>
@@ -276,7 +276,7 @@ static void pad(const T *x, T *dst, const int ne0, const int ne00, const int ne
276
276
item_ct1.get_group (0 ) * ne00 * ne01;
277
277
dst[offset_dst] = x[offset_src];
278
278
} else {
279
- dst[offset_dst] = to_T <T>(0 .0f );
279
+ dst[offset_dst] = static_cast <T>(0 .0f );
280
280
}
281
281
}
282
282
0 commit comments