Skip to content

Commit 50945d0

Browse files
committed
Change the fmax and fmin fallback implementations back to the libdevice float functions
1 parent 1b49010 commit 50945d0

File tree

2 files changed

+2
-2
lines changed

2 files changed

+2
-2
lines changed

libclc/ptx-nvidiacl/libspirv/math/fmax.cl

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -37,7 +37,7 @@ _CLC_DEF _CLC_OVERLOAD half __spirv_ocl_fmax(half x, half y) {
37 | 37 |   if (__clc_nvvm_reflect_arch() >= 800) {
38 | 38 |   return __nvvm_fmax_f16(x, y);
39 | 39 |   }
40 |    | - return x > y ? x : y;
   | 40 | + return __nv_fmaxf(x,y);
41 | 41 |   }
42 | 42 |   _CLC_DEF _CLC_OVERLOAD half2 __spirv_ocl_fmax(half2 x, half2 y) {
43 | 43 |   if (__clc_nvvm_reflect_arch() >= 800) {

libclc/ptx-nvidiacl/libspirv/math/fmin.cl

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -37,7 +37,7 @@ _CLC_DEF _CLC_OVERLOAD half __spirv_ocl_fmin(half x, half y) {
37 | 37 |   if (__clc_nvvm_reflect_arch() >= 800) {
38 | 38 |   return __nvvm_fmin_f16(x, y);
39 | 39 |   }
40 |    | - return x < y ? x : y;
   | 40 | + return __nv_fminf(x,y);
41 | 41 |   }
42 | 42 |   _CLC_DEF _CLC_OVERLOAD half2 __spirv_ocl_fmin(half2 x, half2 y) {
43 | 43 |   if (__clc_nvvm_reflect_arch() >= 800) {

0 commit comments

Comments
 (0)