Skip to content

Commit 8461886

Browse files
committed
[MLIR][Math][GPU] Add lowering of absi and fpowi to libdevice
1 parent 22d4ff1 commit 8461886

File tree

2 files changed

+26
-0
lines changed

2 files changed

+26
-0
lines changed

mlir/lib/Conversion/GPUToNVVM/LowerGpuOpsToNVVMOps.cpp

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -509,6 +509,7 @@ void mlir::populateGpuToNVVMConversionPatterns(
509509

510510
populateOpPatterns<arith::RemFOp>(converter, patterns, "__nv_fmodf",
511511
"__nv_fmod");
512+
populateOpPatterns<math::AbsIOp>(converter, patterns, "__nv_abs");
512513
populateOpPatterns<math::AbsFOp>(converter, patterns, "__nv_fabsf",
513514
"__nv_fabs");
514515
populateOpPatterns<math::AcosOp>(converter, patterns, "__nv_acosf",
@@ -555,6 +556,7 @@ void mlir::populateGpuToNVVMConversionPatterns(
555556
"__nv_log2", "__nv_fast_log2f");
556557
populateOpPatterns<math::PowFOp>(converter, patterns, "__nv_powf", "__nv_pow",
557558
"__nv_fast_powf");
559+
populateOpPatterns<math::FPowIOp>(converter, patterns, "__nv_powif", "__nv_powi");
558560
populateOpPatterns<math::RoundOp>(converter, patterns, "__nv_roundf",
559561
"__nv_round");
560562
populateOpPatterns<math::RoundEvenOp>(converter, patterns, "__nv_rintf",

mlir/test/Conversion/GPUToNVVM/gpu-to-nvvm.mlir

Lines changed: 24 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1033,3 +1033,27 @@ module attributes {transform.with_named_sequence} {
10331033
transform.yield
10341034
}
10351035
}
1036+
1037+
1038+
gpu.module @test_module_52 {
1039+
// CHECK: llvm.func @__nv_abs(i32) -> i32
1040+
// CHECK-LABEL: func @gpu_abs
1041+
func.func @gpu_abs(%arg_i32 : i32) -> (i32) {
1042+
%result32 = math.absi %arg_i32 : i32
1043+
// CHECK: llvm.call @__nv_abs(%{{.*}}) : (i32) -> i32
1044+
func.return %result32 : i32
1045+
}
1046+
}
1047+
1048+
gpu.module @test_module_53 {
1049+
// CHECK: llvm.func @__nv_powif(f32, i32) -> f32
1050+
// CHECK: llvm.func @__nv_powi(f64, i32) -> f64
1051+
// CHECK-LABEL: func @gpu_powi
1052+
func.func @gpu_powi(%arg_f32 : f32, %arg_f64 : f64, %arg_i32 : i32) -> (f32, f64) {
1053+
%result32 = math.fpowi %arg_f32, %arg_i32 : f32, i32
1054+
// CHECK: llvm.call @__nv_powif(%{{.*}}, %{{.*}}) : (f32, i32) -> f32
1055+
%result64 = math.fpowi %arg_f64, %arg_i32 : f64, i32
1056+
// CHECK: llvm.call @__nv_powi(%{{.*}}, %{{.*}}) : (f64, i32) -> f64
1057+
func.return %result32, %result64 : f32, f64
1058+
}
1059+
}

0 commit comments

Comments
 (0)