[Analysis] isTriviallyVectorizable - add vectorization support for acos/asin/atan and cosh/sinh/tanh intrinsics #106584

RKSimon · 2024-08-29T16:52:54Z

Show the fallback cases in the amdlibm tests where the library doesn't provide that specific op

llvmbot · 2024-08-29T16:53:27Z

@llvm/pr-subscribers-llvm-analysis

@llvm/pr-subscribers-llvm-transforms

Author: Simon Pilgrim (RKSimon)

Changes

Show the fallback cases in the amdlibm tests where the library doesn't provide that specific op

Full diff: https://github.com/llvm/llvm-project/pull/106584.diff

2 Files Affected:

(modified) llvm/lib/Analysis/VectorUtils.cpp (+6)
(modified) llvm/test/Transforms/LoopVectorize/X86/amdlibm-calls.ll (+13)

diff --git a/llvm/lib/Analysis/VectorUtils.cpp b/llvm/lib/Analysis/VectorUtils.cpp
index cc742ab35f4498..32ce34114b2f50 100644
--- a/llvm/lib/Analysis/VectorUtils.cpp
+++ b/llvm/lib/Analysis/VectorUtils.cpp
@@ -66,9 +66,15 @@ bool llvm::isTriviallyVectorizable(Intrinsic::ID ID) {
   case Intrinsic::umul_fix:
   case Intrinsic::umul_fix_sat:
   case Intrinsic::sqrt: // Begin floating-point.
+  case Intrinsic::asin:
+  case Intrinsic::acos:
+  case Intrinsic::atan:
   case Intrinsic::sin:
   case Intrinsic::cos:
   case Intrinsic::tan:
+  case Intrinsic::sinh:
+  case Intrinsic::cosh:
+  case Intrinsic::tanh:
   case Intrinsic::exp:
   case Intrinsic::exp2:
   case Intrinsic::log:
diff --git a/llvm/test/Transforms/LoopVectorize/X86/amdlibm-calls.ll b/llvm/test/Transforms/LoopVectorize/X86/amdlibm-calls.ll
index 04289d43f40e2f..c051e2f18380bd 100644
--- a/llvm/test/Transforms/LoopVectorize/X86/amdlibm-calls.ll
+++ b/llvm/test/Transforms/LoopVectorize/X86/amdlibm-calls.ll
@@ -414,6 +414,7 @@ for.end:
 
 define void @acos_f32_intrinsic(ptr nocapture %varray) {
 ; CHECK-LABEL: @acos_f32_intrinsic(
+; CHECK-VF2:    [[TMP5:%.*]] = call <2 x float> @llvm.acos.v2f32(<2 x float> [[TMP4:%.*]])
 ; CHECK-VF4:    [[TMP5:%.*]] = call <4 x float> @amd_vrs4_acosf(<4 x float> [[TMP4:%.*]])
 ; CHECK-VF8:    [[TMP5:%.*]] = call <8 x float> @amd_vrs8_acosf(<8 x float> [[TMP4:%.*]])
 ; CHECK-VF16:   [[TMP5:%.*]] = call <16 x float> @amd_vrs16_acosf(<16 x float> [[TMP4:%.*]])
@@ -487,7 +488,10 @@ for.end:
 
 define void @asin_f64_intrinsic(ptr nocapture %varray) {
 ; CHECK-LABEL: @asin_f64_intrinsic(
+; CHECK-VF2:    [[TMP5:%.*]] = call <2 x double> @llvm.asin.v2f64(<2 x double> [[TMP4:%.*]])
+; CHECK-VF4:    [[TMP5:%.*]] = call <4 x double> @llvm.asin.v4f64(<4 x double> [[TMP4:%.*]])
 ; CHECK-VF8:    [[TMP5:%.*]] = call <8 x double> @amd_vrd8_asin(<8 x double> [[TMP4:%.*]])
+; CHECK-VF16:   [[TMP5:%.*]] = call <16 x double> @llvm.asin.v16f64(<16 x double> [[TMP4:%.*]])
 ; CHECK:        ret void
 ;
 entry:
@@ -510,6 +514,7 @@ for.end:
 
 define void @asin_f32_intrinsic(ptr nocapture %varray) {
 ; CHECK-LABEL: @asin_f32_intrinsic(
+; CHECK-VF2:    [[TMP5:%.*]] = call <2 x float> @llvm.asin.v2f32(<2 x float> [[TMP4:%.*]])
 ; CHECK-VF4:    [[TMP5:%.*]] = call <4 x float> @amd_vrs4_asinf(<4 x float> [[TMP4:%.*]])
 ; CHECK-VF8:    [[TMP5:%.*]] = call <8 x float> @amd_vrs8_asinf(<8 x float> [[TMP4:%.*]])
 ; CHECK-VF16:   [[TMP5:%.*]] = call <16 x float> @amd_vrs16_asinf(<16 x float> [[TMP4:%.*]])
@@ -588,6 +593,7 @@ define void @atan_f64_intrinsic(ptr nocapture %varray) {
 ; CHECK-VF2:    [[TMP5:%.*]] = call <2 x double> @amd_vrd2_atan(<2 x double> [[TMP4:%.*]])
 ; CHECK-VF4:    [[TMP5:%.*]] = call <4 x double> @amd_vrd4_atan(<4 x double> [[TMP4:%.*]])
 ; CHECK-VF8:    [[TMP5:%.*]] = call <8 x double> @amd_vrd8_atan(<8 x double> [[TMP4:%.*]])
+; CHECK-VF16:   [[TMP5:%.*]] = call <16 x double> @llvm.atan.v16f64(<16 x double> [[TMP4:%.*]])
 ; CHECK:        ret void
 ;
 entry:
@@ -610,6 +616,7 @@ for.end:
 
 define void @atan_f32_intrinsic(ptr nocapture %varray) {
 ; CHECK-LABEL: @atan_f32_intrinsic(
+; CHECK-VF2:    [[TMP5:%.*]] = call <2 x float> @llvm.atan.v2f32(<2 x float> [[TMP4:%.*]])
 ; CHECK-VF4:    [[TMP5:%.*]] = call <4 x float> @amd_vrs4_atanf(<4 x float> [[TMP4:%.*]])
 ; CHECK-VF8:    [[TMP5:%.*]] = call <8 x float> @amd_vrs8_atanf(<8 x float> [[TMP4:%.*]])
 ; CHECK-VF16:   [[TMP5:%.*]] = call <16 x float> @amd_vrs16_atanf(<16 x float> [[TMP4:%.*]])
@@ -683,6 +690,9 @@ for.end:
 define void @cosh_f64_intrinsic(ptr nocapture %varray) {
 ; CHECK-LABEL: @cosh_f64_intrinsic(
 ; CHECK-VF2:    [[TMP5:%.*]] = call <2 x double> @amd_vrd2_cosh(<2 x double> [[TMP4:%.*]])
+; CHECK-VF4:    [[TMP5:%.*]] = call <4 x double> @llvm.cosh.v4f64(<4 x double> [[TMP4:%.*]])
+; CHECK-VF8:    [[TMP5:%.*]] = call <8 x double> @llvm.cosh.v8f64(<8 x double> [[TMP4:%.*]])
+; CHECK-VF16:   [[TMP5:%.*]] = call <16 x double> @llvm.cosh.v16f64(<16 x double> [[TMP4:%.*]])
 ; CHECK:        ret void
 ;
 entry:
@@ -705,8 +715,10 @@ for.end:
 
 define void @cosh_f32_intrinsic(ptr nocapture %varray) {
 ; CHECK-LABEL: @cosh_f32_intrinsic(
+; CHECK-VF2:    [[TMP5:%.*]] = call <2 x float> @llvm.cosh.v2f32(<2 x float> [[TMP4:%.*]])
 ; CHECK-VF4:    [[TMP5:%.*]] = call <4 x float> @amd_vrs4_coshf(<4 x float> [[TMP4:%.*]])
 ; CHECK-VF8:    [[TMP5:%.*]] = call <8 x float> @amd_vrs8_coshf(<8 x float> [[TMP4:%.*]])
+; CHECK-VF16:   [[TMP5:%.*]] = call <16 x float> @llvm.cosh.v16f32(<16 x float> [[TMP4:%.*]])
 ; CHECK:        ret void
 ;
 entry:
@@ -754,6 +766,7 @@ for.end:
 
 define void @tanh_f32_intrinsic(ptr nocapture %varray) {
 ; CHECK-LABEL: @tanh_f32_intrinsic(
+; CHECK-VF2:    [[TMP5:%.*]] = call <2 x float> @llvm.tanh.v2f32(<2 x float> [[TMP4:%.*]])
 ; CHECK-VF4:    [[TMP5:%.*]] = call <4 x float> @amd_vrs4_tanhf(<4 x float> [[TMP4:%.*]])
 ; CHECK-VF8:    [[TMP5:%.*]] = call <8 x float> @amd_vrs8_tanhf(<8 x float> [[TMP4:%.*]])
 ; CHECK-VF16:   [[TMP5:%.*]] = call <16 x float> @amd_vrs16_tanhf(<16 x float> [[TMP4:%.*]])

farzonl · 2024-08-29T16:56:12Z

@RKSimon I didn't add isTriviallyVectorizable for these because it broke a number of tests in the RISCV backend. isTriviallyVectorizable is exposed across all backends and I think what we would want is something that could be opt in per backend. https://github.com/llvm/llvm-project/blob/main/llvm/test/Transforms/SLPVectorizer/RISCV/math-function.ll#L488

alexey-bataev · 2024-08-29T16:56:21Z

Could you add the tests for other targets?

RKSimon · 2024-08-29T21:51:01Z

> @RKSimon I didn't add isTriviallyVectorizable for these because it broke a number of tests in the RISCV backend. isTriviallyVectorizable is exposed across all backends and I think what we would want is something that could be opt in per backend. https://github.com/llvm/llvm-project/blob/main/llvm/test/Transforms/SLPVectorizer/RISCV/math-function.ll#L488

This no longer appears to be an issue.

…nh/tanh intrinsics to support #106584

alexey-bataev · 2024-08-30T10:35:43Z

Could you add the tests for RISCV too, as was done for AArch64?

RKSimon · 2024-08-30T10:43:57Z

What attributes / veclibs should I use for riscv? llvm-project\llvm\test\Transforms\SLPVectorizer\RISCV\math-function.ll doesn't seem to do much

alexey-bataev · 2024-08-30T10:50:07Z

> What attributes / veclibs should I use for riscv? llvm-project\llvm\test\Transforms\SLPVectorizer\RISCV\math-function.ll doesn't seem to do much

Without veclibs, just some basic stuff

RKSimon · 2024-08-30T10:53:06Z

That's what math-function.ll already does

alexey-bataev · 2024-08-30T11:04:49Z

> That's what math-function.ll already does

But not newly added functions

…intrinsics to support #106584

…vectorize acos/asin/atan and cosh/sinh/tanh intrinsics

…os/asin/atan and cosh/sinh/tanh intrinsics

RKSimon · 2024-08-30T13:05:03Z

ceb613a adds missing riscv coverage - checks that there is no vectorisation

alexey-bataev

LG, thanks!

…os/asin/atan and cosh/sinh/tanh libcalls Follow-up to #106584 - ensure acos/asin/atan and cosh/sinh/tanh libcalls correctly map to the llvm intrinsic equivalents

…os/asin/atan and cosh/sinh/tanh libcalls (#106844) Followup to #106584 - ensure acos/asin/atan and cosh/sinh/tanh libcalls correctly map to the llvm intrinsic equivalents

RKSimon requested review from farzonl, alexey-bataev and davemgreen August 29, 2024 16:52

llvmbot added llvm:analysis Includes value tracking, cost tables and constant folding llvm:transforms labels Aug 29, 2024

RKSimon added a commit that referenced this pull request Aug 30, 2024

[AArch64] Add accelerate test coverage for acos/asin/atan and cosh/si…

c4b5cb0

…nh/tanh intrinsics to support #106584

RKSimon force-pushed the vectorize-arc-hypot branch from 8d660e1 to 519c030 Compare August 30, 2024 10:31

RKSimon added a commit that referenced this pull request Aug 30, 2024

[RISCV] Add full test coverage for acos/asin/atan and cosh/sinh/tanh …

ceb613a

…intrinsics to support #106584

RKSimon added 3 commits August 30, 2024 14:02

[LoopVectorize][X86] amdlibm-calls.ll - add tests showing failure to …

399ec2e

…vectorize acos/asin/atan and cosh/sinh/tanh intrinsics

[Analysis] isTriviallyVectorizable - add vectorization support for ac…

5560892

…os/asin/atan and cosh/sinh/tanh intrinsics

[AArch64] Regenerate accelerate-vector-functions.ll tests

86e6eb7

RKSimon force-pushed the vectorize-arc-hypot branch from 519c030 to 86e6eb7 Compare August 30, 2024 13:04

farzonl approved these changes Aug 30, 2024

View reviewed changes

alexey-bataev approved these changes Aug 30, 2024

View reviewed changes

RKSimon merged commit d58d105 into llvm:main Aug 30, 2024
8 checks passed

RKSimon deleted the vectorize-arc-hypot branch August 30, 2024 15:49

RKSimon mentioned this pull request Aug 31, 2024

[Analysis] getIntrinsicForCallSite - add vectorization support for acos/asin/atan and cosh/sinh/tanh libcalls #106844

Merged

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

[Analysis] isTriviallyVectorizable - add vectorization support for acos/asin/atan and cosh/sinh/tanh intrinsics #106584

[Analysis] isTriviallyVectorizable - add vectorization support for acos/asin/atan and cosh/sinh/tanh intrinsics #106584

Uh oh!

RKSimon commented Aug 29, 2024

Uh oh!

llvmbot commented Aug 29, 2024 •

edited

Loading

Uh oh!

farzonl commented Aug 29, 2024 •

edited

Loading

Uh oh!

alexey-bataev commented Aug 29, 2024

Uh oh!

RKSimon commented Aug 29, 2024

Uh oh!

alexey-bataev commented Aug 30, 2024

Uh oh!

RKSimon commented Aug 30, 2024

Uh oh!

alexey-bataev commented Aug 30, 2024

Uh oh!

RKSimon commented Aug 30, 2024

Uh oh!

alexey-bataev commented Aug 30, 2024

Uh oh!

RKSimon commented Aug 30, 2024

Uh oh!

alexey-bataev left a comment

Uh oh!

Uh oh!

Uh oh!

[Analysis] isTriviallyVectorizable - add vectorization support for acos/asin/atan and cosh/sinh/tanh intrinsics #106584

[Analysis] isTriviallyVectorizable - add vectorization support for acos/asin/atan and cosh/sinh/tanh intrinsics #106584

Uh oh!

Conversation

RKSimon commented Aug 29, 2024

Uh oh!

llvmbot commented Aug 29, 2024 • edited Loading Uh oh! There was an error while loading. Please reload this page.

Uh oh!

Uh oh!

farzonl commented Aug 29, 2024 • edited Loading Uh oh! There was an error while loading. Please reload this page.

Uh oh!

Uh oh!

alexey-bataev commented Aug 29, 2024

Uh oh!

RKSimon commented Aug 29, 2024

Uh oh!

alexey-bataev commented Aug 30, 2024

Uh oh!

RKSimon commented Aug 30, 2024

Uh oh!

alexey-bataev commented Aug 30, 2024

Uh oh!

RKSimon commented Aug 30, 2024

Uh oh!

alexey-bataev commented Aug 30, 2024

Uh oh!

RKSimon commented Aug 30, 2024

Uh oh!

alexey-bataev left a comment

Choose a reason for hiding this comment

Uh oh!

Uh oh!

Uh oh!

llvmbot commented Aug 29, 2024 •

edited

Loading

farzonl commented Aug 29, 2024 •

edited

Loading