|
| 1 | +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 4 |
| 2 | +; RUN: opt -S --passes=slp-vectorizer -mtriple=x86_64-unknown-linux-gnu < %s | FileCheck %s |
| 3 | + |
| 4 | +define double @test() { ; SLP-vectorizer input: a reassoc nsz fadd reduction in entry and a flag-less fadd chain in bb both consume the loads below |
| 5 | +; CHECK-LABEL: define double @test() { |
| 6 | +; CHECK-NEXT: entry: |
| 7 | +; CHECK-NEXT: [[TMP0:%.*]] = load <2 x double>, ptr getelementptr inbounds ([13 x double], ptr null, i64 0, i64 5), align 8 |
| 8 | +; CHECK-NEXT: [[TMP1:%.*]] = load <2 x double>, ptr getelementptr inbounds ([13 x double], ptr null, i64 0, i64 8), align 16 |
| 9 | +; CHECK-NEXT: [[TMP2:%.*]] = shufflevector <2 x double> [[TMP0]], <2 x double> [[TMP1]], <2 x i32> <i32 1, i32 3> |
| 10 | +; CHECK-NEXT: [[TMP3:%.*]] = shufflevector <2 x double> [[TMP2]], <2 x double> poison, <4 x i32> <i32 0, i32 1, i32 poison, i32 poison> |
| 11 | +; CHECK-NEXT: [[TMP4:%.*]] = fmul <4 x double> zeroinitializer, [[TMP3]] |
| 12 | +; CHECK-NEXT: [[TMP5:%.*]] = call reassoc nsz double @llvm.vector.reduce.fadd.v4f64(double -0.000000e+00, <4 x double> [[TMP4]]) |
| 13 | +; CHECK-NEXT: [[TMP6:%.*]] = fmul double [[TMP5]], 0.000000e+00 |
| 14 | +; CHECK-NEXT: store double [[TMP6]], ptr null, align 16 |
| 15 | +; CHECK-NEXT: br label [[BB:%.*]] |
| 16 | +; CHECK: bb: |
| 17 | +; CHECK-NEXT: [[TMP7:%.*]] = fmul <2 x double> [[TMP1]], zeroinitializer |
| 18 | +; CHECK-NEXT: [[TMP8:%.*]] = extractelement <2 x double> [[TMP7]], i32 0 |
| 19 | +; CHECK-NEXT: [[TMP9:%.*]] = extractelement <2 x double> [[TMP7]], i32 1 |
| 20 | +; CHECK-NEXT: [[TMP10:%.*]] = fadd double [[TMP8]], [[TMP9]] |
| 21 | +; CHECK-NEXT: [[TMP11:%.*]] = fmul <2 x double> [[TMP0]], zeroinitializer |
| 22 | +; CHECK-NEXT: [[TMP12:%.*]] = extractelement <2 x double> [[TMP11]], i32 1 |
| 23 | +; CHECK-NEXT: [[TMP13:%.*]] = fadd double [[TMP12]], [[TMP10]] |
| 24 | +; CHECK-NEXT: [[TMP14:%.*]] = extractelement <2 x double> [[TMP11]], i32 0 |
| 25 | +; CHECK-NEXT: [[TMP15:%.*]] = fadd double [[TMP14]], [[TMP13]] |
| 26 | +; CHECK-NEXT: ret double [[TMP15]] |
| 27 | +; |
| 28 | +entry: |
| 29 | + %0 = fmul double 0.000000e+00, 0.000000e+00 ; constant-only product; one term of the entry reduction |
| 30 | + %1 = fmul double 0.000000e+00, 0.000000e+00 ; NOTE(review): the expected 4-wide reduction input takes lanes 2-3 from poison shuffle-mask entries, while the scalar chain has %0 and %1 as constant terms - confirm this expectation is intended |
| 31 | + %2 = fadd reassoc nsz double %1, %0 ; head of the reassoc nsz fadd chain %2 -> %6 -> %10 |
| 32 | + %3 = load double, ptr getelementptr inbounds ([13 x double], ptr null, i64 0, i64 5), align 8 ; element 5; within this function %3 is only used in bb (%17) |
| 33 | + %4 = load double, ptr getelementptr inbounds ([13 x double], ptr null, i64 0, i64 6), align 16 ; element 6; used in entry (%5) and again in bb (%15) |
| 34 | + %5 = fmul double %4, 0.000000e+00 ; the same expression is recomputed as %15 in bb |
| 35 | + %6 = fadd reassoc nsz double %5, %2 |
| 36 | + %7 = load double, ptr getelementptr inbounds ([13 x double], ptr null, i64 0, i64 8), align 16 ; element 8; within this function %7 is only used in bb (%13) |
| 37 | + %8 = load double, ptr getelementptr inbounds ([13 x double], ptr null, i64 0, i64 9), align 8 ; element 9; used in entry (%9) and again in bb (%12) |
| 38 | + %9 = fmul double %8, 0.000000e+00 ; the same expression is recomputed as %12 in bb |
| 39 | + %10 = fadd reassoc nsz double %9, %6 ; last link of the entry reduction chain |
| 40 | + %11 = fmul double %10, 0.000000e+00 ; multiplies the reduced sum by zero before it is stored |
| 41 | + store double %11, ptr null, align 16 |
| 42 | + br label %bb |
| 43 | + |
| 44 | +bb: |
| 45 | + %12 = fmul double %8, 0.000000e+00 |
| 46 | + %13 = fmul double %7, 0.000000e+00 |
| 47 | + %14 = fadd double %13, %12 ; the fadds in this block carry no fast-math flags, unlike the chain in entry |
| 48 | + %15 = fmul double %4, 0.000000e+00 |
| 49 | + %16 = fadd double %15, %14 |
| 50 | + %17 = fmul double %3, 0.000000e+00 |
| 51 | + %18 = fadd double %17, %16 ; final sum over all four loaded elements, each multiplied by zero |
| 52 | + ret double %18 |
| 53 | +} |
0 commit comments