|
1 | 1 | # NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py UTC_ARGS: --version 3
|
2 | 2 | # RUN: llc -mtriple=amdgcn -mcpu=gfx1100 -mattr=+real-true16 -run-pass=si-fix-sgpr-copies -verify-machineinstrs -o - %s | FileCheck --check-prefixes=GCN %s
|
3 |
| -# XFAIL: * |
4 |
| -# FIXME-TRUE16 reenable after fix-sgpr-copies is updated for true16 flow |
5 | 3 |
|
6 | 4 | ---
|
7 |
| -name: cmp_f16 |
| 5 | +name: cvt_hi_f32_f16 |
8 | 6 | body: |
|
9 |
| - bb.0.entry: |
10 |
| - ; GCN-LABEL: name: cmp_f16 |
| 7 | + bb.0: |
| 8 | + ; GCN-LABEL: name: cvt_hi_f32_f16 |
11 | 9 | ; GCN: [[DEF:%[0-9]+]]:vgpr_16 = IMPLICIT_DEF
|
12 |
| - ; GCN-NEXT: [[DEF1:%[0-9]+]]:sreg_32 = IMPLICIT_DEF |
13 | 10 | ; GCN-NEXT: [[V_CVT_F16_U16_t16_e64_:%[0-9]+]]:vgpr_16 = V_CVT_F16_U16_t16_e64 0, [[DEF]], 0, 0, 0, implicit $mode, implicit $exec
|
14 |
| - ; GCN-NEXT: [[COPY:%[0-9]+]]:vgpr_32 = COPY [[V_CVT_F16_U16_t16_e64_]] |
15 |
| - ; GCN-NEXT: [[COPY1:%[0-9]+]]:vgpr_16 = COPY killed [[COPY]] |
16 |
| - ; GCN-NEXT: [[V_CMP_LT_F16_t16_e64_:%[0-9]+]]:sreg_32_xm0_xexec = nofpexcept V_CMP_LT_F16_t16_e64 0, [[COPY1]], 0, [[DEF1]], 0, 0, implicit $mode, implicit $exec |
17 |
| - ; GCN-NEXT: [[V_CNDMASK_B32_e64_:%[0-9]+]]:vgpr_32 = V_CNDMASK_B32_e64 0, 0, 0, -1, killed [[V_CMP_LT_F16_t16_e64_]], implicit $exec |
| 11 | + ; GCN-NEXT: [[SUBREG_TO_REG:%[0-9]+]]:vgpr_32 = SUBREG_TO_REG 0, [[V_CVT_F16_U16_t16_e64_]], %subreg.lo16 |
| 12 | + ; GCN-NEXT: [[COPY:%[0-9]+]]:vgpr_32 = COPY [[SUBREG_TO_REG]] |
| 13 | + ; GCN-NEXT: [[V_CVT_F32_F16_t16_e64_:%[0-9]+]]:vgpr_32 = V_CVT_F32_F16_t16_e64 0, [[COPY]].hi16, 0, 0, 0, implicit $mode, implicit $exec |
18 | 14 | %0:vgpr_16 = IMPLICIT_DEF
|
19 |
| - %1:sreg_32 = IMPLICIT_DEF |
20 |
| - %2:vgpr_16 = V_CVT_F16_U16_t16_e64 0, %0:vgpr_16, 0, 0, 0, implicit $mode, implicit $exec |
21 |
| - %3:sreg_32 = COPY %2:vgpr_16 |
22 |
| - nofpexcept S_CMP_LT_F16 killed %3:sreg_32, %1:sreg_32, implicit-def $scc, implicit $mode |
23 |
| - %4:sreg_32_xm0_xexec = COPY $scc |
24 |
| - %5:vgpr_32 = V_CNDMASK_B32_e64 0, 0, 0, -1, killed %4, implicit $exec |
| 15 | + %1:vgpr_16 = V_CVT_F16_U16_t16_e64 0, %0:vgpr_16, 0, 0, 0, implicit $mode, implicit $exec |
| 16 | + %2:sreg_32 = COPY %1:vgpr_16 |
| 17 | + %3:sreg_32 = S_CVT_HI_F32_F16 %2:sreg_32, implicit $mode |
25 | 18 | ...
|
26 | 19 |
|
27 | 20 | ---
|
28 |
| -name: cvt_hi_f32_f16 |
| 21 | +name: s_xor_b32 |
29 | 22 | body: |
|
30 | 23 | bb.0:
|
31 |
| - ; GCN-LABEL: name: cvt_hi_f32_f16 |
| 24 | + ; GCN-LABEL: name: s_xor_b32 |
32 | 25 | ; GCN: [[DEF:%[0-9]+]]:vgpr_16 = IMPLICIT_DEF
|
33 | 26 | ; GCN-NEXT: [[V_CVT_F16_U16_t16_e64_:%[0-9]+]]:vgpr_16 = V_CVT_F16_U16_t16_e64 0, [[DEF]], 0, 0, 0, implicit $mode, implicit $exec
|
34 |
| - ; GCN-NEXT: [[COPY:%[0-9]+]]:vgpr_32 = COPY [[V_CVT_F16_U16_t16_e64_]] |
35 |
| - ; GCN-NEXT: [[COPY1:%[0-9]+]]:vgpr_32 = COPY [[COPY]] |
36 |
| - ; GCN-NEXT: [[V_CVT_F32_F16_t16_e64_:%[0-9]+]]:vgpr_32 = V_CVT_F32_F16_t16_e64 0, [[COPY1]].hi16, 0, 0, 0, implicit $mode, implicit $exec |
| 27 | + ; GCN-NEXT: [[SUBREG_TO_REG:%[0-9]+]]:vgpr_32 = SUBREG_TO_REG 0, [[V_CVT_F16_U16_t16_e64_]], %subreg.lo16 |
| 28 | + ; GCN-NEXT: [[V_OR_B32_e64_:%[0-9]+]]:vgpr_32 = V_OR_B32_e64 [[SUBREG_TO_REG]], [[SUBREG_TO_REG]], implicit $exec |
| 29 | + ; GCN-NEXT: [[V_CVT_F16_U16_t16_e64_1:%[0-9]+]]:vgpr_16 = V_CVT_F16_U16_t16_e64 0, [[V_OR_B32_e64_]].lo16, 0, 0, 0, implicit $mode, implicit $exec |
37 | 30 | %0:vgpr_16 = IMPLICIT_DEF
|
38 | 31 | %1:vgpr_16 = V_CVT_F16_U16_t16_e64 0, %0:vgpr_16, 0, 0, 0, implicit $mode, implicit $exec
|
39 | 32 | %2:sreg_32 = COPY %1:vgpr_16
|
40 |
| - %3:sreg_32 = S_CVT_HI_F32_F16 %2:sreg_32, implicit $mode |
| 33 | + %3:sreg_32 = S_OR_B32 %2:sreg_32, %2:sreg_32, implicit-def $scc |
| 34 | + %4:vgpr_16 = V_CVT_F16_U16_t16_e64 0, %3:sreg_32, 0, 0, 0, implicit $mode, implicit $exec |
41 | 35 | ...
|
0 commit comments