Skip to content

Commit 84299df

Browse files
author
Thorsten Schütt
authored
[GlobalIsel] add trunc flags (#87045)
#85592
1 parent ea707ba commit 84299df

File tree

2 files changed

+96
-0
lines changed

2 files changed

+96
-0
lines changed

llvm/lib/CodeGen/MachineInstr.cpp

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -39,6 +39,7 @@
3939
#include "llvm/IR/DebugLoc.h"
4040
#include "llvm/IR/Function.h"
4141
#include "llvm/IR/InlineAsm.h"
42+
#include "llvm/IR/Instructions.h"
4243
#include "llvm/IR/LLVMContext.h"
4344
#include "llvm/IR/Metadata.h"
4445
#include "llvm/IR/Module.h"
@@ -553,6 +554,11 @@ uint32_t MachineInstr::copyFlagsFromInstruction(const Instruction &I) {
553554
MIFlags |= MachineInstr::MIFlag::NoSWrap;
554555
if (OB->hasNoUnsignedWrap())
555556
MIFlags |= MachineInstr::MIFlag::NoUWrap;
557+
} else if (const TruncInst *TI = dyn_cast<TruncInst>(&I)) {
558+
if (TI->hasNoSignedWrap())
559+
MIFlags |= MachineInstr::MIFlag::NoSWrap;
560+
if (TI->hasNoUnsignedWrap())
561+
MIFlags |= MachineInstr::MIFlag::NoUWrap;
556562
}
557563

558564
// Copy the nonneg flag.
Lines changed: 90 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,90 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
2+
; RUN: llc -O0 -mtriple=aarch64-linux-gnu -global-isel -stop-after=irtranslator %s -o - | FileCheck %s
3+
4+
define i32 @call_trunc_no_flags(i64 %a) {
5+
; CHECK-LABEL: name: call_trunc_no_flags
6+
; CHECK: bb.1.entry:
7+
; CHECK-NEXT: liveins: $x0
8+
; CHECK-NEXT: {{ $}}
9+
; CHECK-NEXT: [[COPY:%[0-9]+]]:_(s64) = COPY $x0
10+
; CHECK-NEXT: [[TRUNC:%[0-9]+]]:_(s32) = G_TRUNC [[COPY]](s64)
11+
; CHECK-NEXT: $w0 = COPY [[TRUNC]](s32)
12+
; CHECK-NEXT: RET_ReallyLR implicit $w0
13+
entry:
14+
%result = trunc i64 %a to i32
15+
ret i32 %result
16+
}
17+
18+
define i32 @call_trunc_nsw_flags(i64 %a) {
19+
; CHECK-LABEL: name: call_trunc_nsw_flags
20+
; CHECK: bb.1.entry:
21+
; CHECK-NEXT: liveins: $x0
22+
; CHECK-NEXT: {{ $}}
23+
; CHECK-NEXT: [[COPY:%[0-9]+]]:_(s64) = COPY $x0
24+
; CHECK-NEXT: [[TRUNC:%[0-9]+]]:_(s32) = nsw G_TRUNC [[COPY]](s64)
25+
; CHECK-NEXT: $w0 = COPY [[TRUNC]](s32)
26+
; CHECK-NEXT: RET_ReallyLR implicit $w0
27+
entry:
28+
%result = trunc nsw i64 %a to i32
29+
ret i32 %result
30+
}
31+
32+
define i32 @call_trunc_nuw_flags(i64 %a) {
33+
; CHECK-LABEL: name: call_trunc_nuw_flags
34+
; CHECK: bb.1.entry:
35+
; CHECK-NEXT: liveins: $x0
36+
; CHECK-NEXT: {{ $}}
37+
; CHECK-NEXT: [[COPY:%[0-9]+]]:_(s64) = COPY $x0
38+
; CHECK-NEXT: [[TRUNC:%[0-9]+]]:_(s32) = nuw G_TRUNC [[COPY]](s64)
39+
; CHECK-NEXT: $w0 = COPY [[TRUNC]](s32)
40+
; CHECK-NEXT: RET_ReallyLR implicit $w0
41+
entry:
42+
%result = trunc nuw i64 %a to i32
43+
ret i32 %result
44+
}
45+
46+
define i32 @call_trunc_all_flags(i64 %a) {
47+
; CHECK-LABEL: name: call_trunc_all_flags
48+
; CHECK: bb.1.entry:
49+
; CHECK-NEXT: liveins: $x0
50+
; CHECK-NEXT: {{ $}}
51+
; CHECK-NEXT: [[COPY:%[0-9]+]]:_(s64) = COPY $x0
52+
; CHECK-NEXT: [[TRUNC:%[0-9]+]]:_(s32) = nuw nsw G_TRUNC [[COPY]](s64)
53+
; CHECK-NEXT: $w0 = COPY [[TRUNC]](s32)
54+
; CHECK-NEXT: RET_ReallyLR implicit $w0
55+
entry:
56+
%result = trunc nsw nuw i64 %a to i32
57+
ret i32 %result
58+
}
59+
60+
define <2 x i64> @call_trunc_noop_signed_vector(<2 x i64> %a) {
61+
; CHECK-LABEL: name: call_trunc_noop_signed_vector
62+
; CHECK: bb.1.entry:
63+
; CHECK-NEXT: liveins: $q0
64+
; CHECK-NEXT: {{ $}}
65+
; CHECK-NEXT: [[COPY:%[0-9]+]]:_(<2 x s64>) = COPY $q0
66+
; CHECK-NEXT: [[TRUNC:%[0-9]+]]:_(<2 x s32>) = nsw G_TRUNC [[COPY]](<2 x s64>)
67+
; CHECK-NEXT: [[SEXT:%[0-9]+]]:_(<2 x s64>) = G_SEXT [[TRUNC]](<2 x s32>)
68+
; CHECK-NEXT: $q0 = COPY [[SEXT]](<2 x s64>)
69+
; CHECK-NEXT: RET_ReallyLR implicit $q0
70+
entry:
71+
%truncate = trunc nsw <2 x i64> %a to <2 x i32>
72+
%result = sext <2 x i32> %truncate to <2 x i64>
73+
ret <2 x i64> %result
74+
}
75+
76+
define <2 x i64> @call_trunc_noop_unsigned_vector(<2 x i64> %a) {
77+
; CHECK-LABEL: name: call_trunc_noop_unsigned_vector
78+
; CHECK: bb.1.entry:
79+
; CHECK-NEXT: liveins: $q0
80+
; CHECK-NEXT: {{ $}}
81+
; CHECK-NEXT: [[COPY:%[0-9]+]]:_(<2 x s64>) = COPY $q0
82+
; CHECK-NEXT: [[TRUNC:%[0-9]+]]:_(<2 x s32>) = nuw G_TRUNC [[COPY]](<2 x s64>)
83+
; CHECK-NEXT: [[ZEXT:%[0-9]+]]:_(<2 x s64>) = G_ZEXT [[TRUNC]](<2 x s32>)
84+
; CHECK-NEXT: $q0 = COPY [[ZEXT]](<2 x s64>)
85+
; CHECK-NEXT: RET_ReallyLR implicit $q0
86+
entry:
87+
%truncate = trunc nuw <2 x i64> %a to <2 x i32>
88+
%result = zext <2 x i32> %truncate to <2 x i64>
89+
ret <2 x i64> %result
90+
}

0 commit comments

Comments
 (0)