@@ -474,28 +474,27 @@ for.end: ; preds = %for.body
474
474
ret void
475
475
}
476
476
477
+ ; TODO: Term folding should be legal here because the stride (%offset | 1) is
478
+ ; non-zero, but SCEV currently fails to prove non-zero for sext expressions.
477
479
define void @expensive_expand_short_tc (ptr %a , i32 %offset , i32 %n ) {
478
480
; CHECK-LABEL: @expensive_expand_short_tc(
479
481
; CHECK-NEXT: entry:
482
+ ; CHECK-NEXT: [[OFFSET_NONZERO:%.*]] = or i32 [[OFFSET:%.*]], 1
480
483
; CHECK-NEXT: [[UGLYGEP:%.*]] = getelementptr i8, ptr [[A:%.*]], i64 84
481
- ; CHECK-NEXT: [[TMP0:%.*]] = add i32 [[N:%.*]], -1
482
- ; CHECK-NEXT: [[TMP1:%.*]] = zext i32 [[TMP0]] to i64
483
- ; CHECK-NEXT: [[TMP2:%.*]] = add nuw nsw i64 [[TMP1]], 1
484
- ; CHECK-NEXT: [[TMP3:%.*]] = sext i32 [[OFFSET:%.*]] to i64
485
- ; CHECK-NEXT: [[TMP4:%.*]] = mul i64 [[TMP2]], [[TMP3]]
486
- ; CHECK-NEXT: [[TMP5:%.*]] = add nsw i64 [[TMP4]], 84
487
- ; CHECK-NEXT: [[SCEVGEP:%.*]] = getelementptr i8, ptr [[A]], i64 [[TMP5]]
488
484
; CHECK-NEXT: br label [[FOR_BODY:%.*]]
489
485
; CHECK: for.body:
490
486
; CHECK-NEXT: [[LSR_IV1:%.*]] = phi ptr [ [[UGLYGEP2:%.*]], [[FOR_BODY]] ], [ [[UGLYGEP]], [[ENTRY:%.*]] ]
487
+ ; CHECK-NEXT: [[LSR_IV:%.*]] = phi i32 [ [[LSR_IV_NEXT:%.*]], [[FOR_BODY]] ], [ 0, [[ENTRY]] ]
491
488
; CHECK-NEXT: store i32 1, ptr [[LSR_IV1]], align 4
492
- ; CHECK-NEXT: [[UGLYGEP2]] = getelementptr i8, ptr [[LSR_IV1]], i32 [[OFFSET]]
493
- ; CHECK-NEXT: [[LSR_FOLD_TERM_COND_REPLACED_TERM_COND:%.*]] = icmp eq ptr [[UGLYGEP2]], [[SCEVGEP]]
494
- ; CHECK-NEXT: br i1 [[LSR_FOLD_TERM_COND_REPLACED_TERM_COND]], label [[FOR_END:%.*]], label [[FOR_BODY]], !prof [[PROF0:![0-9]+]]
489
+ ; CHECK-NEXT: [[LSR_IV_NEXT]] = add nsw i32 [[LSR_IV]], 1
490
+ ; CHECK-NEXT: [[UGLYGEP2]] = getelementptr i8, ptr [[LSR_IV1]], i32 [[OFFSET_NONZERO]]
491
+ ; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i32 [[LSR_IV_NEXT]], [[N:%.*]]
492
+ ; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label [[FOR_END:%.*]], label [[FOR_BODY]], !prof [[PROF0:![0-9]+]]
495
493
; CHECK: for.end:
496
494
; CHECK-NEXT: ret void
497
495
;
498
496
entry:
497
+ %offset.nonzero = or i32 %offset , 1
499
498
%uglygep = getelementptr i8 , ptr %a , i64 84
500
499
br label %for.body
501
500
@@ -504,36 +503,35 @@ for.body: ; preds = %for.body, %entry
504
503
%lsr.iv = phi i32 [ %lsr.iv.next , %for.body ], [ 0 , %entry ]
505
504
store i32 1 , ptr %lsr.iv1 , align 4
506
505
%lsr.iv.next = add nsw i32 %lsr.iv , 1
507
- %uglygep2 = getelementptr i8 , ptr %lsr.iv1 , i32 %offset
506
+ %uglygep2 = getelementptr i8 , ptr %lsr.iv1 , i32 %offset.nonzero
508
507
%exitcond.not = icmp eq i32 %lsr.iv.next , %n
509
508
br i1 %exitcond.not , label %for.end , label %for.body , !prof !{!"branch_weights" , i32 1 , i32 3 }
510
509
511
510
for.end: ; preds = %for.body
512
511
ret void
513
512
}
514
513
514
+ ; TODO: Term folding should be legal here because the stride (%offset | 1) is
515
+ ; non-zero, but SCEV currently fails to prove non-zero for sext expressions.
515
516
define void @expensive_expand_long_tc (ptr %a , i32 %offset , i32 %n ) {
516
517
; CHECK-LABEL: @expensive_expand_long_tc(
517
518
; CHECK-NEXT: entry:
519
+ ; CHECK-NEXT: [[OFFSET_NONZERO:%.*]] = or i32 [[OFFSET:%.*]], 1
518
520
; CHECK-NEXT: [[UGLYGEP:%.*]] = getelementptr i8, ptr [[A:%.*]], i64 84
519
- ; CHECK-NEXT: [[TMP0:%.*]] = add i32 [[N:%.*]], -1
520
- ; CHECK-NEXT: [[TMP1:%.*]] = zext i32 [[TMP0]] to i64
521
- ; CHECK-NEXT: [[TMP2:%.*]] = add nuw nsw i64 [[TMP1]], 1
522
- ; CHECK-NEXT: [[TMP3:%.*]] = sext i32 [[OFFSET:%.*]] to i64
523
- ; CHECK-NEXT: [[TMP4:%.*]] = mul i64 [[TMP2]], [[TMP3]]
524
- ; CHECK-NEXT: [[TMP5:%.*]] = add nsw i64 [[TMP4]], 84
525
- ; CHECK-NEXT: [[SCEVGEP:%.*]] = getelementptr i8, ptr [[A]], i64 [[TMP5]]
526
521
; CHECK-NEXT: br label [[FOR_BODY:%.*]]
527
522
; CHECK: for.body:
528
523
; CHECK-NEXT: [[LSR_IV1:%.*]] = phi ptr [ [[UGLYGEP2:%.*]], [[FOR_BODY]] ], [ [[UGLYGEP]], [[ENTRY:%.*]] ]
524
+ ; CHECK-NEXT: [[LSR_IV:%.*]] = phi i32 [ [[LSR_IV_NEXT:%.*]], [[FOR_BODY]] ], [ 0, [[ENTRY]] ]
529
525
; CHECK-NEXT: store i32 1, ptr [[LSR_IV1]], align 4
530
- ; CHECK-NEXT: [[UGLYGEP2]] = getelementptr i8, ptr [[LSR_IV1]], i32 [[OFFSET]]
531
- ; CHECK-NEXT: [[LSR_FOLD_TERM_COND_REPLACED_TERM_COND:%.*]] = icmp eq ptr [[UGLYGEP2]], [[SCEVGEP]]
532
- ; CHECK-NEXT: br i1 [[LSR_FOLD_TERM_COND_REPLACED_TERM_COND]], label [[FOR_END:%.*]], label [[FOR_BODY]], !prof [[PROF1:![0-9]+]]
526
+ ; CHECK-NEXT: [[LSR_IV_NEXT]] = add nsw i32 [[LSR_IV]], 1
527
+ ; CHECK-NEXT: [[UGLYGEP2]] = getelementptr i8, ptr [[LSR_IV1]], i32 [[OFFSET_NONZERO]]
528
+ ; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i32 [[LSR_IV_NEXT]], [[N:%.*]]
529
+ ; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label [[FOR_END:%.*]], label [[FOR_BODY]], !prof [[PROF1:![0-9]+]]
533
530
; CHECK: for.end:
534
531
; CHECK-NEXT: ret void
535
532
;
536
533
entry:
534
+ %offset.nonzero = or i32 %offset , 1
537
535
%uglygep = getelementptr i8 , ptr %a , i64 84
538
536
br label %for.body
539
537
@@ -542,36 +540,35 @@ for.body: ; preds = %for.body, %entry
542
540
%lsr.iv = phi i32 [ %lsr.iv.next , %for.body ], [ 0 , %entry ]
543
541
store i32 1 , ptr %lsr.iv1 , align 4
544
542
%lsr.iv.next = add nsw i32 %lsr.iv , 1
545
- %uglygep2 = getelementptr i8 , ptr %lsr.iv1 , i32 %offset
543
+ %uglygep2 = getelementptr i8 , ptr %lsr.iv1 , i32 %offset.nonzero
546
544
%exitcond.not = icmp eq i32 %lsr.iv.next , %n
547
545
br i1 %exitcond.not , label %for.end , label %for.body , !prof !{!"branch_weights" , i32 1 , i32 300 }
548
546
549
547
for.end: ; preds = %for.body
550
548
ret void
551
549
}
552
550
551
+ ; TODO: Term folding should be legal here because the stride (%offset | 1) is
552
+ ; non-zero, but SCEV currently fails to prove non-zero for sext expressions.
553
553
define void @expensive_expand_unknown_tc (ptr %a , i32 %offset , i32 %n ) {
554
554
; CHECK-LABEL: @expensive_expand_unknown_tc(
555
555
; CHECK-NEXT: entry:
556
+ ; CHECK-NEXT: [[OFFSET_NONZERO:%.*]] = or i32 [[OFFSET:%.*]], 1
556
557
; CHECK-NEXT: [[UGLYGEP:%.*]] = getelementptr i8, ptr [[A:%.*]], i64 84
557
- ; CHECK-NEXT: [[TMP0:%.*]] = add i32 [[N:%.*]], -1
558
- ; CHECK-NEXT: [[TMP1:%.*]] = zext i32 [[TMP0]] to i64
559
- ; CHECK-NEXT: [[TMP2:%.*]] = add nuw nsw i64 [[TMP1]], 1
560
- ; CHECK-NEXT: [[TMP3:%.*]] = sext i32 [[OFFSET:%.*]] to i64
561
- ; CHECK-NEXT: [[TMP4:%.*]] = mul i64 [[TMP2]], [[TMP3]]
562
- ; CHECK-NEXT: [[TMP5:%.*]] = add nsw i64 [[TMP4]], 84
563
- ; CHECK-NEXT: [[SCEVGEP:%.*]] = getelementptr i8, ptr [[A]], i64 [[TMP5]]
564
558
; CHECK-NEXT: br label [[FOR_BODY:%.*]]
565
559
; CHECK: for.body:
566
560
; CHECK-NEXT: [[LSR_IV1:%.*]] = phi ptr [ [[UGLYGEP2:%.*]], [[FOR_BODY]] ], [ [[UGLYGEP]], [[ENTRY:%.*]] ]
561
+ ; CHECK-NEXT: [[LSR_IV:%.*]] = phi i32 [ [[LSR_IV_NEXT:%.*]], [[FOR_BODY]] ], [ 0, [[ENTRY]] ]
567
562
; CHECK-NEXT: store i32 1, ptr [[LSR_IV1]], align 4
568
- ; CHECK-NEXT: [[UGLYGEP2]] = getelementptr i8, ptr [[LSR_IV1]], i32 [[OFFSET]]
569
- ; CHECK-NEXT: [[LSR_FOLD_TERM_COND_REPLACED_TERM_COND:%.*]] = icmp eq ptr [[UGLYGEP2]], [[SCEVGEP]]
570
- ; CHECK-NEXT: br i1 [[LSR_FOLD_TERM_COND_REPLACED_TERM_COND]], label [[FOR_END:%.*]], label [[FOR_BODY]]
563
+ ; CHECK-NEXT: [[LSR_IV_NEXT]] = add nsw i32 [[LSR_IV]], 1
564
+ ; CHECK-NEXT: [[UGLYGEP2]] = getelementptr i8, ptr [[LSR_IV1]], i32 [[OFFSET_NONZERO]]
565
+ ; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i32 [[LSR_IV_NEXT]], [[N:%.*]]
566
+ ; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label [[FOR_END:%.*]], label [[FOR_BODY]]
571
567
; CHECK: for.end:
572
568
; CHECK-NEXT: ret void
573
569
;
574
570
entry:
571
+ %offset.nonzero = or i32 %offset , 1
575
572
%uglygep = getelementptr i8 , ptr %a , i64 84
576
573
br label %for.body
577
574
@@ -580,7 +577,7 @@ for.body: ; preds = %for.body, %entry
580
577
%lsr.iv = phi i32 [ %lsr.iv.next , %for.body ], [ 0 , %entry ]
581
578
store i32 1 , ptr %lsr.iv1 , align 4
582
579
%lsr.iv.next = add nsw i32 %lsr.iv , 1
583
- %uglygep2 = getelementptr i8 , ptr %lsr.iv1 , i32 %offset
580
+ %uglygep2 = getelementptr i8 , ptr %lsr.iv1 , i32 %offset.nonzero
584
581
%exitcond.not = icmp eq i32 %lsr.iv.next , %n
585
582
br i1 %exitcond.not , label %for.end , label %for.body
586
583
0 commit comments