@@ -1321,3 +1321,93 @@ exit:
1321
1321
ret i32 %accum
1322
1322
}
1323
1323
1324
+ define i16 @multiple_exit_none_via_latch (ptr %dst , i64 %x ) {
1325
+ ; CHECK-LABEL: @multiple_exit_none_via_latch(
1326
+ ; CHECK-NEXT: entry:
1327
+ ; CHECK-NEXT: [[UMIN:%.*]] = call i64 @llvm.umin.i64(i64 [[X:%.*]], i64 100)
1328
+ ; CHECK-NEXT: [[TMP0:%.*]] = add nuw nsw i64 [[UMIN]], 1
1329
+ ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ule i64 [[TMP0]], 2
1330
+ ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label [[SCALAR_PH:%.*]], label [[VECTOR_PH:%.*]]
1331
+ ; CHECK: vector.ph:
1332
+ ; CHECK-NEXT: [[N_MOD_VF:%.*]] = urem i64 [[TMP0]], 2
1333
+ ; CHECK-NEXT: [[TMP1:%.*]] = icmp eq i64 [[N_MOD_VF]], 0
1334
+ ; CHECK-NEXT: [[TMP2:%.*]] = select i1 [[TMP1]], i64 2, i64 [[N_MOD_VF]]
1335
+ ; CHECK-NEXT: [[N_VEC:%.*]] = sub i64 [[TMP0]], [[TMP2]]
1336
+ ; CHECK-NEXT: br label [[VECTOR_BODY:%.*]]
1337
+ ; CHECK: vector.body:
1338
+ ; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, [[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], [[VECTOR_BODY]] ]
1339
+ ; CHECK-NEXT: [[TMP3:%.*]] = add i64 [[INDEX]], 0
1340
+ ; CHECK-NEXT: [[TMP4:%.*]] = add i64 [[INDEX]], 1
1341
+ ; CHECK-NEXT: [[TMP5:%.*]] = getelementptr inbounds i32, ptr [[DST:%.*]], i64 [[TMP3]]
1342
+ ; CHECK-NEXT: [[TMP6:%.*]] = getelementptr inbounds i32, ptr [[DST]], i64 [[TMP4]]
1343
+ ; CHECK-NEXT: store i64 0, ptr [[TMP5]], align 8
1344
+ ; CHECK-NEXT: store i64 0, ptr [[TMP6]], align 8
1345
+ ; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 2
1346
+ ; CHECK-NEXT: [[TMP7:%.*]] = icmp eq i64 [[INDEX_NEXT]], [[N_VEC]]
1347
+ ; CHECK-NEXT: br i1 [[TMP7]], label [[MIDDLE_BLOCK:%.*]], label [[VECTOR_BODY]], !llvm.loop [[LOOP24:![0-9]+]]
1348
+ ; CHECK: middle.block:
1349
+ ; CHECK-NEXT: br label [[SCALAR_PH]]
1350
+ ; CHECK: scalar.ph:
1351
+ ; CHECK-NEXT: [[BC_RESUME_VAL:%.*]] = phi i64 [ [[N_VEC]], [[MIDDLE_BLOCK]] ], [ 0, [[ENTRY:%.*]] ]
1352
+ ; CHECK-NEXT: br label [[LOOP_HEADER:%.*]]
1353
+ ; CHECK: loop.header:
1354
+ ; CHECK-NEXT: [[IV:%.*]] = phi i64 [ [[BC_RESUME_VAL]], [[SCALAR_PH]] ], [ [[IV_NEXT:%.*]], [[LOOP_LATCH:%.*]] ]
1355
+ ; CHECK-NEXT: [[GEP:%.*]] = getelementptr inbounds i32, ptr [[DST]], i64 [[IV]]
1356
+ ; CHECK-NEXT: store i64 0, ptr [[GEP]], align 8
1357
+ ; CHECK-NEXT: [[CMP120:%.*]] = icmp slt i64 [[IV]], 100
1358
+ ; CHECK-NEXT: br i1 [[CMP120]], label [[LOOP_THEN:%.*]], label [[EXIT_2:%.*]]
1359
+ ; CHECK: loop.then:
1360
+ ; CHECK-NEXT: [[CMP3:%.*]] = icmp ne i64 [[IV]], [[X]]
1361
+ ; CHECK-NEXT: br i1 [[CMP3]], label [[LOOP_LATCH]], label [[EXIT_1:%.*]]
1362
+ ; CHECK: loop.latch:
1363
+ ; CHECK-NEXT: [[IV_NEXT]] = add i64 [[IV]], 1
1364
+ ; CHECK-NEXT: br label [[LOOP_HEADER]], !llvm.loop [[LOOP25:![0-9]+]]
1365
+ ; CHECK: exit.1:
1366
+ ; CHECK-NEXT: ret i16 0
1367
+ ; CHECK: exit.2:
1368
+ ; CHECK-NEXT: ret i16 1
1369
+ ;
1370
+ ; TAILFOLD-LABEL: @multiple_exit_none_via_latch(
1371
+ ; TAILFOLD-NEXT: entry:
1372
+ ; TAILFOLD-NEXT: br label [[LOOP_HEADER:%.*]]
1373
+ ; TAILFOLD: loop.header:
1374
+ ; TAILFOLD-NEXT: [[IV:%.*]] = phi i64 [ 0, [[ENTRY:%.*]] ], [ [[IV_NEXT:%.*]], [[LOOP_LATCH:%.*]] ]
1375
+ ; TAILFOLD-NEXT: [[GEP:%.*]] = getelementptr inbounds i32, ptr [[DST:%.*]], i64 [[IV]]
1376
+ ; TAILFOLD-NEXT: store i64 0, ptr [[GEP]], align 8
1377
+ ; TAILFOLD-NEXT: [[CMP120:%.*]] = icmp slt i64 [[IV]], 100
1378
+ ; TAILFOLD-NEXT: br i1 [[CMP120]], label [[LOOP_THEN:%.*]], label [[EXIT_2:%.*]]
1379
+ ; TAILFOLD: loop.then:
1380
+ ; TAILFOLD-NEXT: [[CMP3:%.*]] = icmp ne i64 [[IV]], [[X:%.*]]
1381
+ ; TAILFOLD-NEXT: br i1 [[CMP3]], label [[LOOP_LATCH]], label [[EXIT_1:%.*]]
1382
+ ; TAILFOLD: loop.latch:
1383
+ ; TAILFOLD-NEXT: [[IV_NEXT]] = add i64 [[IV]], 1
1384
+ ; TAILFOLD-NEXT: br label [[LOOP_HEADER]]
1385
+ ; TAILFOLD: exit.1:
1386
+ ; TAILFOLD-NEXT: ret i16 0
1387
+ ; TAILFOLD: exit.2:
1388
+ ; TAILFOLD-NEXT: ret i16 1
1389
+ ;
1390
+ entry:
1391
+ br label %loop.header
1392
+
1393
+ loop.header:
1394
+ %iv = phi i64 [ 0 , %entry ], [ %iv.next , %loop.latch ]
1395
+ %gep = getelementptr inbounds i32 , ptr %dst , i64 %iv
1396
+ store i64 0 , ptr %gep
1397
+ %cmp120 = icmp slt i64 %iv , 100
1398
+ br i1 %cmp120 , label %loop.then , label %exit.2
1399
+
1400
+ loop.then:
1401
+ %cmp3 = icmp ne i64 %iv , %x
1402
+ br i1 %cmp3 , label %loop.latch , label %exit.1
1403
+
1404
+ loop.latch:
1405
+ %iv.next = add i64 %iv , 1
1406
+ br label %loop.header
1407
+
1408
+ exit.1 :
1409
+ ret i16 0
1410
+
1411
+ exit.2 :
1412
+ ret i16 1
1413
+ }
0 commit comments