Skip to content

Commit 3ecb0b8

Browse files
committed
[X86][BtVer2] Partial vector stores (inc MMX) have a 2cy latency
llvm-svn: 332722
1 parent 804f4d4 commit 3ecb0b8

File tree

8 files changed, with 38 additions and 38 deletions.

llvm/lib/Target/X86/X86ScheduleBtVer2.td

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -277,7 +277,7 @@ defm : X86WriteRes<WriteFLoadY, [JLAGU, JFPU01, JFPX], 5, [1, 1, 1], 1>;
277277
defm : X86WriteRes<WriteFMaskedLoad, [JLAGU, JFPU01, JFPX], 6, [1, 1, 2], 1>;
278278
defm : X86WriteRes<WriteFMaskedLoadY, [JLAGU, JFPU01, JFPX], 6, [2, 2, 4], 2>;
279279

280-
defm : X86WriteRes<WriteFStore, [JSAGU, JFPU1, JSTC], 1, [1, 1, 1], 1>;
280+
defm : X86WriteRes<WriteFStore, [JSAGU, JFPU1, JSTC], 2, [1, 1, 1], 1>;
281281
defm : X86WriteRes<WriteFStoreX, [JSAGU, JFPU1, JSTC], 1, [1, 1, 1], 1>;
282282
defm : X86WriteRes<WriteFStoreY, [JSAGU, JFPU1, JSTC], 1, [1, 1, 1], 1>;
283283
defm : X86WriteRes<WriteFStoreNT, [JSAGU, JFPU1, JSTC], 3, [1, 1, 1], 1>;
@@ -405,7 +405,7 @@ defm : X86WriteRes<WriteVecLoadNTY, [JLAGU, JFPU01, JVALU], 5, [1, 1, 1],
405405
defm : X86WriteRes<WriteVecMaskedLoad, [JLAGU, JFPU01, JVALU], 6, [1, 1, 2], 1>;
406406
defm : X86WriteRes<WriteVecMaskedLoadY, [JLAGU, JFPU01, JVALU], 6, [2, 2, 4], 2>;
407407

408-
defm : X86WriteRes<WriteVecStore, [JSAGU, JFPU1, JSTC], 1, [1, 1, 1], 1>;
408+
defm : X86WriteRes<WriteVecStore, [JSAGU, JFPU1, JSTC], 2, [1, 1, 1], 1>;
409409
defm : X86WriteRes<WriteVecStoreX, [JSAGU, JFPU1, JSTC], 1, [1, 1, 1], 1>;
410410
defm : X86WriteRes<WriteVecStoreY, [JSAGU, JFPU1, JSTC], 1, [1, 1, 1], 1>;
411411
defm : X86WriteRes<WriteVecStoreNT, [JSAGU, JFPU1, JSTC], 2, [1, 1, 1], 1>;

llvm/test/CodeGen/X86/mmx-schedule.ll

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -953,7 +953,7 @@ define void @test_movq(i64 *%a0) {
953953
; BTVER2: # %bb.0:
954954
; BTVER2-NEXT: movq (%rdi), %mm0 # sched: [5:1.00]
955955
; BTVER2-NEXT: paddd %mm0, %mm0 # sched: [1:0.50]
956-
; BTVER2-NEXT: movq %mm0, (%rdi) # sched: [1:1.00]
956+
; BTVER2-NEXT: movq %mm0, (%rdi) # sched: [2:1.00]
957957
; BTVER2-NEXT: retq # sched: [4:1.00]
958958
;
959959
; ZNVER1-LABEL: test_movq:

llvm/test/CodeGen/X86/sse-schedule.ll

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -2812,7 +2812,7 @@ define void @test_movhps(<4 x float> %a0, <4 x float> %a1, x86_mmx *%a2) {
28122812
; BTVER2-SSE-NEXT: movhpd {{.*#+}} xmm1 = xmm1[0],mem[0] sched: [6:1.00]
28132813
; BTVER2-SSE-NEXT: addps %xmm0, %xmm1 # sched: [3:1.00]
28142814
; BTVER2-SSE-NEXT: movhlps {{.*#+}} xmm1 = xmm1[1,1] sched: [1:0.50]
2815-
; BTVER2-SSE-NEXT: movlps %xmm1, (%rdi) # sched: [1:1.00]
2815+
; BTVER2-SSE-NEXT: movlps %xmm1, (%rdi) # sched: [2:1.00]
28162816
; BTVER2-SSE-NEXT: retq # sched: [4:1.00]
28172817
;
28182818
; BTVER2-LABEL: test_movhps:
@@ -3051,14 +3051,14 @@ define void @test_movlps(<4 x float> %a0, <4 x float> %a1, x86_mmx *%a2) {
30513051
; BTVER2-SSE: # %bb.0:
30523052
; BTVER2-SSE-NEXT: movlpd {{.*#+}} xmm1 = mem[0],xmm1[1] sched: [6:1.00]
30533053
; BTVER2-SSE-NEXT: addps %xmm0, %xmm1 # sched: [3:1.00]
3054-
; BTVER2-SSE-NEXT: movlps %xmm1, (%rdi) # sched: [1:1.00]
3054+
; BTVER2-SSE-NEXT: movlps %xmm1, (%rdi) # sched: [2:1.00]
30553055
; BTVER2-SSE-NEXT: retq # sched: [4:1.00]
30563056
;
30573057
; BTVER2-LABEL: test_movlps:
30583058
; BTVER2: # %bb.0:
30593059
; BTVER2-NEXT: vmovlpd {{.*#+}} xmm1 = mem[0],xmm1[1] sched: [6:1.00]
30603060
; BTVER2-NEXT: vaddps %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
3061-
; BTVER2-NEXT: vmovlps %xmm0, (%rdi) # sched: [1:1.00]
3061+
; BTVER2-NEXT: vmovlps %xmm0, (%rdi) # sched: [2:1.00]
30623062
; BTVER2-NEXT: retq # sched: [4:1.00]
30633063
;
30643064
; ZNVER1-SSE-LABEL: test_movlps:
@@ -3367,14 +3367,14 @@ define void @test_movss_mem(float* %a0, float* %a1) {
33673367
; BTVER2-SSE: # %bb.0:
33683368
; BTVER2-SSE-NEXT: movss {{.*#+}} xmm0 = mem[0],zero,zero,zero sched: [5:1.00]
33693369
; BTVER2-SSE-NEXT: addss %xmm0, %xmm0 # sched: [3:1.00]
3370-
; BTVER2-SSE-NEXT: movss %xmm0, (%rsi) # sched: [1:1.00]
3370+
; BTVER2-SSE-NEXT: movss %xmm0, (%rsi) # sched: [2:1.00]
33713371
; BTVER2-SSE-NEXT: retq # sched: [4:1.00]
33723372
;
33733373
; BTVER2-LABEL: test_movss_mem:
33743374
; BTVER2: # %bb.0:
33753375
; BTVER2-NEXT: vmovss {{.*#+}} xmm0 = mem[0],zero,zero,zero sched: [5:1.00]
33763376
; BTVER2-NEXT: vaddss %xmm0, %xmm0, %xmm0 # sched: [3:1.00]
3377-
; BTVER2-NEXT: vmovss %xmm0, (%rsi) # sched: [1:1.00]
3377+
; BTVER2-NEXT: vmovss %xmm0, (%rsi) # sched: [2:1.00]
33783378
; BTVER2-NEXT: retq # sched: [4:1.00]
33793379
;
33803380
; ZNVER1-SSE-LABEL: test_movss_mem:

llvm/test/CodeGen/X86/sse2-schedule.ll

Lines changed: 12 additions & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -4610,7 +4610,7 @@ define i32 @test_movd(<4 x i32> %a0, i32 %a1, i32 *%a2) {
46104610
; BTVER2-SSE-NEXT: movd {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [5:1.00]
46114611
; BTVER2-SSE-NEXT: movd %edi, %xmm1 # sched: [1:0.50]
46124612
; BTVER2-SSE-NEXT: paddd %xmm0, %xmm1 # sched: [1:0.50]
4613-
; BTVER2-SSE-NEXT: movd %xmm1, (%rsi) # sched: [1:1.00]
4613+
; BTVER2-SSE-NEXT: movd %xmm1, (%rsi) # sched: [2:1.00]
46144614
; BTVER2-SSE-NEXT: paddd %xmm0, %xmm2 # sched: [1:0.50]
46154615
; BTVER2-SSE-NEXT: movd %xmm2, %eax # sched: [1:0.50]
46164616
; BTVER2-SSE-NEXT: retq # sched: [4:1.00]
@@ -4620,7 +4620,7 @@ define i32 @test_movd(<4 x i32> %a0, i32 %a1, i32 *%a2) {
46204620
; BTVER2-NEXT: vmovd {{.*#+}} xmm2 = mem[0],zero,zero,zero sched: [5:1.00]
46214621
; BTVER2-NEXT: vmovd %edi, %xmm1 # sched: [1:0.50]
46224622
; BTVER2-NEXT: vpaddd %xmm1, %xmm0, %xmm1 # sched: [1:0.50]
4623-
; BTVER2-NEXT: vmovd %xmm1, (%rsi) # sched: [1:1.00]
4623+
; BTVER2-NEXT: vmovd %xmm1, (%rsi) # sched: [2:1.00]
46244624
; BTVER2-NEXT: vpaddd %xmm2, %xmm0, %xmm0 # sched: [1:0.50]
46254625
; BTVER2-NEXT: vmovd %xmm0, %eax # sched: [1:0.50]
46264626
; BTVER2-NEXT: retq # sched: [4:1.00]
@@ -4791,7 +4791,7 @@ define i64 @test_movd_64(<2 x i64> %a0, i64 %a1, i64 *%a2) {
47914791
; BTVER2-SSE-NEXT: movq {{.*#+}} xmm2 = mem[0],zero sched: [5:1.00]
47924792
; BTVER2-SSE-NEXT: movq %rdi, %xmm1 # sched: [1:0.50]
47934793
; BTVER2-SSE-NEXT: paddq %xmm0, %xmm1 # sched: [1:0.50]
4794-
; BTVER2-SSE-NEXT: movq %xmm1, (%rsi) # sched: [1:1.00]
4794+
; BTVER2-SSE-NEXT: movq %xmm1, (%rsi) # sched: [2:1.00]
47954795
; BTVER2-SSE-NEXT: paddq %xmm0, %xmm2 # sched: [1:0.50]
47964796
; BTVER2-SSE-NEXT: movq %xmm2, %rax # sched: [1:0.50]
47974797
; BTVER2-SSE-NEXT: retq # sched: [4:1.00]
@@ -4801,7 +4801,7 @@ define i64 @test_movd_64(<2 x i64> %a0, i64 %a1, i64 *%a2) {
48014801
; BTVER2-NEXT: vmovq {{.*#+}} xmm2 = mem[0],zero sched: [5:1.00]
48024802
; BTVER2-NEXT: vmovq %rdi, %xmm1 # sched: [1:0.50]
48034803
; BTVER2-NEXT: vpaddq %xmm1, %xmm0, %xmm1 # sched: [1:0.50]
4804-
; BTVER2-NEXT: vmovq %xmm1, (%rsi) # sched: [1:1.00]
4804+
; BTVER2-NEXT: vmovq %xmm1, (%rsi) # sched: [2:1.00]
48054805
; BTVER2-NEXT: vpaddq %xmm2, %xmm0, %xmm0 # sched: [1:0.50]
48064806
; BTVER2-NEXT: vmovq %xmm0, %rax # sched: [1:0.50]
48074807
; BTVER2-NEXT: retq # sched: [4:1.00]
@@ -4932,14 +4932,14 @@ define void @test_movhpd(<2 x double> %a0, <2 x double> %a1, x86_mmx *%a2) {
49324932
; BTVER2-SSE: # %bb.0:
49334933
; BTVER2-SSE-NEXT: movhpd {{.*#+}} xmm1 = xmm1[0],mem[0] sched: [6:1.00]
49344934
; BTVER2-SSE-NEXT: addpd %xmm0, %xmm1 # sched: [3:1.00]
4935-
; BTVER2-SSE-NEXT: movhpd %xmm1, (%rdi) # sched: [1:1.00]
4935+
; BTVER2-SSE-NEXT: movhpd %xmm1, (%rdi) # sched: [2:1.00]
49364936
; BTVER2-SSE-NEXT: retq # sched: [4:1.00]
49374937
;
49384938
; BTVER2-LABEL: test_movhpd:
49394939
; BTVER2: # %bb.0:
49404940
; BTVER2-NEXT: vmovhpd {{.*#+}} xmm1 = xmm1[0],mem[0] sched: [6:1.00]
49414941
; BTVER2-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
4942-
; BTVER2-NEXT: vmovhpd %xmm0, (%rdi) # sched: [1:1.00]
4942+
; BTVER2-NEXT: vmovhpd %xmm0, (%rdi) # sched: [2:1.00]
49434943
; BTVER2-NEXT: retq # sched: [4:1.00]
49444944
;
49454945
; ZNVER1-SSE-LABEL: test_movhpd:
@@ -5060,14 +5060,14 @@ define void @test_movlpd(<2 x double> %a0, <2 x double> %a1, x86_mmx *%a2) {
50605060
; BTVER2-SSE: # %bb.0:
50615061
; BTVER2-SSE-NEXT: movlpd {{.*#+}} xmm1 = mem[0],xmm1[1] sched: [6:1.00]
50625062
; BTVER2-SSE-NEXT: addpd %xmm0, %xmm1 # sched: [3:1.00]
5063-
; BTVER2-SSE-NEXT: movlpd %xmm1, (%rdi) # sched: [1:1.00]
5063+
; BTVER2-SSE-NEXT: movlpd %xmm1, (%rdi) # sched: [2:1.00]
50645064
; BTVER2-SSE-NEXT: retq # sched: [4:1.00]
50655065
;
50665066
; BTVER2-LABEL: test_movlpd:
50675067
; BTVER2: # %bb.0:
50685068
; BTVER2-NEXT: vmovlpd {{.*#+}} xmm1 = mem[0],xmm1[1] sched: [6:1.00]
50695069
; BTVER2-NEXT: vaddpd %xmm1, %xmm0, %xmm0 # sched: [3:1.00]
5070-
; BTVER2-NEXT: vmovlpd %xmm0, (%rdi) # sched: [1:1.00]
5070+
; BTVER2-NEXT: vmovlpd %xmm0, (%rdi) # sched: [2:1.00]
50715071
; BTVER2-NEXT: retq # sched: [4:1.00]
50725072
;
50735073
; ZNVER1-SSE-LABEL: test_movlpd:
@@ -5496,14 +5496,14 @@ define <2 x i64> @test_movq_mem(<2 x i64> %a0, i64 *%a1) {
54965496
; BTVER2-SSE: # %bb.0:
54975497
; BTVER2-SSE-NEXT: movq {{.*#+}} xmm1 = mem[0],zero sched: [5:1.00]
54985498
; BTVER2-SSE-NEXT: paddq %xmm1, %xmm0 # sched: [1:0.50]
5499-
; BTVER2-SSE-NEXT: movq %xmm0, (%rdi) # sched: [1:1.00]
5499+
; BTVER2-SSE-NEXT: movq %xmm0, (%rdi) # sched: [2:1.00]
55005500
; BTVER2-SSE-NEXT: retq # sched: [4:1.00]
55015501
;
55025502
; BTVER2-LABEL: test_movq_mem:
55035503
; BTVER2: # %bb.0:
55045504
; BTVER2-NEXT: vmovq {{.*#+}} xmm1 = mem[0],zero sched: [5:1.00]
55055505
; BTVER2-NEXT: vpaddq %xmm1, %xmm0, %xmm0 # sched: [1:0.50]
5506-
; BTVER2-NEXT: vmovq %xmm0, (%rdi) # sched: [1:1.00]
5506+
; BTVER2-NEXT: vmovq %xmm0, (%rdi) # sched: [2:1.00]
55075507
; BTVER2-NEXT: retq # sched: [4:1.00]
55085508
;
55095509
; ZNVER1-SSE-LABEL: test_movq_mem:
@@ -5732,14 +5732,14 @@ define void @test_movsd_mem(double* %a0, double* %a1) {
57325732
; BTVER2-SSE: # %bb.0:
57335733
; BTVER2-SSE-NEXT: movsd {{.*#+}} xmm0 = mem[0],zero sched: [5:1.00]
57345734
; BTVER2-SSE-NEXT: addsd %xmm0, %xmm0 # sched: [3:1.00]
5735-
; BTVER2-SSE-NEXT: movsd %xmm0, (%rsi) # sched: [1:1.00]
5735+
; BTVER2-SSE-NEXT: movsd %xmm0, (%rsi) # sched: [2:1.00]
57365736
; BTVER2-SSE-NEXT: retq # sched: [4:1.00]
57375737
;
57385738
; BTVER2-LABEL: test_movsd_mem:
57395739
; BTVER2: # %bb.0:
57405740
; BTVER2-NEXT: vmovsd {{.*#+}} xmm0 = mem[0],zero sched: [5:1.00]
57415741
; BTVER2-NEXT: vaddsd %xmm0, %xmm0, %xmm0 # sched: [3:1.00]
5742-
; BTVER2-NEXT: vmovsd %xmm0, (%rsi) # sched: [1:1.00]
5742+
; BTVER2-NEXT: vmovsd %xmm0, (%rsi) # sched: [2:1.00]
57435743
; BTVER2-NEXT: retq # sched: [4:1.00]
57445744
;
57455745
; ZNVER1-SSE-LABEL: test_movsd_mem:

llvm/test/tools/llvm-mca/X86/BtVer2/resources-avx1.s

Lines changed: 8 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -1255,7 +1255,7 @@ vzeroupper
12551255
# CHECK-NEXT: 1 1 0.50 vmovd %eax, %xmm2
12561256
# CHECK-NEXT: 1 5 1.00 * vmovd (%rax), %xmm2
12571257
# CHECK-NEXT: 1 1 0.50 vmovd %xmm0, %ecx
1258-
# CHECK-NEXT: 1 1 1.00 * vmovd %xmm0, (%rax)
1258+
# CHECK-NEXT: 1 2 1.00 * vmovd %xmm0, (%rax)
12591259
# CHECK-NEXT: 1 1 0.50 vmovddup %xmm0, %xmm2
12601260
# CHECK-NEXT: 1 6 1.00 * vmovddup (%rax), %xmm2
12611261
# CHECK-NEXT: 2 1 1.00 vmovddup %ymm0, %ymm2
@@ -1274,13 +1274,13 @@ vzeroupper
12741274
# CHECK-NEXT: 1 5 1.00 * vmovdqu (%rax), %ymm2
12751275
# CHECK-NEXT: 1 1 0.50 vmovhlps %xmm0, %xmm1, %xmm2
12761276
# CHECK-NEXT: 1 1 0.50 vmovlhps %xmm0, %xmm1, %xmm2
1277-
# CHECK-NEXT: 1 1 1.00 * vmovhpd %xmm0, (%rax)
1277+
# CHECK-NEXT: 1 2 1.00 * vmovhpd %xmm0, (%rax)
12781278
# CHECK-NEXT: 1 6 1.00 * vmovhpd (%rax), %xmm1, %xmm2
1279-
# CHECK-NEXT: 1 1 1.00 * vmovhps %xmm0, (%rax)
1279+
# CHECK-NEXT: 1 2 1.00 * vmovhps %xmm0, (%rax)
12801280
# CHECK-NEXT: 1 6 1.00 * vmovhps (%rax), %xmm1, %xmm2
1281-
# CHECK-NEXT: 1 1 1.00 * vmovlpd %xmm0, (%rax)
1281+
# CHECK-NEXT: 1 2 1.00 * vmovlpd %xmm0, (%rax)
12821282
# CHECK-NEXT: 1 6 1.00 * vmovlpd (%rax), %xmm1, %xmm2
1283-
# CHECK-NEXT: 1 1 1.00 * vmovlps %xmm0, (%rax)
1283+
# CHECK-NEXT: 1 2 1.00 * vmovlps %xmm0, (%rax)
12841284
# CHECK-NEXT: 1 6 1.00 * vmovlps (%rax), %xmm1, %xmm2
12851285
# CHECK-NEXT: 1 3 1.00 vmovmskpd %xmm0, %ecx
12861286
# CHECK-NEXT: 1 3 1.00 vmovmskpd %ymm0, %ecx
@@ -1298,9 +1298,9 @@ vzeroupper
12981298
# CHECK-NEXT: 1 1 0.50 vmovq %rax, %xmm2
12991299
# CHECK-NEXT: 1 5 1.00 * vmovq (%rax), %xmm2
13001300
# CHECK-NEXT: 1 1 0.50 vmovq %xmm0, %rcx
1301-
# CHECK-NEXT: 1 1 1.00 * vmovq %xmm0, (%rax)
1301+
# CHECK-NEXT: 1 2 1.00 * vmovq %xmm0, (%rax)
13021302
# CHECK-NEXT: 1 1 0.50 vmovsd %xmm0, %xmm1, %xmm2
1303-
# CHECK-NEXT: 1 1 1.00 * vmovsd %xmm0, (%rax)
1303+
# CHECK-NEXT: 1 2 1.00 * vmovsd %xmm0, (%rax)
13041304
# CHECK-NEXT: 1 5 1.00 * vmovsd (%rax), %xmm2
13051305
# CHECK-NEXT: 1 1 0.50 vmovshdup %xmm0, %xmm2
13061306
# CHECK-NEXT: 1 6 1.00 * vmovshdup (%rax), %xmm2
@@ -1311,7 +1311,7 @@ vzeroupper
13111311
# CHECK-NEXT: 2 1 1.00 vmovsldup %ymm0, %ymm2
13121312
# CHECK-NEXT: 2 6 2.00 * vmovsldup (%rax), %ymm2
13131313
# CHECK-NEXT: 1 1 0.50 vmovss %xmm0, %xmm1, %xmm2
1314-
# CHECK-NEXT: 1 1 1.00 * vmovss %xmm0, (%rax)
1314+
# CHECK-NEXT: 1 2 1.00 * vmovss %xmm0, (%rax)
13151315
# CHECK-NEXT: 1 5 1.00 * vmovss (%rax), %xmm2
13161316
# CHECK-NEXT: 1 1 0.50 vmovupd %xmm0, %xmm2
13171317
# CHECK-NEXT: 1 1 1.00 * vmovupd %xmm0, (%rax)

llvm/test/tools/llvm-mca/X86/BtVer2/resources-mmx.s

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -168,11 +168,11 @@ pxor (%rax), %mm2
168168
# CHECK-NEXT: 1 1 0.50 movd %eax, %mm2
169169
# CHECK-NEXT: 1 5 1.00 * movd (%rax), %mm2
170170
# CHECK-NEXT: 1 1 0.50 movd %mm0, %ecx
171-
# CHECK-NEXT: 1 1 1.00 * * movd %mm0, (%rax)
171+
# CHECK-NEXT: 1 2 1.00 * * movd %mm0, (%rax)
172172
# CHECK-NEXT: 1 1 0.50 movq %rax, %mm2
173173
# CHECK-NEXT: 1 5 1.00 * movq (%rax), %mm2
174174
# CHECK-NEXT: 1 1 0.50 movq %mm0, %rcx
175-
# CHECK-NEXT: 1 1 1.00 * movq %mm0, (%rax)
175+
# CHECK-NEXT: 1 2 1.00 * movq %mm0, (%rax)
176176
# CHECK-NEXT: 1 1 0.50 packsswb %mm0, %mm2
177177
# CHECK-NEXT: 1 6 1.00 * packsswb (%rax), %mm2
178178
# CHECK-NEXT: 1 1 0.50 packssdw %mm0, %mm2

llvm/test/tools/llvm-mca/X86/BtVer2/resources-sse1.s

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -245,15 +245,15 @@ xorps (%rax), %xmm2
245245
# CHECK-NEXT: 1 5 1.00 * movaps (%rax), %xmm2
246246
# CHECK-NEXT: 1 1 0.50 movhlps %xmm0, %xmm2
247247
# CHECK-NEXT: 1 1 0.50 movlhps %xmm0, %xmm2
248-
# CHECK-NEXT: 1 1 1.00 * movhps %xmm0, (%rax)
248+
# CHECK-NEXT: 1 2 1.00 * movhps %xmm0, (%rax)
249249
# CHECK-NEXT: 1 6 1.00 * movhps (%rax), %xmm2
250-
# CHECK-NEXT: 1 1 1.00 * movlps %xmm0, (%rax)
250+
# CHECK-NEXT: 1 2 1.00 * movlps %xmm0, (%rax)
251251
# CHECK-NEXT: 1 6 1.00 * movlps (%rax), %xmm2
252252
# CHECK-NEXT: 1 3 1.00 movmskps %xmm0, %ecx
253253
# CHECK-NEXT: 1 3 1.00 * movntps %xmm0, (%rax)
254254
# CHECK-NEXT: 1 2 1.00 * * * movntq %mm0, (%rax)
255255
# CHECK-NEXT: 1 1 0.50 movss %xmm0, %xmm2
256-
# CHECK-NEXT: 1 1 1.00 * movss %xmm0, (%rax)
256+
# CHECK-NEXT: 1 2 1.00 * movss %xmm0, (%rax)
257257
# CHECK-NEXT: 1 5 1.00 * movss (%rax), %xmm2
258258
# CHECK-NEXT: 1 1 0.50 movups %xmm0, %xmm2
259259
# CHECK-NEXT: 1 1 1.00 * movups %xmm0, (%rax)

llvm/test/tools/llvm-mca/X86/BtVer2/resources-sse2.s

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -475,17 +475,17 @@ xorpd (%rax), %xmm2
475475
# CHECK-NEXT: 1 1 0.50 movd %eax, %xmm2
476476
# CHECK-NEXT: 1 5 1.00 * movd (%rax), %xmm2
477477
# CHECK-NEXT: 1 1 0.50 movd %xmm0, %ecx
478-
# CHECK-NEXT: 1 1 1.00 * movd %xmm0, (%rax)
478+
# CHECK-NEXT: 1 2 1.00 * movd %xmm0, (%rax)
479479
# CHECK-NEXT: 1 1 0.50 movdqa %xmm0, %xmm2
480480
# CHECK-NEXT: 1 1 1.00 * movdqa %xmm0, (%rax)
481481
# CHECK-NEXT: 1 5 1.00 * movdqa (%rax), %xmm2
482482
# CHECK-NEXT: 1 1 0.50 movdqu %xmm0, %xmm2
483483
# CHECK-NEXT: 1 1 1.00 * movdqu %xmm0, (%rax)
484484
# CHECK-NEXT: 1 5 1.00 * movdqu (%rax), %xmm2
485485
# CHECK-NEXT: 1 1 0.50 movdq2q %xmm0, %mm2
486-
# CHECK-NEXT: 1 1 1.00 * movhpd %xmm0, (%rax)
486+
# CHECK-NEXT: 1 2 1.00 * movhpd %xmm0, (%rax)
487487
# CHECK-NEXT: 1 6 1.00 * movhpd (%rax), %xmm2
488-
# CHECK-NEXT: 1 1 1.00 * movlpd %xmm0, (%rax)
488+
# CHECK-NEXT: 1 2 1.00 * movlpd %xmm0, (%rax)
489489
# CHECK-NEXT: 1 6 1.00 * movlpd (%rax), %xmm2
490490
# CHECK-NEXT: 1 3 1.00 movmskpd %xmm0, %ecx
491491
# CHECK-NEXT: 1 1 1.00 * movntil %eax, (%rax)
@@ -496,10 +496,10 @@ xorpd (%rax), %xmm2
496496
# CHECK-NEXT: 1 1 0.50 movq %rax, %xmm2
497497
# CHECK-NEXT: 1 5 1.00 * movq (%rax), %xmm2
498498
# CHECK-NEXT: 1 1 0.50 movq %xmm0, %rcx
499-
# CHECK-NEXT: 1 1 1.00 * movq %xmm0, (%rax)
499+
# CHECK-NEXT: 1 2 1.00 * movq %xmm0, (%rax)
500500
# CHECK-NEXT: 1 1 0.50 movq2dq %mm0, %xmm2
501501
# CHECK-NEXT: 1 1 0.50 movsd %xmm0, %xmm2
502-
# CHECK-NEXT: 1 1 1.00 * movsd %xmm0, (%rax)
502+
# CHECK-NEXT: 1 2 1.00 * movsd %xmm0, (%rax)
503503
# CHECK-NEXT: 1 5 1.00 * movsd (%rax), %xmm2
504504
# CHECK-NEXT: 1 1 0.50 movupd %xmm0, %xmm2
505505
# CHECK-NEXT: 1 1 1.00 * movupd %xmm0, (%rax)

0 commit comments

Comments
 (0)