@@ -1311,18 +1311,18 @@ vzeroupper
1311
1311
# CHECK-NEXT: 1 5 0.50 * vmovq (%rax), %xmm2
1312
1312
# CHECK-NEXT: 1 2 1.00 vmovq %xmm0, %rcx
1313
1313
# CHECK-NEXT: 2 1 1.00 * vmovq %xmm0, (%rax)
1314
- # CHECK-NEXT: 1 1 1.00 vmovsd %xmm0, %xmm1, %xmm2
1314
+ # CHECK-NEXT: 1 1 0.33 vmovsd %xmm0, %xmm1, %xmm2
1315
1315
# CHECK-NEXT: 2 1 1.00 * vmovsd %xmm0, (%rax)
1316
1316
# CHECK-NEXT: 1 5 0.50 * vmovsd (%rax), %xmm2
1317
- # CHECK-NEXT: 1 1 1.00 vmovshdup %xmm0, %xmm2
1317
+ # CHECK-NEXT: 1 1 0.50 vmovshdup %xmm0, %xmm2
1318
1318
# CHECK-NEXT: 1 6 0.50 * vmovshdup (%rax), %xmm2
1319
- # CHECK-NEXT: 1 1 1.00 vmovshdup %ymm0, %ymm2
1319
+ # CHECK-NEXT: 1 1 0.50 vmovshdup %ymm0, %ymm2
1320
1320
# CHECK-NEXT: 1 7 0.50 * vmovshdup (%rax), %ymm2
1321
- # CHECK-NEXT: 1 1 1.00 vmovsldup %xmm0, %xmm2
1321
+ # CHECK-NEXT: 1 1 0.50 vmovsldup %xmm0, %xmm2
1322
1322
# CHECK-NEXT: 1 6 0.50 * vmovsldup (%rax), %xmm2
1323
- # CHECK-NEXT: 1 1 1.00 vmovsldup %ymm0, %ymm2
1323
+ # CHECK-NEXT: 1 1 0.50 vmovsldup %ymm0, %ymm2
1324
1324
# CHECK-NEXT: 1 7 0.50 * vmovsldup (%rax), %ymm2
1325
- # CHECK-NEXT: 1 1 1.00 vmovss %xmm0, %xmm1, %xmm2
1325
+ # CHECK-NEXT: 1 1 0.33 vmovss %xmm0, %xmm1, %xmm2
1326
1326
# CHECK-NEXT: 2 1 1.00 * vmovss %xmm0, (%rax)
1327
1327
# CHECK-NEXT: 1 5 0.50 * vmovss (%rax), %xmm2
1328
1328
# CHECK-NEXT: 1 1 0.33 vmovupd %xmm0, %xmm2
@@ -1650,14 +1650,14 @@ vzeroupper
1650
1650
# CHECK-NEXT: 2 11 1.00 * vrsqrtps (%rax), %ymm2
1651
1651
# CHECK-NEXT: 1 4 1.00 vrsqrtss %xmm0, %xmm1, %xmm2
1652
1652
# CHECK-NEXT: 2 9 1.00 * vrsqrtss (%rax), %xmm1, %xmm2
1653
- # CHECK-NEXT: 1 1 1.00 vshufpd $1, %xmm0, %xmm1, %xmm2
1654
- # CHECK-NEXT: 2 7 1.00 * vshufpd $1, (%rax), %xmm1, %xmm2
1655
- # CHECK-NEXT: 1 1 1.00 vshufpd $1, %ymm0, %ymm1, %ymm2
1656
- # CHECK-NEXT: 2 8 1.00 * vshufpd $1, (%rax), %ymm1, %ymm2
1657
- # CHECK-NEXT: 1 1 1.00 vshufps $1, %xmm0, %xmm1, %xmm2
1658
- # CHECK-NEXT: 2 7 1.00 * vshufps $1, (%rax), %xmm1, %xmm2
1659
- # CHECK-NEXT: 1 1 1.00 vshufps $1, %ymm0, %ymm1, %ymm2
1660
- # CHECK-NEXT: 2 8 1.00 * vshufps $1, (%rax), %ymm1, %ymm2
1653
+ # CHECK-NEXT: 1 1 0.50 vshufpd $1, %xmm0, %xmm1, %xmm2
1654
+ # CHECK-NEXT: 2 7 0.50 * vshufpd $1, (%rax), %xmm1, %xmm2
1655
+ # CHECK-NEXT: 1 1 0.50 vshufpd $1, %ymm0, %ymm1, %ymm2
1656
+ # CHECK-NEXT: 2 8 0.50 * vshufpd $1, (%rax), %ymm1, %ymm2
1657
+ # CHECK-NEXT: 1 1 0.50 vshufps $1, %xmm0, %xmm1, %xmm2
1658
+ # CHECK-NEXT: 2 7 0.50 * vshufps $1, (%rax), %xmm1, %xmm2
1659
+ # CHECK-NEXT: 1 1 0.50 vshufps $1, %ymm0, %ymm1, %ymm2
1660
+ # CHECK-NEXT: 2 8 0.50 * vshufps $1, (%rax), %ymm1, %ymm2
1661
1661
# CHECK-NEXT: 1 18 6.00 vsqrtpd %xmm0, %xmm2
1662
1662
# CHECK-NEXT: 2 24 6.00 * vsqrtpd (%rax), %xmm2
1663
1663
# CHECK-NEXT: 1 18 12.00 vsqrtpd %ymm0, %ymm2
@@ -1738,7 +1738,7 @@ vzeroupper
1738
1738
1739
1739
# CHECK: Resource pressure per iteration:
1740
1740
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11]
1741
- # CHECK-NEXT: - 123.00 317.42 221.42 173.17 173.17 34.00 312.92 6.25 12.67 - -
1741
+ # CHECK-NEXT: - 123.00 318.08 228.08 173.17 173.17 34.00 305.58 6.25 12.67 - -
1742
1742
1743
1743
# CHECK: Resource pressure by instruction:
1744
1744
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] Instructions:
@@ -2023,18 +2023,18 @@ vzeroupper
2023
2023
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - vmovq (%rax), %xmm2
2024
2024
# CHECK-NEXT: - - 1.00 - - - - - - - - - vmovq %xmm0, %rcx
2025
2025
# CHECK-NEXT: - - - - 0.33 0.33 1.00 - - 0.33 - - vmovq %xmm0, (%rax)
2026
- # CHECK-NEXT: - - - - - - - 1.00 - - - - vmovsd %xmm0, %xmm1, %xmm2
2026
+ # CHECK-NEXT: - - 0.33 0.33 - - - 0.33 - - - - vmovsd %xmm0, %xmm1, %xmm2
2027
2027
# CHECK-NEXT: - - - - 0.33 0.33 1.00 - - 0.33 - - vmovsd %xmm0, (%rax)
2028
2028
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - vmovsd (%rax), %xmm2
2029
- # CHECK-NEXT: - - - - - - - 1.00 - - - - vmovshdup %xmm0, %xmm2
2029
+ # CHECK-NEXT: - - - 0.50 - - - 0.50 - - - - vmovshdup %xmm0, %xmm2
2030
2030
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - vmovshdup (%rax), %xmm2
2031
- # CHECK-NEXT: - - - - - - - 1.00 - - - - vmovshdup %ymm0, %ymm2
2031
+ # CHECK-NEXT: - - - 0.50 - - - 0.50 - - - - vmovshdup %ymm0, %ymm2
2032
2032
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - vmovshdup (%rax), %ymm2
2033
- # CHECK-NEXT: - - - - - - - 1.00 - - - - vmovsldup %xmm0, %xmm2
2033
+ # CHECK-NEXT: - - - 0.50 - - - 0.50 - - - - vmovsldup %xmm0, %xmm2
2034
2034
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - vmovsldup (%rax), %xmm2
2035
- # CHECK-NEXT: - - - - - - - 1.00 - - - - vmovsldup %ymm0, %ymm2
2035
+ # CHECK-NEXT: - - - 0.50 - - - 0.50 - - - - vmovsldup %ymm0, %ymm2
2036
2036
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - vmovsldup (%rax), %ymm2
2037
- # CHECK-NEXT: - - - - - - - 1.00 - - - - vmovss %xmm0, %xmm1, %xmm2
2037
+ # CHECK-NEXT: - - 0.33 0.33 - - - 0.33 - - - - vmovss %xmm0, %xmm1, %xmm2
2038
2038
# CHECK-NEXT: - - - - 0.33 0.33 1.00 - - 0.33 - - vmovss %xmm0, (%rax)
2039
2039
# CHECK-NEXT: - - - - 0.50 0.50 - - - - - - vmovss (%rax), %xmm2
2040
2040
# CHECK-NEXT: - - 0.33 0.33 - - - 0.33 - - - - vmovupd %xmm0, %xmm2
@@ -2362,14 +2362,14 @@ vzeroupper
2362
2362
# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vrsqrtps (%rax), %ymm2
2363
2363
# CHECK-NEXT: - - 1.00 - - - - - - - - - vrsqrtss %xmm0, %xmm1, %xmm2
2364
2364
# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vrsqrtss (%rax), %xmm1, %xmm2
2365
- # CHECK-NEXT: - - - - - - - 1.00 - - - - vshufpd $1, %xmm0, %xmm1, %xmm2
2366
- # CHECK-NEXT: - - - - 0.50 0.50 - 1.00 - - - - vshufpd $1, (%rax), %xmm1, %xmm2
2367
- # CHECK-NEXT: - - - - - - - 1.00 - - - - vshufpd $1, %ymm0, %ymm1, %ymm2
2368
- # CHECK-NEXT: - - - - 0.50 0.50 - 1.00 - - - - vshufpd $1, (%rax), %ymm1, %ymm2
2369
- # CHECK-NEXT: - - - - - - - 1.00 - - - - vshufps $1, %xmm0, %xmm1, %xmm2
2370
- # CHECK-NEXT: - - - - 0.50 0.50 - 1.00 - - - - vshufps $1, (%rax), %xmm1, %xmm2
2371
- # CHECK-NEXT: - - - - - - - 1.00 - - - - vshufps $1, %ymm0, %ymm1, %ymm2
2372
- # CHECK-NEXT: - - - - 0.50 0.50 - 1.00 - - - - vshufps $1, (%rax), %ymm1, %ymm2
2365
+ # CHECK-NEXT: - - - 0.50 - - - 0.50 - - - - vshufpd $1, %xmm0, %xmm1, %xmm2
2366
+ # CHECK-NEXT: - - - 0.50 0.50 0.50 - 0.50 - - - - vshufpd $1, (%rax), %xmm1, %xmm2
2367
+ # CHECK-NEXT: - - - 0.50 - - - 0.50 - - - - vshufpd $1, %ymm0, %ymm1, %ymm2
2368
+ # CHECK-NEXT: - - - 0.50 0.50 0.50 - 0.50 - - - - vshufpd $1, (%rax), %ymm1, %ymm2
2369
+ # CHECK-NEXT: - - - 0.50 - - - 0.50 - - - - vshufps $1, %xmm0, %xmm1, %xmm2
2370
+ # CHECK-NEXT: - - - 0.50 0.50 0.50 - 0.50 - - - - vshufps $1, (%rax), %xmm1, %xmm2
2371
+ # CHECK-NEXT: - - - 0.50 - - - 0.50 - - - - vshufps $1, %ymm0, %ymm1, %ymm2
2372
+ # CHECK-NEXT: - - - 0.50 0.50 0.50 - 0.50 - - - - vshufps $1, (%rax), %ymm1, %ymm2
2373
2373
# CHECK-NEXT: - 6.00 1.00 - - - - - - - - - vsqrtpd %xmm0, %xmm2
2374
2374
# CHECK-NEXT: - 6.00 1.00 - 0.50 0.50 - - - - - - vsqrtpd (%rax), %xmm2
2375
2375
# CHECK-NEXT: - 12.00 1.00 - - - - - - - - - vsqrtpd %ymm0, %ymm2
0 commit comments