11Iterations: 100
2- Instructions: 2500
3- Total Cycles: 849
4- Total uOps: 2800
2+ Instructions: 2400
3+ Total Cycles: 1406
4+ Total uOps: 2700
55
66Dispatch Width: 4
7- uOps Per Cycle: 3.30
8- IPC: 2.94
9- Block RThroughput: 7.0
7+ uOps Per Cycle: 1.92
8+ IPC: 1.71
9+ Block RThroughput: 6.8
1010
1111
1212Instruction Info:
@@ -18,18 +18,14 @@ Instruction Info:
1818[6]: HasSideEffects (U)
1919
2020[1] [2] [3] [4] [5] [6] Instructions:
21- 1 1 0.33 test dil, 3
22- 1 1 1.00 je .LBB5_2
23- 1 0 0.25 xor eax, eax
24- 1 1 0.33 mov rdx, rsi
25- 1 1 1.00 U ret
2621 1 1 0.33 movabs rax, 9223372036854775804
2722 1 1 0.33 and rax, rsi
2823 1 1 0.33 cmp rax, 9
29- 1 1 1.00 jae .LBB5_4
30- 1 0 0.25 xor eax, eax
31- 1 1 0.33 mov rdx, rsi
32- 1 1 1.00 U ret
24+ 1 1 0.50 setb cl
25+ 1 1 0.33 test dil, 3
26+ 1 1 0.50 setne dl
27+ 1 1 0.33 or dl, cl
28+ 1 1 1.00 jne .LBB5_1
3329 1 1 0.33 add rax, -9
3430 1 1 0.33 movabs rcx, -6148914691236517205
3531 2 4 1.00 mul rcx
@@ -43,6 +39,9 @@ Instruction Info:
4339 2 2 0.67 cmove rax, rdi
4440 1 1 0.33 mov rdx, rsi
4541 1 1 1.00 U ret
42+ 1 0 0.25 xor eax, eax
43+ 1 1 0.33 mov rdx, rsi
44+ 1 1 1.00 U ret
4645
4746
4847Resources:
@@ -58,32 +57,31 @@ Resources:
5857
5958Resource pressure per iteration:
6059[0] [1] [2] [3] [4] [5] [6.0] [6.1]
61- - - 8.33 8.32 - 8.35 - -
60+ - - 8.02 8.02 - 8.96 - -
6261
6362Resource pressure by instruction:
6463[0] [1] [2] [3] [4] [5] [6.0] [6.1] Instructions:
65- - - 0.35 0.33 - 0.32 - - test dil, 3
66- - - - - - 1.00 - - je .LBB5_2
67- - - - - - - - - xor eax, eax
68- - - 0.92 0.04 - 0.04 - - mov rdx, rsi
69- - - - - - 1.00 - - ret
70- - - 0.32 0.15 - 0.53 - - movabs rax, 9223372036854775804
71- - - 0.03 0.06 - 0.91 - - and rax, rsi
72- - - 0.05 0.93 - 0.02 - - cmp rax, 9
73- - - - - - 1.00 - - jae .LBB5_4
64+ - - 0.02 0.03 - 0.95 - - movabs rax, 9223372036854775804
65+ - - 0.94 0.02 - 0.04 - - and rax, rsi
66+ - - 0.01 0.04 - 0.95 - - cmp rax, 9
67+ - - 0.97 - - 0.03 - - setb cl
68+ - - 0.98 - - 0.02 - - test dil, 3
69+ - - 0.04 - - 0.96 - - setne dl
70+ - - 0.01 0.03 - 0.96 - - or dl, cl
71+ - - - - - 1.00 - - jne .LBB5_1
72+ - - 0.04 0.95 - 0.01 - - add rax, -9
73+ - - 0.02 0.98 - - - - movabs rcx, -6148914691236517205
74+ - - 1.00 1.00 - - - - mul rcx
75+ - - 0.98 - - 0.02 - - shr rdx
76+ - - 0.01 0.99 - - - - lea rcx, [rdx + 2*rdx]
77+ - - 0.02 0.02 - 0.96 - - or rcx, 3
78+ - - 0.02 0.95 - 0.03 - - add rcx, 9
7479 - - - - - - - - xor eax, eax
75- - - 0.93 0.04 - 0.03 - - mov rdx, rsi
80+ - - 0.95 0.04 - 0.01 - - cmp rsi, rcx
81+ - - 0.98 0.99 - 0.03 - - cmove rsi, rdx
82+ - - 0.98 0.99 - 0.03 - - cmove rax, rdi
83+ - - 0.01 0.04 - 0.95 - - mov rdx, rsi
7684 - - - - - 1.00 - - ret
77- - - 0.37 0.33 - 0.30 - - add rax, -9
78- - - 0.61 0.09 - 0.30 - - movabs rcx, -6148914691236517205
79- - - 1.00 1.00 - - - - mul rcx
80- - - 0.67 - - 0.33 - - shr rdx
81- - - 0.33 0.67 - - - - lea rcx, [rdx + 2*rdx]
82- - - 0.34 0.61 - 0.05 - - or rcx, 3
83- - - 0.36 0.61 - 0.03 - - add rcx, 9
8485 - - - - - - - - xor eax, eax
85- - - 0.04 0.63 - 0.33 - - cmp rsi, rcx
86- - - 0.98 0.97 - 0.05 - - cmove rsi, rdx
87- - - 0.98 0.94 - 0.08 - - cmove rax, rdi
88- - - 0.05 0.92 - 0.03 - - mov rdx, rsi
86+ - - 0.04 0.95 - 0.01 - - mov rdx, rsi
8987 - - - - - 1.00 - - ret
0 commit comments