Copyright (C) 2003, 2009 Lavalys Consulting Group, Inc. All rights reserved. everest_bench.dll build: 2.4.257.0 Jan 19 2009 01:57:35 CPUCount: 1, procMask: 0x00000001 Size of Memory: 245232KB Priority:080 CPU#00 Vendor: CentaurHauls CoreType:0x30000698 CPU#00 Family: 6 Model: 09 Stepping: 8 Type: "VIA Nehemiah" CPU#00 Features: TSC, FPU, CMOV, MMX, SSE, ACE, CMPXCHG8B CPU#00 Frequency: 1333.31MHz OS:5.1.2600 Service Pack 2 CPU#00 AffMask:0x00000001 APIC_ID:0x00000000 Phys_ID:000 Core_ID:00 SMT_ID:00 PhysMask:0x00000001 CPU#00 L1I cache: 64KB, 32 byte cache line, 4 way, SMask:00000001 CPU#00 L1D cache: 64KB, 32 byte cache line, 4 way, SMask:00000001 CPU#00 L2 cache: 64KB, 32 byte cache line, 16 way, SMask:00000001, exclusive Parameters: "-ph -d4031 " Instruction Latency: Used CPUs: 1 ProcMask:0x00000001 0 X86 :NOP L: [no true dep.] T: 0.75ns= 1.00c 1 X86 :0x66 NOP L: [no true dep.] T: 1.50ns= 2.00c 2 X86 : 2x 0x66 NOP L: [no true dep.] T: 2.25ns= 3.00c 3 X86 : 3x 0x66 NOP L: [no true dep.] T: 3.00ns= 4.00c 4 X86 : 4x 0x66 NOP L: [no true dep.] T: 3.75ns= 5.00c 5 X86 : 5x 0x66 NOP L: [no true dep.] T: 4.50ns= 6.00c 6 X86 : 6x 0x66 NOP L: [no true dep.] T: 5.25ns= 7.00c 7 X86 : 7x 0x66 NOP L: [no true dep.] T: 6.00ns= 8.00c 8 X86 : 8x 0x66 NOP L: [no true dep.] T: 6.75ns= 9.00c 9 X86 : 9x 0x66 NOP L: [no true dep.] T: 7.50ns= 10.00c 10 X86 :10x 0x66 NOP L: [no true dep.] T: 8.25ns= 11.00c 11 X86 :11x 0x66 NOP L: [no true dep.] T: 9.00ns= 12.00c 12 X86 :12x 0x66 NOP L: [no true dep.] T: 9.75ns= 13.00c 13 X86 :13x 0x66 NOP L: [no true dep.] T: 10.50ns= 14.00c 14 X86 :14x 0x66 NOP L: [no true dep.] T: 11.25ns= 15.00c 16 X86 :MOV r8, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 17 X86 :MOV r16, imm16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 18 X86 :MOV r32, imm32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 20 X86 :MOV r8, r8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 21 X86 :MOV r16, r16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 22 X86 :MOV r32, r32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 24 X86 :MOV r8, [m8] L: 5.25ns= 7.0c T: 0.75ns= 1.00c 25 X86 :MOV r16, [m16] L: 4.50ns= 6.0c T: 1.56ns= 2.08c 26 X86 :MOV r32, [m32] L: 4.50ns= 6.0c T: 0.81ns= 1.08c 28 X86 :MOV [m8], r8 L: [memory dep.] T: 0.81ns= 1.08c 29 X86 :MOV [m16], r16 L: [memory dep.] T: 1.56ns= 2.08c 30 X86 :MOV [m32], r32 L: [memory dep.] T: 0.81ns= 1.08c 31 X86 :MOV [m32 + 8], r32 L: [memory dep.] T: 0.81ns= 1.08c 34 X86 :MOV r8,[m8]+MOV [m8],r8 L: 6.00ns= 8.0c T: 3.25ns= 4.33c 35 X86 :MOV r16,[m16]+MOV [m16],r16 L: 11.25ns= 15.0c T: 1.44ns= 1.92c 36 X86 :MOV r32,[m32]+MOV [m32],r32 L: 11.25ns= 15.0c T: 1.31ns= 1.75c 40 CMOV :CMOVNZ r16, r16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 41 CMOV :CMOVNZ r32, r32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 43 X86 :MOVSX r16, r8 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 44 X86 :MOVSX r32, r8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 46 X86 :MOVSX r32, r16 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 49 X86 :MOVZX r16, r8 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 50 X86 :MOVZX r32, r8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 52 X86 :MOVZX r32, r16 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 54 X86 :XCHG r8, r8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 55 X86 :XCHG r16, r16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 56 X86 :XCHG r32, r32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 58 X86 :XCHG r1_8, r2_8 L: 1.50ns= 2.0c T: 0.75ns= 1.00c 59 X86 :XCHG r1_16, r2_16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 60 X86 :XCHG r1_32, r2_32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 62 X86 :XCHG r8, [m8] L: 10.50ns= 14.0c T: 9.75ns= 13.00c 63 X86 :XCHG r16, [m16] L: 10.50ns= 14.0c T: 9.75ns= 13.00c 64 X86 :XCHG r32, [m32] L: 10.50ns= 14.0c T: 9.75ns= 13.00c 66 X86 :ADD r32, 0x04000 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 67 X86 :ADD r32, 0x08000 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 68 X86 :ADD r32, 0x10000 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 69 X86 :ADD r32, 0x20000 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 70 X86 :ADD r8, r8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 71 X86 :ADD r16, r16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 72 X86 :ADD r32, r32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 74 X86 :ADD r8, [m8] L: 5.25ns= 7.0c T: 0.75ns= 1.00c 75 X86 :ADD r16, [m16] L: 5.25ns= 7.0c T: 1.56ns= 2.08c 76 X86 :ADD r32, [m32] L: 5.25ns= 7.0c T: 0.81ns= 1.08c 78 X86 :ADD [m8], r8 L: 6.75ns= 9.0c T: 4.06ns= 5.42c 79 X86 :ADD [m16], r16 L: 6.75ns= 9.0c T: 1.75ns= 2.33c 80 X86 :ADD [m32], r32 L: 6.75ns= 9.0c T: 4.00ns= 5.33c 81 X86 :ADD [m32 + 8], r32 L: 6.75ns= 9.0c T: 6.25ns= 8.33c 84 X86 :LOCK ADD [m8], r8 L: 9.75ns= 13.0c T: 9.75ns= 13.00c 85 X86 :LOCK ADD [m16], r16 L: 9.75ns= 13.0c T: 9.75ns= 13.00c 86 X86 :LOCK ADD [m32], r32 L: 9.75ns= 13.0c T: 9.75ns= 13.00c 87 X86 :LOCK ADD [m32 + 8], r32 L: 9.75ns= 13.0c T: 9.75ns= 13.00c 90 X86 :ADD r8, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 91 X86 :ADD r16, imm8 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 92 X86 :ADD r32, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 94 X86 :ADD r16, imm16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 95 X86 :ADD r32, imm32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 97 X86 :ADD [m8], imm8 L: 6.75ns= 9.0c T: 3.94ns= 5.25c 98 X86 :ADD [m16], imm8 L: 6.75ns= 9.0c T: 1.75ns= 2.33c 99 X86 :ADD [m32], imm8 L: 6.75ns= 9.0c T: 3.94ns= 5.25c 101 X86 :ADD [m16], imm16 L: 6.69ns= 8.9c T: 1.69ns= 2.25c 102 X86 :ADD [m32], imm32 L: 6.75ns= 9.0c T: 3.94ns= 5.25c 104 X86 :ADD al, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 105 X86 :ADD ax, imm16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 106 X86 :ADD eax, imm32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 108 X86 :SUB r8, r8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 109 X86 :SUB r16, r16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 110 X86 :SUB r32, r32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 112 X86 :SUB r1_8, r2_8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 113 X86 :SUB r1_16, r2_16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 114 X86 :SUB r1_32, r2_32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 116 X86 :ADC r8, r8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 117 X86 :ADC r16, r16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 118 X86 :ADC r32, r32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 120 X86 :SBB r8, r8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 121 X86 :SBB r16, r16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 122 X86 :SBB r32, r32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 124 X86 :SBB r1_8, r2_8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 125 X86 :SBB r1_16, r2_16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 126 X86 :SBB r1_32, r2_32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 128 X86 :CMP r8, r8 L: [no true dep.] T: 0.75ns= 1.00c 129 X86 :CMP r16, r16 L: [no true dep.] T: 1.50ns= 2.00c 130 X86 :CMP r32, r32 L: [no true dep.] T: 0.75ns= 1.00c 132 X86 :CMP r1_8, r2_8 L: [no true dep.] T: 0.75ns= 1.00c 133 X86 :CMP r1_16, r2_16 L: [no true dep.] T: 1.50ns= 2.00c 134 X86 :CMP r1_32, r2_32 L: [no true dep.] T: 0.75ns= 1.00c 136 X86 :AND r8, r8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 137 X86 :AND r16, r16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 138 X86 :AND r32, r32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 140 X86 :AND r1_8, r2_8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 141 X86 :AND r1_16, r2_16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 142 X86 :AND r1_32, r2_32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 144 X86 :OR r8, r8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 145 X86 :OR r16, r16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 146 X86 :OR r32, r32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 148 X86 :OR r1_8, r2_8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 149 X86 :OR r1_16, r2_16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 150 X86 :OR r1_32, r2_32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 152 X86 :XOR r8, r8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 153 X86 :XOR r16, r16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 154 X86 :XOR r32, r32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 156 X86 :XOR r1_8, r2_8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 157 X86 :XOR r1_16, r2_16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 158 X86 :XOR r1_32, r2_32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 160 X86 :NEG r8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 161 X86 :NEG r16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 162 X86 :NEG r32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 164 X86 :NOT r8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 165 X86 :NOT r16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 166 X86 :NOT r32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 168 X86 :TEST r8, r8 L: [no true dep.] T: 0.75ns= 1.00c 169 X86 :TEST r16, r16 L: [no true dep.] T: 1.50ns= 2.00c 170 X86 :TEST r32, r32 L: [no true dep.] T: 0.75ns= 1.00c 172 X86 :TEST r1_8, r2_8 L: [no true dep.] T: 0.75ns= 1.00c 173 X86 :TEST r1_16, r2_16 L: [no true dep.] T: 1.50ns= 2.00c 174 X86 :TEST r1_32, r2_32 L: [no true dep.] T: 0.75ns= 1.00c 176 X86 :BT r16, r16 L: [no true dep.] T: 9.00ns= 12.00c 177 X86 :BT r32, r32 L: [no true dep.] T: 9.00ns= 12.00c 179 X86 :BT r16, imm8 L: [no true dep.] T: 3.75ns= 5.00c 180 X86 :BT r32, imm8 L: [no true dep.] T: 3.75ns= 5.00c 182 X86 :BTC r16, r16 L: 16.50ns= 22.0c T: 16.50ns= 22.00c 183 X86 :BTC r32, r32 L: 16.50ns= 22.0c T: 16.50ns= 22.00c 185 X86 :BTC r16, imm8 L: 7.50ns= 10.0c T: 7.50ns= 10.00c 186 X86 :BTC r32, imm8 L: 7.50ns= 10.0c T: 7.50ns= 10.00c 188 X86 :BTR r16, r16 L: 21.00ns= 28.0c T: 21.00ns= 28.00c 189 X86 :BTR r32, r32 L: 21.00ns= 28.0c T: 21.00ns= 28.00c 191 X86 :BTR r16, imm8 L: 10.50ns= 14.0c T: 10.50ns= 14.00c 192 X86 :BTR r32, imm8 L: 10.50ns= 14.0c T: 10.50ns= 14.00c 194 X86 :BTS r16, r16 L: 19.50ns= 26.0c T: 19.50ns= 26.00c 195 X86 :BTS r32, r32 L: 19.50ns= 26.0c T: 19.50ns= 26.00c 197 X86 :BTS r16, imm8 L: 10.50ns= 14.0c T: 10.50ns= 14.00c 198 X86 :BTS r32, imm8 L: 10.50ns= 14.0c T: 10.50ns= 14.00c 200 X86 :SETC r8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 201 X86 :INC r8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 202 X86 :INC r16 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 203 X86 :INC r32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 205 X86 :LEA r16, [r16+r16] L: 1.50ns= 2.0c T: 1.50ns= 2.00c 206 X86 :LEA r32, [r32+r32] L: 0.81ns= 1.1c T: 0.81ns= 1.08c 208 X86 :LEA r16, [r+r+disp8] L: 1.56ns= 2.1c T: 1.56ns= 2.08c 209 X86 :LEA r32, [r+r+disp8] L: 0.75ns= 1.0c T: 0.75ns= 1.00c 211 X86 :LEA r16, [r+r*8] L: 1.50ns= 2.0c T: 1.50ns= 2.00c 212 X86 :LEA r32, [r+r*8] L: 0.81ns= 1.1c T: 0.81ns= 1.08c 214 X86 :LEA r16, [r+r*8+disp8] L: 1.56ns= 2.1c T: 1.56ns= 2.08c 215 X86 :LEA r32, [r+r*8+disp8] L: 0.75ns= 1.0c T: 0.75ns= 1.00c 217 X86 :SHL r8, 1 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 218 X86 :SHL r16, 1 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 219 X86 :SHL r32, 1 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 221 X86 :SHL r8, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 222 X86 :SHL r16, imm8 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 223 X86 :SHL r32, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 225 X86 :SHL r8, cl L: 0.75ns= 1.0c T: 0.75ns= 1.00c 226 X86 :SHL r16, cl L: 1.50ns= 2.0c T: 1.50ns= 2.00c 227 X86 :SHL r32, cl L: 0.75ns= 1.0c T: 0.75ns= 1.00c 229 X86 :SHR r8, 1 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 230 X86 :SHR r16, 1 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 231 X86 :SHR r32, 1 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 233 X86 :SHR r8, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 234 X86 :SHR r16, imm8 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 235 X86 :SHR r32, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 237 X86 :SHR r8, cl L: 0.75ns= 1.0c T: 0.75ns= 1.00c 238 X86 :SHR r16, cl L: 1.50ns= 2.0c T: 1.50ns= 2.00c 239 X86 :SHR r32, cl L: 0.75ns= 1.0c T: 0.75ns= 1.00c 241 X86 :SAR r8, 1 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 242 X86 :SAR r16, 1 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 243 X86 :SAR r32, 1 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 245 X86 :SAR r8, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 246 X86 :SAR r16, imm8 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 247 X86 :SAR r32, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 249 X86 :SAR r8, cl L: 0.75ns= 1.0c T: 0.75ns= 1.00c 250 X86 :SAR r16, cl L: 1.50ns= 2.0c T: 1.50ns= 2.00c 251 X86 :SAR r32, cl L: 0.75ns= 1.0c T: 0.75ns= 1.00c 253 X86 :SHLD r16, r16, imm8 L: 27.75ns= 37.0c T: 27.75ns= 37.00c 254 X86 :SHLD r32, r32, imm8 L: 20.25ns= 27.0c T: 20.25ns= 27.00c 256 X86 :SHLD r16, r16, cl L: 13.50ns= 18.0c T: 13.50ns= 18.00c 257 X86 :SHLD r32, r32, cl L: 13.50ns= 18.0c T: 13.50ns= 18.00c 259 X86 :SHRD r16, r16, imm8 L: 34.50ns= 46.0c T: 34.50ns= 46.00c 260 X86 :SHRD r32, r32, imm8 L: 27.75ns= 37.0c T: 27.75ns= 37.00c 262 X86 :SHRD r16, r16, cl L: 13.50ns= 18.0c T: 13.50ns= 18.00c 263 X86 :SHRD r32, r32, cl L: 13.50ns= 18.0c T: 13.50ns= 18.00c 265 X86 :ROL r8, 1 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 266 X86 :ROL r16, 1 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 267 X86 :ROL r32, 1 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 269 X86 :ROL r8, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 270 X86 :ROL r16, imm8 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 271 X86 :ROL r32, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 273 X86 :ROL r8, cl L: 0.75ns= 1.0c T: 0.75ns= 1.00c 274 X86 :ROL r16, cl L: 1.50ns= 2.0c T: 1.50ns= 2.00c 275 X86 :ROL r32, cl L: 0.75ns= 1.0c T: 0.75ns= 1.00c 277 X86 :ROR r8, 1 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 278 X86 :ROR r16, 1 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 279 X86 :ROR r32, 1 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 281 X86 :ROR r8, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 282 X86 :ROR r16, imm8 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 283 X86 :ROR r32, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 285 X86 :ROR r8, cl L: 0.75ns= 1.0c T: 0.75ns= 1.00c 286 X86 :ROR r16, cl L: 1.50ns= 2.0c T: 1.50ns= 2.00c 287 X86 :ROR r32, cl L: 0.75ns= 1.0c T: 0.75ns= 1.00c 289 X86 :RCL r8, 1 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 290 X86 :RCL r16, 1 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 291 X86 :RCL r32, 1 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 293 X86 :RCL r8, imm8 L: 22.50ns= 30.0c T: 22.50ns= 30.00c 294 X86 :RCL r16, imm8 L: 21.75ns= 29.0c T: 21.75ns= 29.00c 295 X86 :RCL r32, imm8 L: 21.75ns= 29.0c T: 21.75ns= 29.00c 297 X86 :RCL r8, cl L: 15.75ns= 21.0c T: 15.75ns= 21.00c 298 X86 :RCL r16, cl L: 15.00ns= 20.0c T: 15.00ns= 20.00c 299 X86 :RCL r32, cl L: 15.00ns= 20.0c T: 15.00ns= 20.00c 301 X86 :RCR r8, 1 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 302 X86 :RCR r16, 1 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 303 X86 :RCR r32, 1 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 305 X86 :RCR r8, imm8 L: 22.50ns= 30.0c T: 22.50ns= 30.00c 306 X86 :RCR r16, imm8 L: 21.75ns= 29.0c T: 21.75ns= 29.00c 307 X86 :RCR r32, imm8 L: 21.75ns= 29.0c T: 21.75ns= 29.00c 309 X86 :RCR r8, cl L: 15.75ns= 21.0c T: 15.75ns= 21.00c 310 X86 :RCR r16, cl L: 15.00ns= 20.0c T: 15.00ns= 20.00c 311 X86 :RCR r32, cl L: 15.00ns= 20.0c T: 15.00ns= 20.00c 313 X86 :BSF r16, r16 L: 9.75ns= 13.0c T: 9.75ns= 13.00c 314 X86 :BSF r32, r32 L: 9.75ns= 13.0c T: 9.75ns= 13.00c 316 X86 :BSR r16, r16 L: 10.50ns= 14.0c T: 10.50ns= 14.00c 317 X86 :BSR r32, r32 L: 10.50ns= 14.0c T: 10.50ns= 14.00c 319 X86 :BSWAP r32 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 327 X86 :IMUL r16, r16 L: 3.75ns= 5.0c T: 3.75ns= 5.00c 328 X86 :IMUL r32, r32 L: 5.25ns= 7.0c T: 5.25ns= 7.00c 330 X86 :IMUL r16, r16, imm8 L: 3.75ns= 5.0c T: 3.75ns= 5.00c 331 X86 :IMUL r32, r32, imm8 L: 5.25ns= 7.0c T: 5.25ns= 7.00c 333 X86 :IMUL r16, r16, imm16 L: 3.75ns= 5.0c T: 3.75ns= 5.00c 334 X86 :IMUL r32, r32, imm32 L: 5.25ns= 7.0c T: 5.25ns= 7.00c 336 X86 :IMUL r8 (ah) L: 3.75ns= 5.0c T: 3.00ns= 4.00c 337 X86 :IMUL r16 (dx) L: 3.75ns= 5.0c T: 3.75ns= 5.00c 338 X86 :IMUL r32 (edx) L: 5.25ns= 7.0c T: 5.25ns= 7.00c 340 X86 :MUL r8 (ah) L: 3.75ns= 5.0c T: 3.00ns= 4.00c 341 X86 :MUL r16 (dx) L: 3.75ns= 5.0c T: 3.75ns= 5.00c 342 X86 :MUL r32 (edx) L: 5.25ns= 7.0c T: 5.25ns= 7.00c 344 X86 :IMUL r8 (al) L: 3.00ns= 4.0c T: 3.00ns= 4.00c 345 X86 :IMUL r16 (ax) L: 3.75ns= 5.0c T: 3.75ns= 5.00c 346 X86 :IMUL r32 (eax) L: 5.25ns= 7.0c T: 5.25ns= 7.00c 348 X86 :MUL r8 (al) L: 3.00ns= 4.0c T: 3.00ns= 4.00c 349 X86 :MUL r16 (ax) L: 3.75ns= 5.0c T: 3.75ns= 5.00c 350 X86 :MUL r32 (eax) L: 5.25ns= 7.0c T: 5.25ns= 7.00c 352 X86 :IDIV r8 14/ 7b (full) L: 15.00ns= 20.0c T: 15.00ns= 20.00c 353 X86 :IDIV r8 12/ 7b ax upd L: 16.50ns= 22.0c T: 16.50ns= 22.00c 354 X86 :IDIV r8 7/ 7b ax upd L: 16.50ns= 22.0c T: 16.50ns= 22.00c 355 X86 :IDIV r8 4/ 7b ax upd L: [no true dep.] T: 16.50ns= 22.00c 356 X86 :IDIV r8 0/ 7b L: [no true dep.] T: 15.00ns= 20.00c 357 X86 :IDIV r8 11/ 4b ax upd L: 16.50ns= 22.0c T: 16.50ns= 22.00c 358 X86 :IDIV r8 8/ 4b ax upd L: [no true dep.] T: 16.50ns= 22.00c 359 X86 :IDIV r8 4/ 4b ax upd L: 16.50ns= 22.0c T: 16.50ns= 22.00c 360 X86 :IDIV r8 0/ 4b L: [no true dep.] T: 15.00ns= 20.00c 361 X86 :IDIV r8 2^12/2^6 ax upd L: [no true dep.] T: 16.50ns= 22.00c 362 X86 :IDIV r8 1/1 L: 15.00ns= 20.0c T: 15.00ns= 20.00c 363 X86 :IDIV r8 1/1 ax upd L: 16.50ns= 22.0c T: 16.50ns= 22.00c 364 X86 :IDIV r16 30/15b (full) L: 21.00ns= 28.0c T: 21.00ns= 28.00c 365 X86 :IDIV r16 24/15b ax upd L: 21.75ns= 29.0c T: 21.75ns= 29.00c 366 X86 :IDIV r16 15/15b ax upd L: 21.75ns= 29.0c T: 21.75ns= 29.00c 367 X86 :IDIV r16 8/15b ax/dx upd L: [no true dep.] T: 22.50ns= 30.00c 368 X86 :IDIV r16 0/15b L: [no true dep.] T: 21.00ns= 28.00c 369 X86 :IDIV r16 23/ 8b ax upd L: 21.75ns= 29.0c T: 21.75ns= 29.00c 370 X86 :IDIV r16 16/ 8b ax upd L: [no true dep.] T: 21.75ns= 29.00c 371 X86 :IDIV r16 8/ 8b ax upd L: 21.75ns= 29.0c T: 21.75ns= 29.00c 372 X86 :IDIV r16 0/ 8b L: [no true dep.] T: 21.00ns= 28.00c 373 X86 :IDIV r16 2^28/2^14 ax/dx L: [no true dep.] T: 22.50ns= 30.00c 374 X86 :IDIV r16 1/1 L: 21.00ns= 28.0c T: 21.00ns= 28.00c 375 X86 :IDIV r16 1/1 ax upd L: 21.75ns= 29.0c T: 21.75ns= 29.00c 376 X86 :IDIV r16 1/1 ax/dx upd L: 22.50ns= 30.0c T: 22.50ns= 30.00c 377 X86 :IDIV r32 62/31b (full) L: 38.25ns= 51.0c T: 38.25ns= 51.00c 378 X86 :IDIV r32 62/31b 0 rem. L: 38.25ns= 51.0c T: 38.25ns= 51.00c 379 X86 :IDIV r32 48/31b eax upd L: 39.00ns= 52.0c T: 39.00ns= 52.00c 380 X86 :IDIV r32 31/31b eax upd L: 39.00ns= 52.0c T: 39.00ns= 52.00c 381 X86 :IDIV r32 16/31b eax/edx L: [no true dep.] T: 39.75ns= 53.00c 382 X86 :IDIV r32 0/31b L: [no true dep.] T: 38.25ns= 51.00c 383 X86 :IDIV r32 47/16b eax upd L: 39.00ns= 52.0c T: 39.00ns= 52.00c 384 X86 :IDIV r32 32/16b eax upd L: [no true dep.] T: 39.00ns= 52.00c 385 X86 :IDIV r32 16/16b eax upd L: 39.00ns= 52.0c T: 39.00ns= 52.00c 386 X86 :IDIV r32 0/16b L: [no true dep.] T: 38.25ns= 51.00c 387 X86 :IDIV r32 2^60/2^30 eax/edx L: [no true dep.] T: 39.75ns= 53.00c 388 X86 :IDIV r32 1/1 L: 38.25ns= 51.0c T: 38.25ns= 51.00c 389 X86 :IDIV r32 1/1 eax upd L: 39.00ns= 52.0c T: 39.00ns= 52.00c 390 X86 :IDIV r32 1/1 eax/edx upd L: 39.75ns= 53.0c T: 39.75ns= 53.00c 405 X86 :DIV r8 16/ 8b (full) L: 15.00ns= 20.0c T: 15.00ns= 20.00c 406 X86 :DIV r8 12/ 8b ax upd L: 16.50ns= 22.0c T: 16.50ns= 22.00c 407 X86 :DIV r8 8/ 8b ax upd L: 16.50ns= 22.0c T: 16.50ns= 22.00c 408 X86 :DIV r8 4/ 8b ax upd L: [no true dep.] T: 16.50ns= 22.00c 409 X86 :DIV r8 0/ 8b L: [no true dep.] T: 15.00ns= 20.00c 410 X86 :DIV r8 12/ 4b ax upd L: 16.50ns= 22.0c T: 16.50ns= 22.00c 411 X86 :DIV r8 8/ 4b ax upd L: [no true dep.] T: 16.50ns= 22.00c 412 X86 :DIV r8 4/ 4b ax upd L: 16.50ns= 22.0c T: 16.50ns= 22.00c 413 X86 :DIV r8 0/ 4b L: [no true dep.] T: 15.00ns= 20.00c 414 X86 :DIV r8 2^14/2^7 ax upd L: [no true dep.] T: 16.50ns= 22.00c 415 X86 :DIV r8 1/1 L: 15.00ns= 20.0c T: 15.00ns= 20.00c 416 X86 :DIV r8 1/1 ax upd L: 16.50ns= 22.0c T: 16.50ns= 22.00c 417 X86 :DIV r16 32/16b (full) L: 21.00ns= 28.0c T: 21.00ns= 28.00c 418 X86 :DIV r16 30/15b 0 rem. L: 21.00ns= 28.0c T: 21.00ns= 28.00c 419 X86 :DIV r16 24/16b ax upd L: 21.75ns= 29.0c T: 21.75ns= 29.00c 420 X86 :DIV r16 16/16b ax upd L: 21.75ns= 29.0c T: 21.75ns= 29.00c 421 X86 :DIV r16 8/16b ax/dx upd L: [no true dep.] T: 22.50ns= 30.00c 422 X86 :DIV r16 0/16b L: [no true dep.] T: 21.00ns= 28.00c 423 X86 :DIV r16 24/ 8b ax upd L: 21.75ns= 29.0c T: 21.75ns= 29.00c 424 X86 :DIV r16 16/ 8b ax upd L: [no true dep.] T: 21.75ns= 29.00c 425 X86 :DIV r16 8/ 8b ax upd L: 21.75ns= 29.0c T: 21.75ns= 29.00c 426 X86 :DIV r16 0/ 8b L: [no true dep.] T: 21.00ns= 28.00c 427 X86 :DIV r16 1/1 L: 21.00ns= 28.0c T: 21.00ns= 28.00c 428 X86 :DIV r16 1/1 ax upd L: 21.75ns= 29.0c T: 21.75ns= 29.00c 429 X86 :DIV r16 1/1 ax/dx upd L: 22.50ns= 30.0c T: 22.50ns= 30.00c 430 X86 :DIV r32 64/32b (full) L: 38.25ns= 51.0c T: 38.25ns= 51.00c 431 X86 :DIV r32 62/31b 0 rem. L: 38.25ns= 51.0c T: 38.25ns= 51.00c 432 X86 :DIV r32 48/32b eax upd L: 39.00ns= 52.0c T: 39.00ns= 52.00c 433 X86 :DIV r32 32/32b eax upd L: 39.00ns= 52.0c T: 39.00ns= 52.00c 434 X86 :DIV r32 16/32b eax/edx L: [no true dep.] T: 39.75ns= 53.00c 435 X86 :DIV r32 0/32b L: [no true dep.] T: 38.25ns= 51.00c 436 X86 :DIV r32 48/16b eax upd L: 39.00ns= 52.0c T: 39.00ns= 52.00c 437 X86 :DIV r32 32/16b eax upd L: [no true dep.] T: 39.00ns= 52.00c 438 X86 :DIV r32 16/16b eax upd L: 39.00ns= 52.0c T: 39.00ns= 52.00c 439 X86 :DIV r32 0/16b L: [no true dep.] T: 38.25ns= 51.00c 440 X86 :DIV r32 2^62/2^31 eax/edx L: [no true dep.] T: 39.75ns= 53.00c 441 X86 :DIV r32 1/1 L: 38.25ns= 51.0c T: 38.25ns= 51.00c 442 X86 :DIV r32 1/1 eax upd L: 39.00ns= 52.0c T: 39.00ns= 52.00c 443 X86 :DIV r32 1/1 eax/edx upd L: 39.75ns= 53.0c T: 39.75ns= 53.00c 458 X86 :CBW L: 1.50ns= 2.0c T: 1.50ns= 2.00c 459 X86 :CWDE L: 0.75ns= 1.0c T: 0.75ns= 1.00c 461 X86 :CWD L: 1.50ns= 2.0c T: 1.50ns= 2.00c 462 X86 :CDQ L: 0.75ns= 1.0c T: 0.75ns= 1.00c 464 X86 :CLC L: 0.75ns= 1.0c T: 0.75ns= 1.00c 465 X86 :STC L: 0.75ns= 1.0c T: 0.75ns= 1.00c 466 X86 :CMC L: 3.75ns= 5.0c T: 3.75ns= 5.00c 467 X86 :CLD L: 0.75ns= 1.0c T: 0.75ns= 1.00c 468 X86 :STD L: 0.75ns= 1.0c T: 0.75ns= 1.00c 469 X86 :AAA L: 23.00ns= 30.7c T: 23.00ns= 30.67c 470 X86 :AAD L: 3.00ns= 4.0c T: 3.00ns= 4.00c 471 X86 :AAM L: 9.00ns= 12.0c T: 9.00ns= 12.00c 472 X86 :AAS L: 26.13ns= 34.8c T: 26.13ns= 34.83c 473 X86 :DAA L: 18.00ns= 24.0c T: 18.00ns= 24.00c 474 X86 :DAS L: 19.50ns= 26.0c T: 19.50ns= 26.00c 475 X86 :LAHF L: 18.00ns= 24.0c T: 18.00ns= 24.00c 476 X86 :SAHF L: 19.50ns= 26.0c T: 19.50ns= 26.00c 477 X86 :PUSHA L: [no true dep.] T: 6.75ns= 9.00c 478 X86 :POPA L: [no true dep.] T: 6.00ns= 8.00c 479 X86 :PUSHA + POPA L: 18.00ns= 24.0c T: 18.00ns= 24.00c 480 X86 :PUSHAD L: [no true dep.] T: 6.75ns= 9.00c 481 X86 :POPAD L: [no true dep.] T: 6.00ns= 8.00c 482 X86 :PUSHAD + POPAD L: 18.00ns= 24.0c T: 18.00ns= 24.00c 483 X86 :PUSH r16 L: [no true dep.] T: 1.50ns= 2.00c 484 X86 :POP r16 L: [no true dep.] T: 1.50ns= 2.00c 485 X86 :PUSH r16 + POP r16 L: 7.50ns= 10.0c T: 7.50ns= 10.00c 486 X86 :PUSH r32 L: [no true dep.] T: 0.75ns= 1.00c 487 X86 :POP r32 L: [no true dep.] T: 0.75ns= 1.00c 488 X86 :PUSH r32 + POP r32 L: 7.50ns= 10.0c T: 7.50ns= 10.00c 489 X86 :PUSH imm8 L: [no true dep.] T: 0.75ns= 1.00c 490 X86 :PUSH imm8 + POP r32 L: 7.50ns= 10.0c T: 7.50ns= 10.00c 491 X86 :PUSH imm32 L: [no true dep.] T: 0.75ns= 1.00c 492 X86 :PUSH imm32 + POP r32 L: 7.50ns= 10.0c T: 7.50ns= 10.00c 493 X86 :PUSH [m16] L: [no true dep.] T: 1.56ns= 2.08c 494 X86 :POP [m16] L: [no true dep.] T: 1.56ns= 2.08c 495 X86 :PUSH [m16] + POP [m16] L: 15.00ns= 20.0c T: 8.25ns= 11.00c 496 X86 :PUSH [m32] L: [no true dep.] T: 1.50ns= 2.00c 497 X86 :POP [m32] L: [no true dep.] T: 1.50ns= 2.00c 498 X86 :PUSH [m32] + POP [m32] L: 15.00ns= 20.0c T: 8.25ns= 11.00c 499 X86 :PUSHF L: [no true dep.] T: 1.50ns= 2.00c 501 X86 :PUSHF + POPF L: 8.63ns= 11.5c T: 8.63ns= 11.50c 502 X86 :PUSHFD L: [no true dep.] T: 1.50ns= 2.00c 503 X86 :POPFD L: [no true dep.] T: 1.50ns= 2.00c 504 X86 :PUSHFD + POPFD L: 8.63ns= 11.5c T: 8.63ns= 11.50c 505 X86 :CMPSB L: 2.25ns= 3.0c T: 2.25ns= 3.00c 506 X86 :CMPSW L: 2.25ns= 3.0c T: 2.63ns= 3.50c 507 X86 :CMPSD L: 2.25ns= 3.0c T: 13.81ns= 18.42c 509 X86 :REPE CMPSB BW in L1D: 0.67 B/c 887MiB/s 510 X86 :REPE CMPSW BW in L1D: 1.33 B/c 1771MiB/s 511 X86 :REPE CMPSD BW in L1D: 2.65 B/c 3529MiB/s 513 X86 :LODSB L: 0.75ns= 1.0c T: 0.75ns= 1.00c 514 X86 :LODSW L: 1.50ns= 2.0c T: 1.69ns= 2.25c 515 X86 :LODSD L: 0.75ns= 1.0c T: 12.81ns= 17.08c 517 X86 :REP LODSB BW in L1D: 1.00 B/c 1329MiB/s 518 X86 :REP LODSW BW in L1D: 1.99 B/c 2649MiB/s 519 X86 :REP LODSD BW in L1D: 3.95 B/c 5261MiB/s 521 X86 :STOSB L: 0.75ns= 1.0c T: 0.75ns= 1.00c 522 X86 :STOSW L: 1.50ns= 2.0c T: 1.63ns= 2.17c 523 X86 :STOSD L: 0.75ns= 1.0c T: 12.94ns= 17.25c 525 X86 :REP STOSB BW in L1D: 1.00 B/c 1329MiB/s 526 X86 :REP STOSW BW in L1D: 1.99 B/c 2650MiB/s 527 X86 :REP STOSD BW in L1D: 3.95 B/c 5268MiB/s 529 X86 :MOVSB L: 1.50ns= 2.0c T: 1.50ns= 2.00c 530 X86 :MOVSW L: 1.50ns= 2.0c T: 1.88ns= 2.50c 531 X86 :MOVSD L: 1.50ns= 2.0c T: 22.06ns= 29.42c 533 X86 :REP MOVSB BW in L1D: 1.00 B/c 1330MiB/s 534 X86 :REP MOVSW BW in L1D: 1.99 B/c 2652MiB/s 535 X86 :REP MOVSD BW in L1D: 3.97 B/c 5288MiB/s 537 X86 :SCASB L: 1.50ns= 2.0c T: 1.50ns= 2.00c 538 X86 :SCASW L: 1.50ns= 2.0c T: 1.88ns= 2.50c 539 X86 :SCASD L: 1.50ns= 2.0c T: 13.25ns= 17.67c 541 X86 :REPNE SCASB BW in L1D: 0.50 B/c 666MiB/s 542 X86 :REPNE SCASW BW in L1D: 1.00 B/c 1330MiB/s 543 X86 :REPNE SCASD BW in L1D: 1.99 B/c 2653MiB/s 545 X86 :XADD r8, r8 L: 9.00ns= 12.0c T: 9.00ns= 12.00c 546 X86 :XADD r16, r16 L: 6.75ns= 9.0c T: 6.75ns= 9.00c 547 X86 :XADD r32, r32 L: 6.75ns= 9.0c T: 6.75ns= 9.00c 549 X86 :CMPXCHG r8, r8 L: 12.00ns= 16.0c T: 12.00ns= 16.00c 550 X86 :CMPXCHG r16, r16 L: 12.00ns= 16.0c T: 12.00ns= 16.00c 551 X86 :CMPXCHG r32, r32 L: 12.00ns= 16.0c T: 12.00ns= 16.00c 553 CMPX8 :CMPXCHG8B L: 24.00ns= 32.0c T: 27.00ns= 36.00c 555 X86 :RDTSC L: [no true dep.] T: 20.25ns= 27.00c 556 X86 :CPUID (EAX = 0) L: 43.50ns= 58.0c T: 43.50ns= 58.00c 557 X86 :CPUID (EAX = 1) L: 118.75ns=158.3c T: 118.75ns=158.33c 569 X87 :FNOP L: [no true dep.] T: 16.50ns= 22.00c 570 X87 :FXCH st(i) L: 0.75ns= 1.0c T: 0.75ns= 1.00c 571 X87 :FCHS L: 0.75ns= 1.0c T: 0.75ns= 1.00c 572 X87 :FABS L: 0.75ns= 1.0c T: 0.75ns= 1.00c 573 X87 :FTST L: [no true dep.] T: 3.75ns= 5.00c 574 X87 :FXAM L: [no true dep.] T: 16.50ns= 22.00c 575 CMOV :FCMOVE st, st(i) L: 0.75ns= 1.0c T: 0.75ns= 1.00c 576 X87 :FADD st(i), st (st = 0.0) L: 5.25ns= 7.0c T: 0.81ns= 1.08c 577 X87 :FADD st(i), st L: 5.25ns= 7.0c T: 0.81ns= 1.08c 578 X87 :FADD st, st(i), FXCH st(i) L: 5.25ns= 7.0c T: 2.25ns= 3.00c 579 X87 :FMUL st(i), st (st = 0.0) L: 6.00ns= 8.0c T: 1.50ns= 2.00c 580 X87 :FMUL st(i), st L: 6.00ns= 8.0c T: 1.50ns= 2.00c 581 X87 :FMUL st, st(i), FXCH st(i) L: 6.00ns= 8.0c T: 2.44ns= 3.25c 582 X87 :FMUL + FADD st, st(i) L: 11.25ns= 15.0c T: [not enough reg] 583 X87 :FMUL st(2i) FADD st(2i+1) L: 6.00ns= 8.0c T: [not enough reg] 584 X87 :FDIV32 st(i), st L: 24.75ns= 33.0c T: 20.25ns= 27.00c 585 X87 :FDIV64 st(i), st L: 46.50ns= 62.0c T: 42.00ns= 56.00c 586 X87 :FDIV80 st(i), st L: 54.75ns= 73.0c T: 50.25ns= 67.00c 587 X87 :FDIV80 (0.0l/x) L: 9.00ns= 12.0c T: 4.50ns= 6.00c 588 X87 :FDIV80 (x/1.0l) L: 54.75ns= 73.0c T: 50.25ns= 67.00c 589 X87 :FDIV80 (x/2.0l) L: 54.75ns= 73.0c T: 50.25ns= 67.00c 590 X87 :FDIV80 (x/0.5l) L: 9.00ns= 12.0c T: 4.50ns= 6.00c 591 X87 :FSQRT32 st L: 24.75ns= 33.0c T: 20.25ns= 27.00c 592 X87 :FSQRT64 st L: 46.50ns= 62.0c T: 42.00ns= 56.00c 593 X87 :FSQRT80 st L: 54.75ns= 73.0c T: 50.25ns= 67.00c 594 X87 :FSQRT80 (0.0l) L: 9.00ns= 12.0c T: 4.50ns= 6.00c 595 X87 :FSQRT80 (1.0l) L: 9.75ns= 13.0c T: 5.25ns= 7.00c 596 X87 :FDECSTP L: [no true dep.] T: 0.75ns= 1.00c 597 X87 :FINCSTP L: [no true dep.] T: 0.75ns= 1.00c 598 X87 :FCOM st(i) L: [no true dep.] T: 1.13ns= 1.50c 599 CMOV :FCOMI st, st(i) L: [no true dep.] T: 12.00ns= 16.00c 600 X87 :FSIN80 (0.0) L: 65.25ns= 87.0c T: 66.00ns= 88.00c 601 X87 :FSIN80 (0.0) + FADD L: 66.00ns= 88.0c T: 66.75ns= 89.00c 602 X87 :FSIN80 (1.0) + FADD L: 505.63ns=674.2c T: 507.57ns=676.75c 603 X87 :FSIN80 (4Pi) + FADD L: 518.38ns=691.2c T: 520.45ns=693.92c 604 X87 :FSIN80 (2Pi) + FADD L: 518.38ns=691.2c T: 520.51ns=694.00c 605 X87 :FSIN80 (Pi) + FADD L: 520.64ns=694.2c T: 522.57ns=696.75c 606 X87 :FSIN80 (Pi/2) + FADD L: 507.82ns=677.1c T: 510.01ns=680.00c 607 X87 :FSIN80 (Pi/4) + FADD L: 515.26ns=687.0c T: 517.07ns=689.42c 608 X87 :FSIN80 (Pi/8) + FADD L: 515.38ns=687.2c T: 517.32ns=689.75c 609 X87 :FSIN80 (Pi/16) + FADD L: 515.38ns=687.2c T: 517.26ns=689.67c 610 X87 :FSIN80 (Pi/32) + FADD L: 515.32ns=687.1c T: 517.38ns=689.83c 611 X87 :FCOS80 (0.73908513...) L: 506.38ns=675.2c T: 508.13ns=677.50c 612 X87 :FCOS80 (0.73908513...)+FADD L: 507.13ns=676.2c T: 509.01ns=678.67c 613 X87 :FCOS80 (0.0) + FADD L: 68.25ns= 91.0c T: 69.00ns= 92.00c 614 X87 :FCOS80 (1.0) + FADD L: 514.63ns=686.2c T: 516.45ns=688.58c 615 X87 :FCOS80 (4Pi) + FADD L: 507.07ns=676.1c T: 509.13ns=678.83c 616 X87 :FCOS80 (2Pi) + FADD L: 507.07ns=676.1c T: 509.32ns=679.08c 617 X87 :FCOS80 (Pi) + FADD L: 507.07ns=676.1c T: 509.13ns=678.83c 618 X87 :FCOS80 (Pi/2) + FADD L: 519.89ns=693.2c T: 521.82ns=695.75c 619 X87 :FCOS80 (Pi/4) + FADD L: 507.13ns=676.2c T: 509.20ns=678.92c 620 X87 :FCOS80 (Pi/8) + FADD L: 507.13ns=676.2c T: 508.95ns=678.58c 621 X87 :FCOS80 (Pi/16) + FADD L: 507.13ns=676.2c T: 509.20ns=678.92c 622 X87 :FCOS80 (Pi/32) + FADD L: 507.07ns=676.1c T: 509.01ns=678.67c 623 MMX :EMMS L: 4.50ns= 6.0c T: 4.50ns= 6.00c 624 MMX :MOVD r32, mm L: [diff. reg. set] T: 9.00ns= 12.00c 625 MMX :MOVD mm, r32 L: [diff. reg. set] T: 6.75ns= 9.00c 626 MMX :MOVD r32, mm+MOVD mm, r32 L: 15.56ns= 20.8c T: 15.44ns= 20.58c 630 MMX :MOVD mm, [m32] L: [memory dep.] T: 0.81ns= 1.08c 631 MMX :MOVD [m32], mm L: [memory dep.] T: 1.38ns= 1.83c 632 MMX :MOVD mm,[m32]+MOVD [m32],mm L: 7.50ns= 10.0c T: 1.63ns= 2.17c 633 MMX :MOVQ mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 634 MMX :MOVQ mm, [m64] L: [memory dep.] T: 0.81ns= 1.08c 635 MMX :MOVQ [m64], mm L: [memory dep.] T: 1.38ns= 1.83c 636 MMX :MOVQ mm,[m64]+MOVQ [m64],mm L: 7.50ns= 10.0c T: 1.63ns= 2.17c 637 SSE :MOVNTQ [m64], mm L: [memory dep.] T: 1.83ns= 1.83c 638 SSE :PMOVMSKB r32, mm L: [diff. reg. set] T: 9.00ns= 12.00c 640 SSE :MASKMOVQ mm, mm L: [memory dep.] T: 7.17ns= 7.17c 641 MMX :PADDB mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 642 MMX :PADDW mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 643 MMX :PADDD mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 645 MMX :PADDSB mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 646 MMX :PADDSW mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 647 MMX :PADDUSB mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 648 MMX :PADDUSW mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 649 MMX :PSUBB mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 650 MMX :PSUBB mm_1, mm_2 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 651 MMX :PSUBW mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 652 MMX :PSUBW mm_1, mm_2 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 653 MMX :PSUBD mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 654 MMX :PSUBD mm_1, mm_2 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 657 MMX :PSUBSB mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 658 MMX :PSUBSB mm_1, mm_2 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 659 MMX :PSUBSW mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 660 MMX :PSUBSW mm_1, mm_2 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 661 MMX :PSUBUSB mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 662 MMX :PSUBUSB mm_1, mm_2 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 663 MMX :PSUBUSW mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 664 MMX :PSUBUSW mm_1, mm_2 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 665 MMX :PCMPEQB mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 666 MMX :PCMPEQB mm_1, mm_2 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 667 MMX :PCMPEQW mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 668 MMX :PCMPEQW mm_1, mm_2 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 669 MMX :PCMPEQD mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 670 MMX :PCMPEQD mm_1, mm_2 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 671 MMX :PCMPGTB mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 672 MMX :PCMPGTB mm_1, mm_2 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 673 MMX :PCMPGTW mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 674 MMX :PCMPGTW mm_1, mm_2 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 675 MMX :PCMPGTD mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 676 MMX :PCMPGTD mm_1, mm_2 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 677 MMX :PAND mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 678 MMX :PAND mm_1, mm_2 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 679 MMX :PANDN mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 680 MMX :PANDN mm_1, mm_2 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 681 MMX :POR mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 682 MMX :POR mm_1, mm_2 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 683 MMX :PXOR mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 684 MMX :PXOR mm_1, mm_2 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 685 MMX :PMULHW mm, mm L: 2.25ns= 3.0c T: 0.75ns= 1.00c 686 SSE :PMULHUW mm, mm L: 2.25ns= 3.0c T: 0.75ns= 1.00c 689 MMX :PMULLW mm, mm L: 2.25ns= 3.0c T: 0.75ns= 1.00c 692 MMX :PMADDWD mm, mm L: 2.25ns= 3.0c T: 0.75ns= 1.00c 693 MMX :PSLLW mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 694 MMX :PSLLW mm, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 695 MMX :PSLLD mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 696 MMX :PSLLD mm, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 697 MMX :PSLLQ mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 698 MMX :PSLLQ mm, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 699 MMX :PSRAW mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 700 MMX :PSRAW mm, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 701 MMX :PSRAD mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 702 MMX :PSRAD mm, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 703 MMX :PSRLW mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 704 MMX :PSRLW mm, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 705 MMX :PSRLD mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 706 MMX :PSRLD mm, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 707 MMX :PSRLQ mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 708 MMX :PSRLQ mm, imm8 L: 0.75ns= 1.0c T: 0.75ns= 1.00c 709 MMX :PUNPCKHBW mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 710 MMX :PUNPCKHWD mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 711 MMX :PUNPCKHDQ mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 712 MMX :PUNPCKLBW mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 713 MMX :PUNPCKLWD mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 714 MMX :PUNPCKLDQ mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 715 MMX :PACKSSWB mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 716 MMX :PACKUSWB mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 717 MMX :PACKSSDW mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 751 SSE :PAVGB mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 752 SSE :PAVGW mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 753 SSE :PEXTRW r32, mm, im8 L: [diff. reg. set] T: 9.00ns= 12.00c 754 SSE :PINSRW mm, r32, im8 L: [diff. reg. set] T: 6.75ns= 9.00c 755 SSE :PEXTRW + PINSRW r32 L: 15.56ns= 20.8c T: 15.50ns= 20.67c 759 SSE :PMAXSW mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 760 SSE :PMAXUB mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 761 SSE :PMINSW mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 762 SSE :PMINUB mm, mm L: 0.75ns= 1.0c T: 0.75ns= 1.00c 763 SSE :PSADBW mm, mm L: 3.00ns= 4.0c T: 1.50ns= 2.00c 764 SSE :PSHUFW mm, mm, im8 L: 2.25ns= 3.0c T: 2.25ns= 3.00c 765 SSE :PREFETCHNTA [mem] L: [memory dep.] T: 0.81ns= 1.08c 766 SSE :PREFETCHT0 [mem] L: [memory dep.] T: 0.81ns= 1.08c 767 SSE :PREFETCHT1 [mem] L: [memory dep.] T: 0.81ns= 1.08c 768 SSE :PREFETCHT2 [mem] L: [memory dep.] T: 0.81ns= 1.08c 769 SSE :SFENCE L: 1.25ns= 1.7c T: 1.25ns= 1.67c 786 SSE :MOVHLPS xmm, xmm L: 1.50ns= 2.0c T: 0.75ns= 1.00c 787 SSE :MOVHLPS xmm_1, xmm_2 L: 1.50ns= 2.0c T: 0.75ns= 1.00c 788 SSE :MOVSS xmm, xmm L: 1.50ns= 2.0c T: 1.50ns= 2.00c 789 SSE :MOVSS xmm, [m32] L: [memory dep.] T: 1.63ns= 2.17c 790 SSE :MOVSS [m32], xmm L: [memory dep.] T: 1.63ns= 2.17c 791 SSE :MOVSS LS pair L: 7.50ns= 10.0c T: 3.19ns= 4.25c 792 SSE :MOVLPS xmm, [m32] L: [memory dep.] T: 0.81ns= 1.08c 793 SSE :MOVLPS [m32], xmm L: [memory dep.] T: 1.38ns= 1.83c 794 SSE :MOVLPS LS pair L: 7.50ns= 10.0c T: 1.63ns= 2.17c 795 SSE :MOVHPS xmm, [m32] L: [memory dep.] T: 0.81ns= 1.08c 796 SSE :MOVHPS [m32], xmm L: [memory dep.] T: 1.38ns= 1.83c 797 SSE :MOVHPS LS pair L: 7.50ns= 10.0c T: 1.63ns= 2.17c 798 SSE :MOVAPS xmm, xmm L: 1.50ns= 2.0c T: 1.50ns= 2.00c 799 SSE :MOVAPS xmm, [m128] L: [memory dep.] T: 1.50ns= 2.00c 800 SSE :MOVAPS [m128], xmm L: [memory dep.] T: 1.63ns= 2.17c 801 SSE :MOVAPS LS pair L: 14.75ns= 19.7c T: 2.94ns= 3.92c 802 SSE :MOVUPS xmm, xmm L: 1.50ns= 2.0c T: 1.50ns= 2.00c 803 SSE :MOVUPS xmm, [m128] L: [memory dep.] T: 1.50ns= 2.00c 804 SSE :MOVUPS [m128], xmm L: [memory dep.] T: 2.81ns= 3.75c 805 SSE :MOVUPS aligned LS pair L: 9.94ns= 13.3c T: 3.00ns= 4.00c 806 SSE :MOVUPS xmm, [m128 + 4] L: [memory dep.] T: 9.94ns= 13.25c 807 SSE :MOVUPS [m128 + 4], xmm L: [memory dep.] T: 10.13ns= 13.50c 808 SSE :MOVUPS unaligned LS pair L: 18.38ns= 24.5c T: 14.50ns= 19.33c 810 SSE :MOVNTPS [m128], xmm L: [memory dep.] T: 2.33ns= 2.33c 811 SSE :MOVMSKPS r32, xmm L: [diff. reg. set] T: 9.00ns= 12.00c 812 SSE :UNPCKLPS xmm, xmm L: 2.25ns= 3.0c T: 1.50ns= 2.00c 813 SSE :UNPCKHPS xmm, xmm L: 2.25ns= 3.0c T: 1.50ns= 2.00c 814 SSE :SHUFPS xmm, xmm, imm8 L: 3.00ns= 4.0c T: 2.25ns= 3.00c 815 SSE :COMISS xmm, xmm L: [no true dep.] T: 15.00ns= 20.00c 816 SSE :UCOMISS xmm, xmm L: [no true dep.] T: 15.00ns= 20.00c 817 SSE :CMPSS xmm, xmm, imm8 L: 3.75ns= 5.0c T: 1.56ns= 2.08c 818 SSE :CMPPS xmm, xmm, imm8 L: 3.75ns= 5.0c T: 1.50ns= 2.00c 819 SSE :SUBSS xmm, xmm L: 3.75ns= 5.0c T: 1.50ns= 2.00c 820 SSE :SUBPS xmm, xmm L: 3.75ns= 5.0c T: 1.50ns= 2.00c 821 SSE :ADDSS xmm, xmm L: 3.75ns= 5.0c T: 1.50ns= 2.00c 822 SSE :ADDPS xmm, xmm L: 3.75ns= 5.0c T: 1.50ns= 2.00c 823 SSE :MULSS xmm, xmm L: 3.75ns= 5.0c T: 1.50ns= 2.00c 824 SSE :MULPS xmm, xmm L: 3.75ns= 5.0c T: 1.50ns= 2.00c 825 SSE :MULSS+ADDSS xmm, xmm L: 7.50ns= 10.0c T: [not enough reg] 826 SSE :MULPS+ADDPS xmm, xmm L: 7.50ns= 10.0c T: [not enough reg] 827 SSE :MULSS xm1,xm1 ADDSS xm2,xm2 L: 3.75ns= 5.0c T: [not enough reg] 828 SSE :MULPS xm1,xm1 ADDPS xm2,xm2 L: 3.75ns= 5.0c T: [not enough reg] 829 SSE :MAXSS xmm, xmm L: 3.75ns= 5.0c T: 1.50ns= 2.00c 830 SSE :MAXPS xmm, xmm L: 3.75ns= 5.0c T: 1.50ns= 2.00c 831 SSE :MINSS xmm, xmm L: 3.75ns= 5.0c T: 1.50ns= 2.00c 832 SSE :MINPS xmm, xmm L: 3.75ns= 5.0c T: 1.50ns= 2.00c 833 SSE :ANDNPS xmm, xmm L: 1.50ns= 2.0c T: 1.50ns= 2.00c 834 SSE :ANDNPS xmm_1, xmm_2 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 835 SSE :ANDPS xmm, xmm L: 1.50ns= 2.0c T: 1.50ns= 2.00c 836 SSE :ANDPS xmm_1, xmm_2 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 837 SSE :ORPS xmm, xmm L: 1.50ns= 2.0c T: 1.50ns= 2.00c 838 SSE :ORPS xmm_1, xmm_2 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 839 SSE :XORPS xmm, xmm L: 1.50ns= 2.0c T: 1.50ns= 2.00c 840 SSE :XORPS xmm_1, xmm_2 L: 1.50ns= 2.0c T: 1.50ns= 2.00c 841 SSE :DIVSS xmm, xmm L: 24.00ns= 32.0c T: 22.50ns= 30.00c 842 SSE :DIVSS (0.0f/x) L: 24.00ns= 32.0c T: 22.50ns= 30.00c 843 SSE :DIVSS (x/1.0f) L: 24.00ns= 32.0c T: 22.50ns= 30.00c 844 SSE :DIVSS (x/2.0f) L: 24.00ns= 32.0c T: 22.50ns= 30.00c 845 SSE :DIVSS (x/0.5f) L: 24.00ns= 32.0c T: 22.50ns= 30.00c 846 SSE :DIVPS xmm, xmm L: 45.00ns= 60.0c T: 45.00ns= 60.00c 847 SSE :DIVPS (0.0f/x) L: 45.00ns= 60.0c T: 45.00ns= 60.00c 848 SSE :DIVPS (x/1.0f) L: 45.00ns= 60.0c T: 45.00ns= 60.00c 849 SSE :DIVPS (x/2.0f) L: 45.00ns= 60.0c T: 45.00ns= 60.00c 850 SSE :DIVPS (x/0.5f) L: 45.00ns= 60.0c T: 45.00ns= 60.00c 851 SSE :SQRTSS xmm, xmm L: 24.75ns= 33.0c T: 23.25ns= 31.00c 852 SSE :SQRTSS (0.0f) L: 24.75ns= 33.0c T: 23.25ns= 31.00c 853 SSE :SQRTSS (1.0f) L: 24.75ns= 33.0c T: 23.25ns= 31.00c 854 SSE :SQRTPS xmm, xmm L: 46.50ns= 62.0c T: 46.50ns= 62.00c 855 SSE :SQRTPS (0.0f) L: 46.50ns= 62.0c T: 46.50ns= 62.00c 856 SSE :SQRTPS (1.0f) L: 46.50ns= 62.0c T: 46.50ns= 62.00c 857 SSE :RCPSS xmm, xmm L: 12.00ns= 16.0c T: 9.00ns= 12.00c 858 SSE :RCPPS xmm, xmm L: 18.75ns= 25.0c T: 16.50ns= 22.00c 859 SSE :RSQRTSS xmm, xmm L: 15.75ns= 21.0c T: 12.75ns= 17.00c 860 SSE :RSQRTPS xmm, xmm L: 22.50ns= 30.0c T: 20.25ns= 27.00c 861 SSE :CVTPI2PS xmm, mm L: [diff. reg. set] T: 9.00ns= 12.00c 862 SSE :CVTPS2PI mm, xmm L: [diff. reg. set] T: 12.75ns= 17.00c 863 SSE :CVTPS2PI + CVTPI2PS L: 25.13ns= 33.5c T: 21.75ns= 29.00c 864 SSE :CVTTPS2PI mm, xmm L: [diff. reg. set] T: 12.75ns= 17.00c 865 SSE :CVTTPS2PI + CVTPI2PS L: 25.13ns= 33.5c T: 21.75ns= 29.00c 866 SSE :CVTSI2SS xmm, r32 L: [diff. reg. set] T: 6.75ns= 9.00c 867 SSE :CVTSS2SI r32, xmm L: [diff. reg. set] T: 12.75ns= 17.00c 868 SSE :CVTSS2SI + CVTSI2SS r32 L: 22.25ns= 29.7c T: 18.75ns= 25.00c 869 SSE :CVTTSS2SI r32, xmm L: [diff. reg. set] T: 12.75ns= 17.00c 870 SSE :CVTTSS2SI + CVTSI2SS r32 L: 22.25ns= 29.7c T: 18.75ns= 25.00c 876 SSE :STMXCSR [mem] L: [memory dep.] T: 18.75ns= 25.00c 877 SSE :LDMXCSR [mem] L: [memory dep.] T: 49.88ns= 66.50c 878 SSE :STMXCSR + LDMXCSR L: 68.31ns= 91.1c T: 68.63ns= 91.50c BenchInstLat exit code: 0x0708 Running time: 407 seconds.