Apple Microarchitecture Research by Dougall Johnson

M1/A14 P-core (Firestorm): Overview | Base Instructions | SIMD and FP Instructions
M1/A14 E-core (Icestorm):  Overview | Base Instructions | SIMD and FP Instructions

MOVN (64-bit)

Test 1: uops

Code:

  movn x0, #0x1234, lsl 16
  nop ; nop ; nop

(no loop instructions)

1000 unrolls and 1 iteration

Retires (minus 3 nops): 1.000

Issues: 0.000

Integer unit issues: 0.000

Load/store unit issues: 0.000

SIMD/FP unit issues: 0.000

retire uop (01)cycle (02)031e3f51606d6emap rewind (75)map stall (76)map int uop (7c)8283flush restart other nonspec (84)85inst all (8c)inst int alu (97)l1d cache writeback (a8)accfd5map dispatch bubble (d6)e0eb? int retires (ef)f5f6f7f8fd
40045284028525152852831010005289511400110000026011652501000529529529529529
40045284028525152852831010005289511400110004026001652501000529529529529529
400452841270525152852831010005289511400110000026001652501000529529529529529
40045284028525052852831010005289511400110000326001652501000529529529529529
40045284028525052852831010005289511400110000026001652501000529529529529529
40045284028525152852831010005289511400110000026001652501000529529529529529
40045284070525152852831010005289511400110000026001652501000529529529529529
40045284070525152852831010005289511400110000026001652501000529529529529529
40045284028525152852831010005289511400110000026001652501000529529529529529
40045283028525052852831010005289511400110000626001652501000529529529529529

Test 2: throughput

Count: 8

Code:

  movn x0, #0x1234, lsl 16
  movn x1, #0x1234, lsl 16
  movn x2, #0x1234, lsl 16
  movn x3, #0x1234, lsl 16
  movn x4, #0x1234, lsl 16
  movn x5, #0x1234, lsl 16
  movn x6, #0x1234, lsl 16
  movn x7, #0x1234, lsl 16

(fused SUBS/B.cc loop)

100 unrolls and 100 iterations

Result (median cycles for code divided by count): 0.1258

retire uop (01)cycle (02)03l2 tlb miss instruction (0a)18191e3f51schedule uop (52)schedule int uop (53)dispatch int uop (56)int uops in schedulers (59)60696a6d6emap rewind (75)map stall (76)dispatch uop (78)map int uop (7c)map int uop inputs (7f)8283flush restart other nonspec (84)85inst all (8c)inst branch (8d)inst branch taken (90)inst branch cond (94)inst int alu (97)9fld unit uop (a6)l1d cache writeback (a8)a9accfd5map dispatch bubble (d6)ddfetch restart (de)e0? int output thing (e9)? int retires (ef)f5f6f7f8fd
80204100927800001202560050600506005030025004969801006010060318600508020020010060351180201100991008010010000005112616221005759950801001006110061100611006110061
80204100607800012352560050600506005030025014969801006010060318600508020020010060351180201100991008010010000005134216221005759950801001006110061100611006110061
80204100607800003202560050600506005030025014969801006010060318600508020020010060351180201100991008010010000005112216221005759950801001006110061100611006110061
8020410060780000352560050600506005030025014969801006010060318600508020020010060351180201100991008010010000005112216221005759950801001006110061100611006110061
8020410060780000352560050600506005030025004969801006010060318600508020020010060351180201100991008010010000005112216221005759950801001006110061100611006110061
8020410060780000352560050600506005030025014969801006010060318600508020020010060351180201100991008010010000005112216221005759950801001006110061100611006110061
8020410060780000352560050600506005030025014969801006010060318600508020020010060351180201100991008010010000005112216221005759950801001006110061100611006110061
8020410060770000352560050600506005030025004969801006010060318600508020020010060351180201100991008010010000005112216221005759950801001006110061100611006110061
80204100607800001632560050600506005030025014969801006010060318600508020020010060351180201100991008010010000005112216221005759950801001006110061100611006110061
8020410060770000352560050600506005030025004969801006010060318600508020020010060351180201100991008010010000005112216221005759950801001006110061100611006110061

1000 unrolls and 10 iterations

Result (median cycles for code divided by count): 0.1255

retire uop (01)cycle (02)03l2 tlb miss data (0b)18191e3f51schedule uop (52)schedule int uop (53)dispatch int uop (56)int uops in schedulers (59)60696a6d6emap rewind (75)map stall (76)dispatch uop (78)map int uop (7c)map int uop inputs (7f)8283flush restart other nonspec (84)85inst all (8c)inst branch (8d)inst branch taken (90)inst branch cond (94)inst int alu (97)9fl1d tlb miss (a1)l1d cache writeback (a8)accfd5map dispatch bubble (d6)daddfetch restart (de)e0? int output thing (e9)? int retires (ef)f5f6f7f8fd
8002410044780001259425600046000460004300020049695810038100383186000480020201034435118002110910800101000050236160331003559994800101003910039100391003910039
800241003878000012325600046000460137300020049695810038100383186000480020201033935118002110910800101000050262160331003559994800101003910039100391003910039
80024100387800003525600046000460004300020049695810038100383186000480020201033435118002110910800101000050253160551003559994800101003910039100391003910039
80024100387800003525600046000460004300020049695810038100383186000480020201007735118002110910800101000050253160551003559994800101003910039100391003910039
800241003878000012625600046000460004300020149695810038100383186000480020201033435118002110910800101000050232160361003559994800101008710125100391003910039
80024100387812005625600046000460004300020149695810038100383186000480020201008135118002110910800101000050255160321003559994800101003910039100391003910039
800241003877000018525600046000460004300020149695810038100383186000480020201033735118002110910800101000050223160331003559994800101003910039100391003910039
800241003878000040925600046000460004300020049695810038100383186000480020201033735118002110910800101000050262160331003559994800101003910039100391003910039
800241003878000041125600046000460004300020049695810038100383186000480020201033435118002110910800101000350255160321003559994800101003910039100391003910039
800241003877000012525600046000460004300020149695810038100383186000480020201033435118002110910800101000050263160561003559994800101003910039100391003910039