Apple Microarchitecture Research by Dougall Johnson

M1/A14 P-core (Firestorm): Overview | Base Instructions | SIMD and FP Instructions
M1/A14 E-core (Icestorm):  Overview | Base Instructions | SIMD and FP Instructions

MOV (from sp, 64-bit)

Test 1: uops

Code:

  mov x0, sp

(no loop instructions)

1000 unrolls and 1 iteration

Retires: 1.000

Issues: 0.000

Integer unit issues: 0.000

Load/store unit issues: 0.000

SIMD/FP unit issues: 0.000

retire uop (01)cycle (02)033f51606d6emap rewind (75)map stall (76)map int uop (7c)map int uop inputs (7f)8283flush restart other nonspec (84)85inst all (8c)inst int alu (97)accfd5map dispatch bubble (d6)ddfetch restart (de)e0? int retires (ef)f5f6f7f8fd
1004152127150015215231010001000152351110011000074115111491000153153153153153
1004152127150015215231010001000152351110011000074115111491000153153153153153
1004152127150015215231010001000152351110011000074115111491000153153153153153
1004152127150015215231010001000152351110011000074115111491000153153153153153
1004152127150115215231010001000152351110011000074115111491000153153153153153
1004152127150015215231010001000152351110011000074115111491000153153153153153
1004152127150015215231010001000152351110011000074115111491000153153153153153
1004152127150015215231010001000152351110011000074115111491000153153153153153
1004152148150015215231010001000152351110011000074115111491000153153153153153
1004152127150015215231010001000152351110011000074115111491000153153153153153

Test 2: throughput

Count: 8

Code:

  mov x0, sp
  mov x1, sp
  mov x2, sp
  mov x3, sp
  mov x4, sp
  mov x5, sp
  mov x6, sp
  mov x7, sp

(fused SUBS/B.cc loop)

100 unrolls and 100 iterations

Result (median cycles for code divided by count): 0.1258

retire uop (01)cycle (02)03mmu table walk instruction (07)l2 tlb miss instruction (0a)0e18191e3f51schedule uop (52)schedule int uop (53)dispatch int uop (56)int uops in schedulers (59)60696a6d6erob full (74)map rewind (75)map stall (76)dispatch uop (78)map int uop (7c)map int uop inputs (7f)8283flush restart other nonspec (84)85inst all (8c)inst branch (8d)inst branch taken (90)inst branch cond (94)inst int alu (97)9fl1d cache writeback (a8)a9accfd5map dispatch bubble (d6)ddfetch restart (de)e0? int retires (ef)f5f6f7f8fd
802041006478010000639554100100100500049698010060100600318100802008020010060351180201100991008010010000051122162210057801001006110061100611006110061
802041006081000000639554100100100500049698010060100600318100802008020010060351180201100991008010010010051122162210057801001006110061100611006110061
802041006077000000359554100100100500049698010060100600318100802008020010060351180201100991008010010010051122162210057801001006110061100611006110061
802041006078000000359554100100100500049698010060100600318100802008020010060351180201100991008010010000051122162210057801001006110061100611006110061
802041006078000000359554100100100500049698010060100600318100802008020010060351180201100991008010010000051122162210057801001006110061100611006110061
802041006078000000359554100100100500049698010060100600318100802008020010060351180201100991008010010000051122162210057801001006110061100611006110061
802041006078000000359554100100100500049698010060100600318100802008020010060351180201100991008010010000051122162210057801001006110061100611006110061
802041006077000000359554100100100500049698010060100600318100802008020010060351180201100991008010010000051122162210057801001006110061100611012510061
8020410060780000001309554100100100500049698010060100600318100802008020010060351180201100991008010010000051122482210084801001012510061100611006110100
80204101337800011035955410010010150004969801006010060031810080200802001006035218020110099100801001000218051122162210057801001006110061100611006110061

1000 unrolls and 10 iterations

Result (median cycles for code divided by count): 0.1255

retire uop (01)cycle (02)03l2 tlb miss instruction (0a)1e3a3f51schedule uop (52)schedule int uop (53)dispatch int uop (56)int uops in schedulers (59)ldst uops in schedulers (5b)6061696a6d6emap rewind (75)map stall (76)dispatch uop (78)map int uop (7c)map int uop inputs (7f)8283flush restart other nonspec (84)85inst all (8c)inst branch (8d)inst branch taken (90)inst branch cond (94)inst int alu (97)9fl1d tlb access (a0)l1d tlb miss (a1)ld unit uop (a6)l1d cache writeback (a8)accfd0d2d5map dispatch bubble (d6)ddfetch restart (de)e0? int output thing (e9)? int retires (ef)f5f6f7f8fd
8002410043780120237998210101050010496958100381003831810800208002010038351180021109108001010000005030511316810100350800101003910039100391003910039
800241003878100326998210101050010496958100381003831810800208002010038351180021109108001010000005030541016910100350800101003910039100391003910039
80024100387800041998210101050010496958100381003831810800208002010038351180021109108001010000005030549161010100350800101003910039100391003910039
8002410038780002379982101010500104969581003810038318108002080020100383511800211091080010100001050290091699100350800101003910039100391003910039
800241003878000359982101010500054969581003810038318108002080020100383511800211091080010100000050310091699100350800101003910039100391003910039
800241003877000766998210101050005496958100381003831810800208002010038351180021109108001010000005029001016910100350800101003910039100391003910039
80024100387700035998210101050005496958100381003831810800208002010038351180021109108001010000005028541016109100350800101003910039100391003910039
8002410038780210359982101010500104969581003810038318108002080020100383511800211091080010100000050290010161010100350800101003910039100391003910039
80024100387800035998210101050010496958100381003831810800208002010038351180021109108001010000005029001016911100350800101003910039100391003910039
8002410038770003599821010105000549695810038100383181080020800201003835118002110910800101000000502954101698100350800101003910039100391003910039