Apple Microarchitecture Research by Dougall Johnson

M1/A14 P-core (Firestorm): Overview | Base Instructions | SIMD and FP Instructions
M1/A14 E-core (Icestorm):  Overview | Base Instructions | SIMD and FP Instructions

MOV (bitmask immediate, 64-bit)

Test 1: uops

Code:

  mov x0, #0xaaaaaaaaaaaaaaaa
  nop ; nop ; nop

(no loop instructions)

1000 unrolls and 1 iteration

Retires (minus 3 nops): 1.000

Issues: 0.000

Integer unit issues: 0.000

Load/store unit issues: 0.000

SIMD/FP unit issues: 0.000

retire uop (01)cycle (02)031e3f51606d6emap rewind (75)map stall (76)map int uop (7c)8283flush restart other nonspec (84)85inst all (8c)inst int alu (97)l1d cache writeback (a8)accfd2d5map dispatch bubble (d6)ddfetch restart (de)e0? int retires (ef)f5f6f7f8fd
4004528402852505285283101000528951140011000002640416445251000529529529529529
4004528402852505285283101000528951140011000002630316335251000529529529529529
4004528402852515285283101000528951140011000002640416335251000529529529529529
4004528402852505285283101000528951140011000002640416445251000529529529529529
4004528403552505285283101000528951140011000002640416445251000529529529529529
4004528602852515285283101000528951140011000002640316445251000529529529529529
4004528402852515285283101000528951140011000002640416445251000529529529529529
4004528402852505285283101000528951140011000002640416435251000529529529529529
4004528402852515285283101000528951140011000002640416445251000529529529529529
4004528402852515285283101000528951140011000002640416445251000529529529529529

Test 2: throughput

Count: 8

Code:

  mov x0, #0xaaaaaaaaaaaaaaaa
  mov x1, #0xaaaaaaaaaaaaaaaa
  mov x2, #0xaaaaaaaaaaaaaaaa
  mov x3, #0xaaaaaaaaaaaaaaaa
  mov x4, #0xaaaaaaaaaaaaaaaa
  mov x5, #0xaaaaaaaaaaaaaaaa
  mov x6, #0xaaaaaaaaaaaaaaaa
  mov x7, #0xaaaaaaaaaaaaaaaa

(fused SUBS/B.cc loop)

100 unrolls and 100 iterations

Result (median cycles for code divided by count): 0.1258

retire uop (01)cycle (02)031e3f51schedule uop (52)schedule int uop (53)dispatch int uop (56)int uops in schedulers (59)5f60696a6d6emap stall dispatch (70)map rewind (75)map stall (76)dispatch uop (78)map int uop (7c)map int uop inputs (7f)8283flush restart other nonspec (84)85inst all (8c)inst branch (8d)inst branch taken (90)inst branch cond (94)inst int alu (97)9fl1d cache writeback (a8)accfd5map dispatch bubble (d6)ddfetch restart (de)e0? int output thing (e9)? int retires (ef)f5f6f7f8fd
80204100647704152560050600506005030025000496980100601006003186005080200200100603511802011009910080100100105113316331005759950801001006110061100611006110061
8020410060770352560050600506005030025000496980100601006003186005080200200100603511802011009910080100100105113316331005759950801001006110061100611006110061
80204100607812352560050600506005030025000496980100601006003186005080200200100603511802011009910080100100165113316331005759950801001006110061100611006110061
8020410060770352560050600506005030025000496980100601006003186005080200200100603511802011009910080100100005113316331005759950801001006110061100611006110061
8020410060780352560050600506005030025000496980100601006003186005080200200100603511802011009910080100100035113316331005759950801001006110061100611006110061
80204100609806192560050600506005030025000496980100601006003186005080200200100603511802011009910080100100005113316331005759950801001006110061100611006110061
8020410060780352560050600506005030025000496980100601006003186005080200200100603511802011009910080100100005113316331005759950801001006110061100611006110061
8020410060780352560050600506005030025000496980100601006003186005080200200100603511802011009910080100100005113316331005759950801001006110061100611006110061
8020410060780352560050600506005030025000496980100601006003186005080200200100603511802011009910080100100005113316331005759950801001006110061100611006110061
80204100607806052560050600506005030025000496980100601006003186005080200200100603511802011009910080100100005113316331005759950801001006110061100611006110061

1000 unrolls and 10 iterations

Result (median cycles for code divided by count): 0.1255

retire uop (01)cycle (02)03mmu table walk instruction (07)1e3f51schedule uop (52)schedule int uop (53)dispatch int uop (56)int uops in schedulers (59)60696a6d6emap rewind (75)map stall (76)dispatch uop (78)map int uop (7c)map int uop inputs (7f)8283flush restart other nonspec (84)85inst all (8c)inst branch (8d)inst branch taken (90)inst branch cond (94)inst int alu (97)9fl1d cache writeback (a8)accfd5map dispatch bubble (d6)ddfetch restart (de)e0? int output thing (e9)? int retires (ef)f5f6f7f8fd
8002410054771098256000460004600043000201496958100381003831860004800202010038351180021109108001010005021116111003559994800101003910039100391003910039
8002410038780035256000460004600043000200496958100381003831860004800202010038351180021109108001010105021116111003559994800101003910039100391003910039
8002410038780335256000460004600043000200496958100381003831860004800202010038351180021109108001010005021116111003559994800101003910039100391003910039
80024100387800352560004600046000430002004969581003810038317160004800202010038351180021109108001010005021216111003559994800101003910039100391003910039
8002410038770063256000460004600043000200496958100381003831860004800202010038351180021109108001010005021116111003559994800101003910039100391003910039
80024100387800503256000460004600043000200496958100381003831860004800202010038351180021109108001010005021116111003559994800101003910039100391003910039
8002410038800056256000460004600043000201496958100381003831860004800202010038351180021109108001010005021116111003559994800101003910039100391003910039
8002410038780035256000460004600043000200496958100381003831860004800202010038351180021109108001010005021116111003559994800101003910039100391003910039
8002410038780056256000460004600043000200496958100381003831860004800202010038351180021109108001010005021116111003559994800101003910039100391003910039
8002410038780035256000460004600043000201496958100381003831860004800202010038351180021109108001010005021116111003559994800101003910039100391003910039