Apple Microarchitecture Research by Dougall Johnson

M1/A14 P-core (Firestorm): Overview | Base Instructions | SIMD and FP Instructions
M1/A14 E-core (Icestorm):  Overview | Base Instructions | SIMD and FP Instructions

STRB

Test 1: uops

Code:

  strb w0, [x6]
  mov x0, 0

(no loop instructions)

1000 unrolls and 1 iteration

Retires: 1.000

Issues: 1.000

Integer unit issues: 0.000

Load/store unit issues: 1.000

SIMD/FP unit issues: 0.000

retire uop (01)cycle (02)03l1d tlb fill (05)mmu table walk data (08)l2 tlb miss data (0b)1e1f223a3f46494f51schedule uop (52)schedule ldst uop (55)dispatch ldst uop (58)simd uops in schedulers (5a)606d6emap stall dispatch (70)map rewind (75)map stall (76)dispatch uop (78)map ldst uop (7d)map ldst uop inputs (80)8283flush restart other nonspec (84)85inst all (8c)inst int store (96)inst ldst (9b)l1d tlb access (a0)l1d tlb miss (a1)l1d cache miss st (a2)a4ld unit uop (a6)st unit uop (a7)l1d cache writeback (a8)a9acafbcl1d cache miss st nonspec (c0)l1d tlb miss nonspec (c1)c2cfd5map dispatch bubble (d6)ddfetch restart (de)e0? ldst retires (ed)f5f6f7f8fd
1005554400003005271616225100010001000224481554542355340110001000200054354311100110001000100004210100200210022420073116115391000543543543555543
1004542400003105271616125100010001000224481542542355340110001000200054254311100110001000100004204101610181002164414073116115511000555555555555543
10045424000031052716165251000100010002288405545543763411100010002000563554111001100010001015154400100200210022420073116115401000544544544544543
1004542400097005271616325100010001000224480542542355340010001000200054254211100110001000100004200100200210022420073116115391000543543543555544
10045424000031052716162251000100010002302805545543763411100010002000563554111001100010001014144200100200210022420073116115391000543565564555555
100455441110171153916161251000100010002244805425423553400100010002000542542111001100010001000144400101601161002164414173116115491000555552543543543
10045424000031052716160251000100010002247205545423553400100010002000542542111001100010001000144401101600181002164414173116115611000554554555553553
10045524111018015361616125100010001000224720542543356340010001000200055454211100110001000101404200100200210022420073116115391000553543543543543
10045424000330052716161251000100010002300405545633673421100010002000554552111001100010001015154412101600191002164414073116115511000555544544544544
1004543400003005281616125100010001000224720542542356340110001000200054254211100110001000101404210100200210022420073116115401000555555555555555

Test 2: throughput

Count: 8

Code:

  strb w0, [x6]
  strb w0, [x6]
  strb w0, [x6]
  strb w0, [x6]
  strb w0, [x6]
  strb w0, [x6]
  strb w0, [x6]
  strb w0, [x6]
  mov x7, x6
  mov x8, x6
  mov x9, x6
  mov x10, x6
  mov x11, x6
  mov x12, x6
  mov x13, x6

(fused SUBS/B.cc loop)

100 unrolls and 100 iterations

Result (median cycles for code divided by count): 0.5005

retire uop (01)cycle (02)03mmu table walk data (08)191e1f22233f46494f51schedule uop (52)schedule int uop (53)schedule ldst uop (55)dispatch int uop (56)dispatch ldst uop (58)int uops in schedulers (59)simd uops in schedulers (5a)60696a6d6emap stall dispatch (70)map rewind (75)map stall (76)dispatch uop (78)map int uop (7c)map ldst uop (7d)map int uop inputs (7f)map ldst uop inputs (80)8283flush restart other nonspec (84)85inst all (8c)inst branch (8d)inst branch taken (90)inst branch cond (94)inst int store (96)inst int alu (97)inst ldst (9b)9fl1d tlb access (a0)l1d cache miss st (a2)st unit uop (a7)l1d cache writeback (a8)acafbcl1d cache miss st nonspec (c0)cfd5map dispatch bubble (d6)ddfetch restart (de)e0? int output thing (e9)? ldst retires (ed)? int retires (ef)f5f6f7f8fd
80205400423000003104002716160258010010080000100800005001839424049369624004240051299643299988010020080000200160000400423199511802011009910080000100800001008000034800020880002234511021622400460800001004005040043400514004340043
80204400423000003104002716160258010010080000100800005001839424049369704004240042299553299988010020080000200160000400423199311802011009910080000100800001008000034800020280002234511021622400480800001004004340043400524004340043
8020440042300000310400251616025801001008000010080000500183942404936970400404004229955330007801002008000020016000040042319951180201100991008000010080000100800000800020880002234511021622400390800001004004340043400434005240043
80204400423000009004002716160258010010080000100800005001839424049369604004240040299553300078010020080000200160000400423199511802011009910080000100800001008000034800020280002234511021623400390800001004004340052400434005240043
80204400423000009104002716160258010010080000100800005001839424049369624004040042299553300088010020080000200160000400403199511802011009910080000100800001008000034800020580002034511021622400390800001004004340043400434004340051
80204400423000003104003416160258010010080000100800005001839424049369624004940049299633300008010020080000200160000400403200311802011009910080000100800001008000034800020280000234511021622400470800001004004340043400434004340043
80204400422990003104002516160258010010080000100800005001839424049369624004240042299553300098010020080000200160000400513199511802011009910080000100800001008000034800020280002234511021622400390800001004004340043400434004340051
8020440042300000910400270160258010010080000100800005001839808049369624004240040299553300008010020080000200160000400433199511802011009910080000100800001008000034800020580002234511021622400390800001004004340051400434005140043
80204400493000006104003616160258010010080000100800005001839424049369604004240051299553300008010020080000200160000400423199511802011009910080000100800001008000034800020580002234511021622400370800001004004340043400434004340051
8020440042300000910400271600258010010080000100800005001839424049369624004240042299553299988010020080000200160000400423199511802011009910080000100800001008000034800020280002234511021622400480800001004004340043400434004340043

1000 unrolls and 10 iterations

Result (median cycles for code divided by count): 0.5005

retire uop (01)cycle (02)03191e1f223f46494f51schedule uop (52)schedule int uop (53)schedule ldst uop (55)dispatch int uop (56)dispatch ldst uop (58)int uops in schedulers (59)simd uops in schedulers (5a)60696a6d6emap stall dispatch (70)map rewind (75)map stall (76)dispatch uop (78)map int uop (7c)map ldst uop (7d)map int uop inputs (7f)map ldst uop inputs (80)8283flush restart other nonspec (84)85inst all (8c)inst branch (8d)inst branch taken (90)inst branch cond (94)inst int store (96)inst int alu (97)inst ldst (9b)9fl1d tlb access (a0)l1d cache miss st (a2)st unit uop (a7)l1d cache writeback (a8)acafbcl1d cache miss st nonspec (c0)cfd5map dispatch bubble (d6)d9ddfetch restart (de)e0? ldst retires (ed)? int retires (ef)f5f6f7f8fd
800254004329900314002716161258001010800001080000501839448149369624004240042299753300228001020800002016000040042400421180021109108000010800001080000428000202800022425020181641774003980000104004140043400434004340043
800244004230000304002716161258001010800001080000501839448149369624004040042299773300228001020800002016000040202401901180021109108000010800001080000428000010800022425020151688174003980000104004140043400434004340043
80024400423000631400281616125800101080000108000050183944814936962400424004229977330022800102080000201600004004240042118002110910800001080000108000042800001280002242502061668174003980000104004340041400554004340043
800244004230000314002700025800101080000108000050183944814936962400424004229978330022800102080000201600004004040042118002110910800001080000108000042800020280002242502081667144004180000104004440041400414004340043
800244004229901383040027161602580010108000010800005018394481493696240042400422997533002080010208000020160000400424004211800211091080000108000010800004280000028000220502061608174003980000104004340044400444004340041
800244004230001383140025161662580010108000010800005018393521983696340040400402997533002280010208000020160000400424004211800211091080000108000010800000800020280002242502061601784003780000104004340041400434004340043
80024400423000105304002716161258001010800001080000501839352149369624019140042299773300238001020800002016000040042400421180021109108000010800001080000428000202800022425020616017174004080000104004140041400434004440041
80024400423000135314002716161258001010800001080000501839448149369624005440042299773300228001020800002016000040042400421180021109108000010800001080000428000202800020425020171606174003980000104004340043400414004340044
800244004230002643140025016125800101080000108000050183944814936962400404004229977330022800102080000201600004004240042118002110910800001080000108000042800020680002242502071608174003780000104004340041400444004340041
800244004329901953140025161602580010108000010800005018394481493696240054400422997733002280010208000020160000400434004011800211091080000108000010800004280000008000224250201616017174003980000104004440043400414004440041