# ge25519_dbl_p1p1.S
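# Doubling of a ge25519 point, producing a result in P1P1 (completed)
# coordinates.  This file is qhasm-generated x86-64 assembly: each
# instruction is preceded by its qhasm source line ("# qhasm:") and, in
# most cases, two renderings of the assembly ("# asm 1:" with symbolic
# qhasm register numbers, "# asm 2:" with the concrete machine registers).
#
# Field arithmetic is over GF(2^255 - 19), with elements stored as four
# 64-bit limbs (32 bytes).  A squaring first builds the full 512-bit
# result in eight limbs, then folds the upper four limbs back into the
# lower four by multiplying by 38, using 2^256 = 2*19 = 38 (mod 2^255 - 19).
#
# Summary (inferred from the qhasm annotations below): the input point pp
# appears to hold X1 at byte offset 0, Y1 at offset 32, and Z1 at offset
# 64; the first part of the routine computes a = X1^2, b = Y1^2, and
# c = Z1^2, spilling each result to the stack for the later doubling steps.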

# qhasm: int64 rp
# qhasm: int64 pp
# qhasm: input rp
# qhasm: input pp
# qhasm: int64 a0
# qhasm: int64 a1
# qhasm: int64 a2
# qhasm: int64 a3
# qhasm: stack64 a0_stack
# qhasm: stack64 a1_stack
# qhasm: stack64 a2_stack
# qhasm: stack64 a3_stack
# qhasm: int64 b0
# qhasm: int64 b1
# qhasm: int64 b2
# qhasm: int64 b3
# qhasm: stack64 b0_stack
# qhasm: stack64 b1_stack
# qhasm: stack64 b2_stack
# qhasm: stack64 b3_stack
# qhasm: int64 c0
# qhasm: int64 c1
# qhasm: int64 c2
# qhasm: int64 c3
# qhasm: stack64 c0_stack
# qhasm: stack64 c1_stack
# qhasm: stack64 c2_stack
# qhasm: stack64 c3_stack
# qhasm: int64 d0
# qhasm: int64 d1
# qhasm: int64 d2
# qhasm: int64 d3
# qhasm: stack64 d0_stack
# qhasm: stack64 d1_stack
# qhasm: stack64 d2_stack
# qhasm: stack64 d3_stack
# qhasm: int64 e0
# qhasm: int64 e1
# qhasm: int64 e2
# qhasm: int64 e3
# qhasm: stack64 e0_stack
# qhasm: stack64 e1_stack
# qhasm: stack64 e2_stack
# qhasm: stack64 e3_stack
# qhasm: int64 rx0
# qhasm: int64 rx1
# qhasm: int64 rx2
# qhasm: int64 rx3
# qhasm: stack64 rx0_stack
# qhasm: stack64 rx1_stack
# qhasm: stack64 rx2_stack
# qhasm: stack64 rx3_stack
# qhasm: int64 ry0
# qhasm: int64 ry1
# qhasm: int64 ry2
# qhasm: int64 ry3
# qhasm: int64 ry4
# qhasm: int64 rz0
# qhasm: int64 rz1
# qhasm: int64 rz2
# qhasm: int64 rz3
# qhasm: int64 rt0
# qhasm: int64 rt1
# qhasm: int64 rt2
# qhasm: int64 rt3
# qhasm: int64 mulr4
# qhasm: int64 mulr5
# qhasm: int64 mulr6
# qhasm: int64 mulr7
# qhasm: int64 mulr8
# qhasm: int64 mulrax
# qhasm: int64 mulrdx
# qhasm: int64 mulx0
# qhasm: int64 mulx1
# qhasm: int64 mulx2
# qhasm: int64 mulx3
# qhasm: int64 mulc
# qhasm: int64 mulzero
# qhasm: int64 muli38
# qhasm: int64 squarer4
# qhasm: int64 squarer5
# qhasm: int64 squarer6
# qhasm: int64 squarer7
# qhasm: int64 squarer8
# qhasm: int64 squarerax
# qhasm: int64 squarerdx
# qhasm: int64 squaret1
# qhasm: int64 squaret2
# qhasm: int64 squaret3
# qhasm: int64 squarec
# qhasm: int64 squarezero
# qhasm: int64 squarei38
# qhasm: int64 addt0
# qhasm: int64 addt1
# qhasm: int64 subt0
# qhasm: int64 subt1
# qhasm: int64 caller1
# qhasm: int64 caller2
# qhasm: int64 caller3
# qhasm: int64 caller4
# qhasm: int64 caller5
# qhasm: int64 caller6
# qhasm: int64 caller7
# qhasm: caller caller1
# qhasm: caller caller2
# qhasm: caller caller3
# qhasm: caller caller4
# qhasm: caller caller5
# qhasm: caller caller6
# qhasm: caller caller7
# qhasm: stack64 caller1_stack
# qhasm: stack64 caller2_stack
# qhasm: stack64 caller3_stack
# qhasm: stack64 caller4_stack
# qhasm: stack64 caller5_stack
# qhasm: stack64 caller6_stack
# qhasm: stack64 caller7_stack
# qhasm: enter CRYPTO_NAMESPACE(ge25519_dbl_p1p1)
.text
.p2align 5
.globl _CRYPTO_NAMESPACE(ge25519_dbl_p1p1)
.globl CRYPTO_NAMESPACE(ge25519_dbl_p1p1)
_CRYPTO_NAMESPACE(ge25519_dbl_p1p1):
CRYPTO_NAMESPACE(ge25519_dbl_p1p1):
mov %rsp,%r11
and $31,%r11
add $192,%r11
sub %r11,%rsp
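# Round the stack pointer down to a 32-byte boundary and reserve 192
# bytes of scratch space; %r11 holds the adjustment and is spilled as
# caller1_stack below, presumably so the adjustment can be undone on
# return.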
# qhasm: caller1_stack = caller1
# asm 1: movq <caller1=int64#9,>caller1_stack=stack64#1
# asm 2: movq <caller1=%r11,>caller1_stack=0(%rsp)
movq %r11,0(%rsp)
# qhasm: caller2_stack = caller2
# asm 1: movq <caller2=int64#10,>caller2_stack=stack64#2
# asm 2: movq <caller2=%r12,>caller2_stack=8(%rsp)
movq %r12,8(%rsp)
# qhasm: caller3_stack = caller3
# asm 1: movq <caller3=int64#11,>caller3_stack=stack64#3
# asm 2: movq <caller3=%r13,>caller3_stack=16(%rsp)
movq %r13,16(%rsp)
# qhasm: caller4_stack = caller4
# asm 1: movq <caller4=int64#12,>caller4_stack=stack64#4
# asm 2: movq <caller4=%r14,>caller4_stack=24(%rsp)
movq %r14,24(%rsp)
# qhasm: caller5_stack = caller5
# asm 1: movq <caller5=int64#13,>caller5_stack=stack64#5
# asm 2: movq <caller5=%r15,>caller5_stack=32(%rsp)
movq %r15,32(%rsp)
# qhasm: caller6_stack = caller6
# asm 1: movq <caller6=int64#14,>caller6_stack=stack64#6
# asm 2: movq <caller6=%rbx,>caller6_stack=40(%rsp)
movq %rbx,40(%rsp)
# qhasm: caller7_stack = caller7
# asm 1: movq <caller7=int64#15,>caller7_stack=stack64#7
# asm 2: movq <caller7=%rbp,>caller7_stack=48(%rsp)
movq %rbp,48(%rsp)
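# First field squaring: a = (bytes pp+0..pp+31)^2, i.e. X1^2 under the
# layout noted at the top of the file.  The cross products limb_i*limb_j
# (i > j) are accumulated into a1..a3 and squarer4..squarer7, doubled,
# and then the diagonal squares limb_i^2 are added in.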
# qhasm: squarer7 = 0
# asm 1: mov $0,>squarer7=int64#4
# asm 2: mov $0,>squarer7=%rcx
mov $0,%rcx
# qhasm: squarerax = *(uint64 *)(pp + 8)
# asm 1: movq 8(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 8(<pp=%rsi),>squarerax=%rax
movq 8(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 0)
# asm 1: mulq 0(<pp=int64#2)
# asm 2: mulq 0(<pp=%rsi)
mulq 0(%rsi)
# qhasm: a1 = squarerax
# asm 1: mov <squarerax=int64#7,>a1=int64#5
# asm 2: mov <squarerax=%rax,>a1=%r8
mov %rax,%r8
# qhasm: a2 = squarerdx
# asm 1: mov <squarerdx=int64#3,>a2=int64#6
# asm 2: mov <squarerdx=%rdx,>a2=%r9
mov %rdx,%r9
# qhasm: squarerax = *(uint64 *)(pp + 16)
# asm 1: movq 16(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 16(<pp=%rsi),>squarerax=%rax
movq 16(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 8)
# asm 1: mulq 8(<pp=int64#2)
# asm 2: mulq 8(<pp=%rsi)
mulq 8(%rsi)
# qhasm: a3 = squarerax
# asm 1: mov <squarerax=int64#7,>a3=int64#8
# asm 2: mov <squarerax=%rax,>a3=%r10
mov %rax,%r10
# qhasm: squarer4 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squarer4=int64#9
# asm 2: mov <squarerdx=%rdx,>squarer4=%r11
mov %rdx,%r11
# qhasm: squarerax = *(uint64 *)(pp + 24)
# asm 1: movq 24(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 24(<pp=%rsi),>squarerax=%rax
movq 24(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 16)
# asm 1: mulq 16(<pp=int64#2)
# asm 2: mulq 16(<pp=%rsi)
mulq 16(%rsi)
# qhasm: squarer5 = squarerax
# asm 1: mov <squarerax=int64#7,>squarer5=int64#10
# asm 2: mov <squarerax=%rax,>squarer5=%r12
mov %rax,%r12
# qhasm: squarer6 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squarer6=int64#11
# asm 2: mov <squarerdx=%rdx,>squarer6=%r13
mov %rdx,%r13
# qhasm: squarerax = *(uint64 *)(pp + 16)
# asm 1: movq 16(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 16(<pp=%rsi),>squarerax=%rax
movq 16(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 0)
# asm 1: mulq 0(<pp=int64#2)
# asm 2: mulq 0(<pp=%rsi)
mulq 0(%rsi)
# qhasm: carry? a2 += squarerax
# asm 1: add <squarerax=int64#7,<a2=int64#6
# asm 2: add <squarerax=%rax,<a2=%r9
add %rax,%r9
# qhasm: carry? a3 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<a3=int64#8
# asm 2: adc <squarerdx=%rdx,<a3=%r10
adc %rdx,%r10
# qhasm: squarer4 += 0 + carry
# asm 1: adc $0,<squarer4=int64#9
# asm 2: adc $0,<squarer4=%r11
adc $0,%r11
# qhasm: squarerax = *(uint64 *)(pp + 24)
# asm 1: movq 24(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 24(<pp=%rsi),>squarerax=%rax
movq 24(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 8)
# asm 1: mulq 8(<pp=int64#2)
# asm 2: mulq 8(<pp=%rsi)
mulq 8(%rsi)
# qhasm: carry? squarer4 += squarerax
# asm 1: add <squarerax=int64#7,<squarer4=int64#9
# asm 2: add <squarerax=%rax,<squarer4=%r11
add %rax,%r11
# qhasm: carry? squarer5 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer5=int64#10
# asm 2: adc <squarerdx=%rdx,<squarer5=%r12
adc %rdx,%r12
# qhasm: squarer6 += 0 + carry
# asm 1: adc $0,<squarer6=int64#11
# asm 2: adc $0,<squarer6=%r13
adc $0,%r13
# qhasm: squarerax = *(uint64 *)(pp + 24)
# asm 1: movq 24(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 24(<pp=%rsi),>squarerax=%rax
movq 24(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 0)
# asm 1: mulq 0(<pp=int64#2)
# asm 2: mulq 0(<pp=%rsi)
mulq 0(%rsi)
# qhasm: carry? a3 += squarerax
# asm 1: add <squarerax=int64#7,<a3=int64#8
# asm 2: add <squarerax=%rax,<a3=%r10
add %rax,%r10
# qhasm: carry? squarer4 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer4=int64#9
# asm 2: adc <squarerdx=%rdx,<squarer4=%r11
adc %rdx,%r11
# qhasm: carry? squarer5 += 0 + carry
# asm 1: adc $0,<squarer5=int64#10
# asm 2: adc $0,<squarer5=%r12
adc $0,%r12
# qhasm: carry? squarer6 += 0 + carry
# asm 1: adc $0,<squarer6=int64#11
# asm 2: adc $0,<squarer6=%r13
adc $0,%r13
# qhasm: squarer7 += 0 + carry
# asm 1: adc $0,<squarer7=int64#4
# asm 2: adc $0,<squarer7=%rcx
adc $0,%rcx
# qhasm: carry? a1 += a1
# asm 1: add <a1=int64#5,<a1=int64#5
# asm 2: add <a1=%r8,<a1=%r8
add %r8,%r8
# qhasm: carry? a2 += a2 + carry
# asm 1: adc <a2=int64#6,<a2=int64#6
# asm 2: adc <a2=%r9,<a2=%r9
adc %r9,%r9
# qhasm: carry? a3 += a3 + carry
# asm 1: adc <a3=int64#8,<a3=int64#8
# asm 2: adc <a3=%r10,<a3=%r10
adc %r10,%r10
# qhasm: carry? squarer4 += squarer4 + carry
# asm 1: adc <squarer4=int64#9,<squarer4=int64#9
# asm 2: adc <squarer4=%r11,<squarer4=%r11
adc %r11,%r11
# qhasm: carry? squarer5 += squarer5 + carry
# asm 1: adc <squarer5=int64#10,<squarer5=int64#10
# asm 2: adc <squarer5=%r12,<squarer5=%r12
adc %r12,%r12
# qhasm: carry? squarer6 += squarer6 + carry
# asm 1: adc <squarer6=int64#11,<squarer6=int64#11
# asm 2: adc <squarer6=%r13,<squarer6=%r13
adc %r13,%r13
# qhasm: squarer7 += squarer7 + carry
# asm 1: adc <squarer7=int64#4,<squarer7=int64#4
# asm 2: adc <squarer7=%rcx,<squarer7=%rcx
adc %rcx,%rcx
# qhasm: squarerax = *(uint64 *)(pp + 0)
# asm 1: movq 0(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 0(<pp=%rsi),>squarerax=%rax
movq 0(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 0)
# asm 1: mulq 0(<pp=int64#2)
# asm 2: mulq 0(<pp=%rsi)
mulq 0(%rsi)
# qhasm: a0 = squarerax
# asm 1: mov <squarerax=int64#7,>a0=int64#12
# asm 2: mov <squarerax=%rax,>a0=%r14
mov %rax,%r14
# qhasm: squaret1 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squaret1=int64#13
# asm 2: mov <squarerdx=%rdx,>squaret1=%r15
mov %rdx,%r15
# qhasm: squarerax = *(uint64 *)(pp + 8)
# asm 1: movq 8(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 8(<pp=%rsi),>squarerax=%rax
movq 8(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 8)
# asm 1: mulq 8(<pp=int64#2)
# asm 2: mulq 8(<pp=%rsi)
mulq 8(%rsi)
# qhasm: squaret2 = squarerax
# asm 1: mov <squarerax=int64#7,>squaret2=int64#14
# asm 2: mov <squarerax=%rax,>squaret2=%rbx
mov %rax,%rbx
# qhasm: squaret3 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squaret3=int64#15
# asm 2: mov <squarerdx=%rdx,>squaret3=%rbp
mov %rdx,%rbp
# qhasm: squarerax = *(uint64 *)(pp + 16)
# asm 1: movq 16(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 16(<pp=%rsi),>squarerax=%rax
movq 16(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 16)
# asm 1: mulq 16(<pp=int64#2)
# asm 2: mulq 16(<pp=%rsi)
mulq 16(%rsi)
# qhasm: carry? a1 += squaret1
# asm 1: add <squaret1=int64#13,<a1=int64#5
# asm 2: add <squaret1=%r15,<a1=%r8
add %r15,%r8
# qhasm: carry? a2 += squaret2 + carry
# asm 1: adc <squaret2=int64#14,<a2=int64#6
# asm 2: adc <squaret2=%rbx,<a2=%r9
adc %rbx,%r9
# qhasm: carry? a3 += squaret3 + carry
# asm 1: adc <squaret3=int64#15,<a3=int64#8
# asm 2: adc <squaret3=%rbp,<a3=%r10
adc %rbp,%r10
# qhasm: carry? squarer4 += squarerax + carry
# asm 1: adc <squarerax=int64#7,<squarer4=int64#9
# asm 2: adc <squarerax=%rax,<squarer4=%r11
adc %rax,%r11
# qhasm: carry? squarer5 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer5=int64#10
# asm 2: adc <squarerdx=%rdx,<squarer5=%r12
adc %rdx,%r12
# qhasm: carry? squarer6 += 0 + carry
# asm 1: adc $0,<squarer6=int64#11
# asm 2: adc $0,<squarer6=%r13
adc $0,%r13
# qhasm: squarer7 += 0 + carry
# asm 1: adc $0,<squarer7=int64#4
# asm 2: adc $0,<squarer7=%rcx
adc $0,%rcx
# qhasm: squarerax = *(uint64 *)(pp + 24)
# asm 1: movq 24(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 24(<pp=%rsi),>squarerax=%rax
movq 24(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 24)
# asm 1: mulq 24(<pp=int64#2)
# asm 2: mulq 24(<pp=%rsi)
mulq 24(%rsi)
# qhasm: carry? squarer6 += squarerax
# asm 1: add <squarerax=int64#7,<squarer6=int64#11
# asm 2: add <squarerax=%rax,<squarer6=%r13
add %rax,%r13
# qhasm: squarer7 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer7=int64#4
# asm 2: adc <squarerdx=%rdx,<squarer7=%rcx
adc %rdx,%rcx
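# Reduce the 512-bit square: multiply the high limbs squarer4..squarer7
# by 38 and fold them into a0..a3, since 2^256 = 2*19 = 38 (mod 2^255 - 19);
# the final carry limb (squarer8) is folded back the same way.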
# qhasm: squarerax = squarer4
# asm 1: mov <squarer4=int64#9,>squarerax=int64#7
# asm 2: mov <squarer4=%r11,>squarerax=%rax
mov %r11,%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)&CRYPTO_NAMESPACE(38)
mulq CRYPTO_NAMESPACE(38)(%rip)
# qhasm: squarer4 = squarerax
# asm 1: mov <squarerax=int64#7,>squarer4=int64#9
# asm 2: mov <squarerax=%rax,>squarer4=%r11
mov %rax,%r11
# qhasm: squarerax = squarer5
# asm 1: mov <squarer5=int64#10,>squarerax=int64#7
# asm 2: mov <squarer5=%r12,>squarerax=%rax
mov %r12,%rax
# qhasm: squarer5 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squarer5=int64#10
# asm 2: mov <squarerdx=%rdx,>squarer5=%r12
mov %rdx,%r12
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)&CRYPTO_NAMESPACE(38)
mulq CRYPTO_NAMESPACE(38)(%rip)
# qhasm: carry? squarer5 += squarerax
# asm 1: add <squarerax=int64#7,<squarer5=int64#10
# asm 2: add <squarerax=%rax,<squarer5=%r12
add %rax,%r12
# qhasm: squarerax = squarer6
# asm 1: mov <squarer6=int64#11,>squarerax=int64#7
# asm 2: mov <squarer6=%r13,>squarerax=%rax
mov %r13,%rax
# qhasm: squarer6 = 0
# asm 1: mov $0,>squarer6=int64#11
# asm 2: mov $0,>squarer6=%r13
mov $0,%r13
# qhasm: squarer6 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer6=int64#11
# asm 2: adc <squarerdx=%rdx,<squarer6=%r13
adc %rdx,%r13
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)&CRYPTO_NAMESPACE(38)
mulq CRYPTO_NAMESPACE(38)(%rip)
# qhasm: carry? squarer6 += squarerax
# asm 1: add <squarerax=int64#7,<squarer6=int64#11
# asm 2: add <squarerax=%rax,<squarer6=%r13
add %rax,%r13
# qhasm: squarerax = squarer7
# asm 1: mov <squarer7=int64#4,>squarerax=int64#7
# asm 2: mov <squarer7=%rcx,>squarerax=%rax
mov %rcx,%rax
# qhasm: squarer7 = 0
# asm 1: mov $0,>squarer7=int64#4
# asm 2: mov $0,>squarer7=%rcx
mov $0,%rcx
# qhasm: squarer7 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer7=int64#4
# asm 2: adc <squarerdx=%rdx,<squarer7=%rcx
adc %rdx,%rcx
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)&CRYPTO_NAMESPACE(38)
mulq CRYPTO_NAMESPACE(38)(%rip)
# qhasm: carry? squarer7 += squarerax
# asm 1: add <squarerax=int64#7,<squarer7=int64#4
# asm 2: add <squarerax=%rax,<squarer7=%rcx
add %rax,%rcx
# qhasm: squarer8 = 0
# asm 1: mov $0,>squarer8=int64#7
# asm 2: mov $0,>squarer8=%rax
mov $0,%rax
# qhasm: squarer8 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer8=int64#7
# asm 2: adc <squarerdx=%rdx,<squarer8=%rax
adc %rdx,%rax
# qhasm: carry? a0 += squarer4
# asm 1: add <squarer4=int64#9,<a0=int64#12
# asm 2: add <squarer4=%r11,<a0=%r14
add %r11,%r14
# qhasm: carry? a1 += squarer5 + carry
# asm 1: adc <squarer5=int64#10,<a1=int64#5
# asm 2: adc <squarer5=%r12,<a1=%r8
adc %r12,%r8
# qhasm: carry? a2 += squarer6 + carry
# asm 1: adc <squarer6=int64#11,<a2=int64#6
# asm 2: adc <squarer6=%r13,<a2=%r9
adc %r13,%r9
# qhasm: carry? a3 += squarer7 + carry
# asm 1: adc <squarer7=int64#4,<a3=int64#8
# asm 2: adc <squarer7=%rcx,<a3=%r10
adc %rcx,%r10
# qhasm: squarezero = 0
# asm 1: mov $0,>squarezero=int64#3
# asm 2: mov $0,>squarezero=%rdx
mov $0,%rdx
# qhasm: squarer8 += squarezero + carry
# asm 1: adc <squarezero=int64#3,<squarer8=int64#7
# asm 2: adc <squarezero=%rdx,<squarer8=%rax
adc %rdx,%rax
# qhasm: squarer8 *= 38
# asm 1: imulq $38,<squarer8=int64#7,>squarer8=int64#4
# asm 2: imulq $38,<squarer8=%rax,>squarer8=%rcx
imulq $38,%rax,%rcx
# qhasm: carry? a0 += squarer8
# asm 1: add <squarer8=int64#4,<a0=int64#12
# asm 2: add <squarer8=%rcx,<a0=%r14
add %rcx,%r14
# qhasm: carry? a1 += squarezero + carry
# asm 1: adc <squarezero=int64#3,<a1=int64#5
# asm 2: adc <squarezero=%rdx,<a1=%r8
adc %rdx,%r8
# qhasm: carry? a2 += squarezero + carry
# asm 1: adc <squarezero=int64#3,<a2=int64#6
# asm 2: adc <squarezero=%rdx,<a2=%r9
adc %rdx,%r9
# qhasm: carry? a3 += squarezero + carry
# asm 1: adc <squarezero=int64#3,<a3=int64#8
# asm 2: adc <squarezero=%rdx,<a3=%r10
adc %rdx,%r10
# qhasm: squarezero += squarezero + carry
# asm 1: adc <squarezero=int64#3,<squarezero=int64#3
# asm 2: adc <squarezero=%rdx,<squarezero=%rdx
adc %rdx,%rdx
# qhasm: squarezero *= 38
# asm 1: imulq $38,<squarezero=int64#3,>squarezero=int64#3
# asm 2: imulq $38,<squarezero=%rdx,>squarezero=%rdx
imulq $38,%rdx,%rdx
# qhasm: a0 += squarezero
# asm 1: add <squarezero=int64#3,<a0=int64#12
# asm 2: add <squarezero=%rdx,<a0=%r14
add %rdx,%r14
# qhasm: a0_stack = a0
# asm 1: movq <a0=int64#12,>a0_stack=stack64#8
# asm 2: movq <a0=%r14,>a0_stack=56(%rsp)
movq %r14,56(%rsp)
# qhasm: a1_stack = a1
# asm 1: movq <a1=int64#5,>a1_stack=stack64#9
# asm 2: movq <a1=%r8,>a1_stack=64(%rsp)
movq %r8,64(%rsp)
# qhasm: a2_stack = a2
# asm 1: movq <a2=int64#6,>a2_stack=stack64#10
# asm 2: movq <a2=%r9,>a2_stack=72(%rsp)
movq %r9,72(%rsp)
# qhasm: a3_stack = a3
# asm 1: movq <a3=int64#8,>a3_stack=stack64#11
# asm 2: movq <a3=%r10,>a3_stack=80(%rsp)
movq %r10,80(%rsp)
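# Second field squaring: b = (bytes pp+32..pp+63)^2, i.e. Y1^2, by the
# same cross-product / double / diagonal pattern as above.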
# qhasm: squarer7 = 0
# asm 1: mov $0,>squarer7=int64#4
# asm 2: mov $0,>squarer7=%rcx
mov $0,%rcx
# qhasm: squarerax = *(uint64 *)(pp + 40)
# asm 1: movq 40(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 40(<pp=%rsi),>squarerax=%rax
movq 40(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 32)
# asm 1: mulq 32(<pp=int64#2)
# asm 2: mulq 32(<pp=%rsi)
mulq 32(%rsi)
# qhasm: b1 = squarerax
# asm 1: mov <squarerax=int64#7,>b1=int64#5
# asm 2: mov <squarerax=%rax,>b1=%r8
mov %rax,%r8
# qhasm: b2 = squarerdx
# asm 1: mov <squarerdx=int64#3,>b2=int64#6
# asm 2: mov <squarerdx=%rdx,>b2=%r9
mov %rdx,%r9
# qhasm: squarerax = *(uint64 *)(pp + 48)
# asm 1: movq 48(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 48(<pp=%rsi),>squarerax=%rax
movq 48(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 40)
# asm 1: mulq 40(<pp=int64#2)
# asm 2: mulq 40(<pp=%rsi)
mulq 40(%rsi)
# qhasm: b3 = squarerax
# asm 1: mov <squarerax=int64#7,>b3=int64#8
# asm 2: mov <squarerax=%rax,>b3=%r10
mov %rax,%r10
# qhasm: squarer4 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squarer4=int64#9
# asm 2: mov <squarerdx=%rdx,>squarer4=%r11
mov %rdx,%r11
# qhasm: squarerax = *(uint64 *)(pp + 56)
# asm 1: movq 56(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 56(<pp=%rsi),>squarerax=%rax
movq 56(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 48)
# asm 1: mulq 48(<pp=int64#2)
# asm 2: mulq 48(<pp=%rsi)
mulq 48(%rsi)
# qhasm: squarer5 = squarerax
# asm 1: mov <squarerax=int64#7,>squarer5=int64#10
# asm 2: mov <squarerax=%rax,>squarer5=%r12
mov %rax,%r12
# qhasm: squarer6 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squarer6=int64#11
# asm 2: mov <squarerdx=%rdx,>squarer6=%r13
mov %rdx,%r13
# qhasm: squarerax = *(uint64 *)(pp + 48)
# asm 1: movq 48(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 48(<pp=%rsi),>squarerax=%rax
movq 48(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 32)
# asm 1: mulq 32(<pp=int64#2)
# asm 2: mulq 32(<pp=%rsi)
mulq 32(%rsi)
# qhasm: carry? b2 += squarerax
# asm 1: add <squarerax=int64#7,<b2=int64#6
# asm 2: add <squarerax=%rax,<b2=%r9
add %rax,%r9
# qhasm: carry? b3 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<b3=int64#8
# asm 2: adc <squarerdx=%rdx,<b3=%r10
adc %rdx,%r10
# qhasm: squarer4 += 0 + carry
# asm 1: adc $0,<squarer4=int64#9
# asm 2: adc $0,<squarer4=%r11
adc $0,%r11
# qhasm: squarerax = *(uint64 *)(pp + 56)
# asm 1: movq 56(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 56(<pp=%rsi),>squarerax=%rax
movq 56(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 40)
# asm 1: mulq 40(<pp=int64#2)
# asm 2: mulq 40(<pp=%rsi)
mulq 40(%rsi)
# qhasm: carry? squarer4 += squarerax
# asm 1: add <squarerax=int64#7,<squarer4=int64#9
# asm 2: add <squarerax=%rax,<squarer4=%r11
add %rax,%r11
# qhasm: carry? squarer5 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer5=int64#10
# asm 2: adc <squarerdx=%rdx,<squarer5=%r12
adc %rdx,%r12
# qhasm: squarer6 += 0 + carry
# asm 1: adc $0,<squarer6=int64#11
# asm 2: adc $0,<squarer6=%r13
adc $0,%r13
# qhasm: squarerax = *(uint64 *)(pp + 56)
# asm 1: movq 56(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 56(<pp=%rsi),>squarerax=%rax
movq 56(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 32)
# asm 1: mulq 32(<pp=int64#2)
# asm 2: mulq 32(<pp=%rsi)
mulq 32(%rsi)
# qhasm: carry? b3 += squarerax
# asm 1: add <squarerax=int64#7,<b3=int64#8
# asm 2: add <squarerax=%rax,<b3=%r10
add %rax,%r10
# qhasm: carry? squarer4 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer4=int64#9
# asm 2: adc <squarerdx=%rdx,<squarer4=%r11
adc %rdx,%r11
# qhasm: carry? squarer5 += 0 + carry
# asm 1: adc $0,<squarer5=int64#10
# asm 2: adc $0,<squarer5=%r12
adc $0,%r12
# qhasm: carry? squarer6 += 0 + carry
# asm 1: adc $0,<squarer6=int64#11
# asm 2: adc $0,<squarer6=%r13
adc $0,%r13
# qhasm: squarer7 += 0 + carry
# asm 1: adc $0,<squarer7=int64#4
# asm 2: adc $0,<squarer7=%rcx
adc $0,%rcx
# qhasm: carry? b1 += b1
# asm 1: add <b1=int64#5,<b1=int64#5
# asm 2: add <b1=%r8,<b1=%r8
add %r8,%r8
# qhasm: carry? b2 += b2 + carry
# asm 1: adc <b2=int64#6,<b2=int64#6
# asm 2: adc <b2=%r9,<b2=%r9
adc %r9,%r9
# qhasm: carry? b3 += b3 + carry
# asm 1: adc <b3=int64#8,<b3=int64#8
# asm 2: adc <b3=%r10,<b3=%r10
adc %r10,%r10
# qhasm: carry? squarer4 += squarer4 + carry
# asm 1: adc <squarer4=int64#9,<squarer4=int64#9
# asm 2: adc <squarer4=%r11,<squarer4=%r11
adc %r11,%r11
# qhasm: carry? squarer5 += squarer5 + carry
# asm 1: adc <squarer5=int64#10,<squarer5=int64#10
# asm 2: adc <squarer5=%r12,<squarer5=%r12
adc %r12,%r12
# qhasm: carry? squarer6 += squarer6 + carry
# asm 1: adc <squarer6=int64#11,<squarer6=int64#11
# asm 2: adc <squarer6=%r13,<squarer6=%r13
adc %r13,%r13
# qhasm: squarer7 += squarer7 + carry
# asm 1: adc <squarer7=int64#4,<squarer7=int64#4
# asm 2: adc <squarer7=%rcx,<squarer7=%rcx
adc %rcx,%rcx
# qhasm: squarerax = *(uint64 *)(pp + 32)
# asm 1: movq 32(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 32(<pp=%rsi),>squarerax=%rax
movq 32(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 32)
# asm 1: mulq 32(<pp=int64#2)
# asm 2: mulq 32(<pp=%rsi)
mulq 32(%rsi)
# qhasm: b0 = squarerax
# asm 1: mov <squarerax=int64#7,>b0=int64#12
# asm 2: mov <squarerax=%rax,>b0=%r14
mov %rax,%r14
# qhasm: squaret1 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squaret1=int64#13
# asm 2: mov <squarerdx=%rdx,>squaret1=%r15
mov %rdx,%r15
# qhasm: squarerax = *(uint64 *)(pp + 40)
# asm 1: movq 40(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 40(<pp=%rsi),>squarerax=%rax
movq 40(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 40)
# asm 1: mulq 40(<pp=int64#2)
# asm 2: mulq 40(<pp=%rsi)
mulq 40(%rsi)
# qhasm: squaret2 = squarerax
# asm 1: mov <squarerax=int64#7,>squaret2=int64#14
# asm 2: mov <squarerax=%rax,>squaret2=%rbx
mov %rax,%rbx
# qhasm: squaret3 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squaret3=int64#15
# asm 2: mov <squarerdx=%rdx,>squaret3=%rbp
mov %rdx,%rbp
# qhasm: squarerax = *(uint64 *)(pp + 48)
# asm 1: movq 48(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 48(<pp=%rsi),>squarerax=%rax
movq 48(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 48)
# asm 1: mulq 48(<pp=int64#2)
# asm 2: mulq 48(<pp=%rsi)
mulq 48(%rsi)
# qhasm: carry? b1 += squaret1
# asm 1: add <squaret1=int64#13,<b1=int64#5
# asm 2: add <squaret1=%r15,<b1=%r8
add %r15,%r8
# qhasm: carry? b2 += squaret2 + carry
# asm 1: adc <squaret2=int64#14,<b2=int64#6
# asm 2: adc <squaret2=%rbx,<b2=%r9
adc %rbx,%r9
# qhasm: carry? b3 += squaret3 + carry
# asm 1: adc <squaret3=int64#15,<b3=int64#8
# asm 2: adc <squaret3=%rbp,<b3=%r10
adc %rbp,%r10
# qhasm: carry? squarer4 += squarerax + carry
# asm 1: adc <squarerax=int64#7,<squarer4=int64#9
# asm 2: adc <squarerax=%rax,<squarer4=%r11
adc %rax,%r11
# qhasm: carry? squarer5 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer5=int64#10
# asm 2: adc <squarerdx=%rdx,<squarer5=%r12
adc %rdx,%r12
# qhasm: carry? squarer6 += 0 + carry
# asm 1: adc $0,<squarer6=int64#11
# asm 2: adc $0,<squarer6=%r13
adc $0,%r13
# qhasm: squarer7 += 0 + carry
# asm 1: adc $0,<squarer7=int64#4
# asm 2: adc $0,<squarer7=%rcx
adc $0,%rcx
# qhasm: squarerax = *(uint64 *)(pp + 56)
# asm 1: movq 56(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 56(<pp=%rsi),>squarerax=%rax
movq 56(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 56)
# asm 1: mulq 56(<pp=int64#2)
# asm 2: mulq 56(<pp=%rsi)
mulq 56(%rsi)
# qhasm: carry? squarer6 += squarerax
# asm 1: add <squarerax=int64#7,<squarer6=int64#11
# asm 2: add <squarerax=%rax,<squarer6=%r13
add %rax,%r13
# qhasm: squarer7 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer7=int64#4
# asm 2: adc <squarerdx=%rdx,<squarer7=%rcx
adc %rdx,%rcx
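# Fold the high limbs of the 512-bit square of Y1 back into b0..b3 by
# multiplying by 38, exactly as in the reduction of a above.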
# qhasm: squarerax = squarer4
# asm 1: mov <squarer4=int64#9,>squarerax=int64#7
# asm 2: mov <squarer4=%r11,>squarerax=%rax
mov %r11,%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)&CRYPTO_NAMESPACE(38)
mulq CRYPTO_NAMESPACE(38)(%rip)
# qhasm: squarer4 = squarerax
# asm 1: mov <squarerax=int64#7,>squarer4=int64#9
# asm 2: mov <squarerax=%rax,>squarer4=%r11
mov %rax,%r11
# qhasm: squarerax = squarer5
# asm 1: mov <squarer5=int64#10,>squarerax=int64#7
# asm 2: mov <squarer5=%r12,>squarerax=%rax
mov %r12,%rax
# qhasm: squarer5 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squarer5=int64#10
# asm 2: mov <squarerdx=%rdx,>squarer5=%r12
mov %rdx,%r12
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)&CRYPTO_NAMESPACE(38)
mulq CRYPTO_NAMESPACE(38)(%rip)
# qhasm: carry? squarer5 += squarerax
# asm 1: add <squarerax=int64#7,<squarer5=int64#10
# asm 2: add <squarerax=%rax,<squarer5=%r12
add %rax,%r12
# qhasm: squarerax = squarer6
# asm 1: mov <squarer6=int64#11,>squarerax=int64#7
# asm 2: mov <squarer6=%r13,>squarerax=%rax
mov %r13,%rax
# qhasm: squarer6 = 0
# asm 1: mov $0,>squarer6=int64#11
# asm 2: mov $0,>squarer6=%r13
mov $0,%r13
# qhasm: squarer6 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer6=int64#11
# asm 2: adc <squarerdx=%rdx,<squarer6=%r13
adc %rdx,%r13
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)&CRYPTO_NAMESPACE(38)
mulq CRYPTO_NAMESPACE(38)(%rip)
# qhasm: carry? squarer6 += squarerax
# asm 1: add <squarerax=int64#7,<squarer6=int64#11
# asm 2: add <squarerax=%rax,<squarer6=%r13
add %rax,%r13
# qhasm: squarerax = squarer7
# asm 1: mov <squarer7=int64#4,>squarerax=int64#7
# asm 2: mov <squarer7=%rcx,>squarerax=%rax
mov %rcx,%rax
# qhasm: squarer7 = 0
# asm 1: mov $0,>squarer7=int64#4
# asm 2: mov $0,>squarer7=%rcx
mov $0,%rcx
# qhasm: squarer7 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer7=int64#4
# asm 2: adc <squarerdx=%rdx,<squarer7=%rcx
adc %rdx,%rcx
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)&CRYPTO_NAMESPACE(38)
mulq CRYPTO_NAMESPACE(38)(%rip)
# qhasm: carry? squarer7 += squarerax
# asm 1: add <squarerax=int64#7,<squarer7=int64#4
# asm 2: add <squarerax=%rax,<squarer7=%rcx
add %rax,%rcx
# qhasm: squarer8 = 0
# asm 1: mov $0,>squarer8=int64#7
# asm 2: mov $0,>squarer8=%rax
mov $0,%rax
# qhasm: squarer8 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer8=int64#7
# asm 2: adc <squarerdx=%rdx,<squarer8=%rax
adc %rdx,%rax
# qhasm: carry? b0 += squarer4
# asm 1: add <squarer4=int64#9,<b0=int64#12
# asm 2: add <squarer4=%r11,<b0=%r14
add %r11,%r14
# qhasm: carry? b1 += squarer5 + carry
# asm 1: adc <squarer5=int64#10,<b1=int64#5
# asm 2: adc <squarer5=%r12,<b1=%r8
adc %r12,%r8
# qhasm: carry? b2 += squarer6 + carry
# asm 1: adc <squarer6=int64#11,<b2=int64#6
# asm 2: adc <squarer6=%r13,<b2=%r9
adc %r13,%r9
# qhasm: carry? b3 += squarer7 + carry
# asm 1: adc <squarer7=int64#4,<b3=int64#8
# asm 2: adc <squarer7=%rcx,<b3=%r10
adc %rcx,%r10
# qhasm: squarezero = 0
# asm 1: mov $0,>squarezero=int64#3
# asm 2: mov $0,>squarezero=%rdx
mov $0,%rdx
# qhasm: squarer8 += squarezero + carry
# asm 1: adc <squarezero=int64#3,<squarer8=int64#7
# asm 2: adc <squarezero=%rdx,<squarer8=%rax
adc %rdx,%rax
# qhasm: squarer8 *= 38
# asm 1: imulq $38,<squarer8=int64#7,>squarer8=int64#4
# asm 2: imulq $38,<squarer8=%rax,>squarer8=%rcx
imulq $38,%rax,%rcx
# qhasm: carry? b0 += squarer8
# asm 1: add <squarer8=int64#4,<b0=int64#12
# asm 2: add <squarer8=%rcx,<b0=%r14
add %rcx,%r14
# qhasm: carry? b1 += squarezero + carry
# asm 1: adc <squarezero=int64#3,<b1=int64#5
# asm 2: adc <squarezero=%rdx,<b1=%r8
adc %rdx,%r8
# qhasm: carry? b2 += squarezero + carry
# asm 1: adc <squarezero=int64#3,<b2=int64#6
# asm 2: adc <squarezero=%rdx,<b2=%r9
adc %rdx,%r9
# qhasm: carry? b3 += squarezero + carry
# asm 1: adc <squarezero=int64#3,<b3=int64#8
# asm 2: adc <squarezero=%rdx,<b3=%r10
adc %rdx,%r10
# qhasm: squarezero += squarezero + carry
# asm 1: adc <squarezero=int64#3,<squarezero=int64#3
# asm 2: adc <squarezero=%rdx,<squarezero=%rdx
adc %rdx,%rdx
# qhasm: squarezero *= 38
# asm 1: imulq $38,<squarezero=int64#3,>squarezero=int64#3
# asm 2: imulq $38,<squarezero=%rdx,>squarezero=%rdx
imulq $38,%rdx,%rdx
# qhasm: b0 += squarezero
# asm 1: add <squarezero=int64#3,<b0=int64#12
# asm 2: add <squarezero=%rdx,<b0=%r14
add %rdx,%r14
# qhasm: b0_stack = b0
# asm 1: movq <b0=int64#12,>b0_stack=stack64#12
# asm 2: movq <b0=%r14,>b0_stack=88(%rsp)
movq %r14,88(%rsp)
# qhasm: b1_stack = b1
# asm 1: movq <b1=int64#5,>b1_stack=stack64#13
# asm 2: movq <b1=%r8,>b1_stack=96(%rsp)
movq %r8,96(%rsp)
# qhasm: b2_stack = b2
# asm 1: movq <b2=int64#6,>b2_stack=stack64#14
# asm 2: movq <b2=%r9,>b2_stack=104(%rsp)
movq %r9,104(%rsp)
# qhasm: b3_stack = b3
# asm 1: movq <b3=int64#8,>b3_stack=stack64#15
# asm 2: movq <b3=%r10,>b3_stack=112(%rsp)
movq %r10,112(%rsp)
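# Third field squaring: c = (bytes pp+64..pp+95)^2, i.e. Z1^2, again by
# the same pattern.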
# qhasm: squarer7 = 0
# asm 1: mov $0,>squarer7=int64#4
# asm 2: mov $0,>squarer7=%rcx
mov $0,%rcx
# qhasm: squarerax = *(uint64 *)(pp + 72)
# asm 1: movq 72(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 72(<pp=%rsi),>squarerax=%rax
movq 72(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 64)
# asm 1: mulq 64(<pp=int64#2)
# asm 2: mulq 64(<pp=%rsi)
mulq 64(%rsi)
# qhasm: c1 = squarerax
# asm 1: mov <squarerax=int64#7,>c1=int64#5
# asm 2: mov <squarerax=%rax,>c1=%r8
mov %rax,%r8
# qhasm: c2 = squarerdx
# asm 1: mov <squarerdx=int64#3,>c2=int64#6
# asm 2: mov <squarerdx=%rdx,>c2=%r9
mov %rdx,%r9
# qhasm: squarerax = *(uint64 *)(pp + 80)
# asm 1: movq 80(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 80(<pp=%rsi),>squarerax=%rax
movq 80(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 72)
# asm 1: mulq 72(<pp=int64#2)
# asm 2: mulq 72(<pp=%rsi)
mulq 72(%rsi)
# qhasm: c3 = squarerax
# asm 1: mov <squarerax=int64#7,>c3=int64#8
# asm 2: mov <squarerax=%rax,>c3=%r10
mov %rax,%r10
# qhasm: squarer4 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squarer4=int64#9
# asm 2: mov <squarerdx=%rdx,>squarer4=%r11
mov %rdx,%r11
# qhasm: squarerax = *(uint64 *)(pp + 88)
# asm 1: movq 88(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 88(<pp=%rsi),>squarerax=%rax
movq 88(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 80)
# asm 1: mulq 80(<pp=int64#2)
# asm 2: mulq 80(<pp=%rsi)
mulq 80(%rsi)
# qhasm: squarer5 = squarerax
# asm 1: mov <squarerax=int64#7,>squarer5=int64#10
# asm 2: mov <squarerax=%rax,>squarer5=%r12
mov %rax,%r12
# qhasm: squarer6 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squarer6=int64#11
# asm 2: mov <squarerdx=%rdx,>squarer6=%r13
mov %rdx,%r13
# qhasm: squarerax = *(uint64 *)(pp + 80)
# asm 1: movq 80(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 80(<pp=%rsi),>squarerax=%rax
movq 80(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 64)
# asm 1: mulq 64(<pp=int64#2)
# asm 2: mulq 64(<pp=%rsi)
mulq 64(%rsi)
# qhasm: carry? c2 += squarerax
# asm 1: add <squarerax=int64#7,<c2=int64#6
# asm 2: add <squarerax=%rax,<c2=%r9
add %rax,%r9
# qhasm: carry? c3 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<c3=int64#8
# asm 2: adc <squarerdx=%rdx,<c3=%r10
adc %rdx,%r10
# qhasm: squarer4 += 0 + carry
# asm 1: adc $0,<squarer4=int64#9
# asm 2: adc $0,<squarer4=%r11
adc $0,%r11
# qhasm: squarerax = *(uint64 *)(pp + 88)
# asm 1: movq 88(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 88(<pp=%rsi),>squarerax=%rax
movq 88(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 72)
# asm 1: mulq 72(<pp=int64#2)
# asm 2: mulq 72(<pp=%rsi)
mulq 72(%rsi)
# qhasm: carry? squarer4 += squarerax
# asm 1: add <squarerax=int64#7,<squarer4=int64#9
# asm 2: add <squarerax=%rax,<squarer4=%r11
add %rax,%r11
# qhasm: carry? squarer5 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer5=int64#10
# asm 2: adc <squarerdx=%rdx,<squarer5=%r12
adc %rdx,%r12
# qhasm: squarer6 += 0 + carry
# asm 1: adc $0,<squarer6=int64#11
# asm 2: adc $0,<squarer6=%r13
adc $0,%r13
# qhasm: squarerax = *(uint64 *)(pp + 88)
# asm 1: movq 88(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 88(<pp=%rsi),>squarerax=%rax
movq 88(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 64)
# asm 1: mulq 64(<pp=int64#2)
# asm 2: mulq 64(<pp=%rsi)
mulq 64(%rsi)
# qhasm: carry? c3 += squarerax
# asm 1: add <squarerax=int64#7,<c3=int64#8
# asm 2: add <squarerax=%rax,<c3=%r10
add %rax,%r10
# qhasm: carry? squarer4 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer4=int64#9
# asm 2: adc <squarerdx=%rdx,<squarer4=%r11
adc %rdx,%r11
# qhasm: carry? squarer5 += 0 + carry
# asm 1: adc $0,<squarer5=int64#10
# asm 2: adc $0,<squarer5=%r12
adc $0,%r12
# qhasm: carry? squarer6 += 0 + carry
# asm 1: adc $0,<squarer6=int64#11
# asm 2: adc $0,<squarer6=%r13
adc $0,%r13
# qhasm: squarer7 += 0 + carry
# asm 1: adc $0,<squarer7=int64#4
# asm 2: adc $0,<squarer7=%rcx
adc $0,%rcx
# qhasm: carry? c1 += c1
# asm 1: add <c1=int64#5,<c1=int64#5
# asm 2: add <c1=%r8,<c1=%r8
add %r8,%r8
# qhasm: carry? c2 += c2 + carry
# asm 1: adc <c2=int64#6,<c2=int64#6
# asm 2: adc <c2=%r9,<c2=%r9
adc %r9,%r9
# qhasm: carry? c3 += c3 + carry
# asm 1: adc <c3=int64#8,<c3=int64#8
# asm 2: adc <c3=%r10,<c3=%r10
adc %r10,%r10
# qhasm: carry? squarer4 += squarer4 + carry
# asm 1: adc <squarer4=int64#9,<squarer4=int64#9
# asm 2: adc <squarer4=%r11,<squarer4=%r11
adc %r11,%r11
# qhasm: carry? squarer5 += squarer5 + carry
# asm 1: adc <squarer5=int64#10,<squarer5=int64#10
# asm 2: adc <squarer5=%r12,<squarer5=%r12
adc %r12,%r12
# qhasm: carry? squarer6 += squarer6 + carry
# asm 1: adc <squarer6=int64#11,<squarer6=int64#11
# asm 2: adc <squarer6=%r13,<squarer6=%r13
adc %r13,%r13
# qhasm: squarer7 += squarer7 + carry
# asm 1: adc <squarer7=int64#4,<squarer7=int64#4
# asm 2: adc <squarer7=%rcx,<squarer7=%rcx
adc %rcx,%rcx
# qhasm: squarerax = *(uint64 *)(pp + 64)
# asm 1: movq 64(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 64(<pp=%rsi),>squarerax=%rax
movq 64(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 64)
# asm 1: mulq 64(<pp=int64#2)
# asm 2: mulq 64(<pp=%rsi)
mulq 64(%rsi)
# qhasm: c0 = squarerax
# asm 1: mov <squarerax=int64#7,>c0=int64#12
# asm 2: mov <squarerax=%rax,>c0=%r14
mov %rax,%r14
# qhasm: squaret1 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squaret1=int64#13
# asm 2: mov <squarerdx=%rdx,>squaret1=%r15
mov %rdx,%r15
# qhasm: squarerax = *(uint64 *)(pp + 72)
# asm 1: movq 72(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 72(<pp=%rsi),>squarerax=%rax
movq 72(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 72)
# asm 1: mulq 72(<pp=int64#2)
# asm 2: mulq 72(<pp=%rsi)
mulq 72(%rsi)
# qhasm: squaret2 = squarerax
# asm 1: mov <squarerax=int64#7,>squaret2=int64#14
# asm 2: mov <squarerax=%rax,>squaret2=%rbx
mov %rax,%rbx
# qhasm: squaret3 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squaret3=int64#15
# asm 2: mov <squarerdx=%rdx,>squaret3=%rbp
mov %rdx,%rbp
# qhasm: squarerax = *(uint64 *)(pp + 80)
# asm 1: movq 80(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 80(<pp=%rsi),>squarerax=%rax
movq 80(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 80)
# asm 1: mulq 80(<pp=int64#2)
# asm 2: mulq 80(<pp=%rsi)
mulq 80(%rsi)
# qhasm: carry? c1 += squaret1
# asm 1: add <squaret1=int64#13,<c1=int64#5
# asm 2: add <squaret1=%r15,<c1=%r8
add %r15,%r8
# qhasm: carry? c2 += squaret2 + carry
# asm 1: adc <squaret2=int64#14,<c2=int64#6
# asm 2: adc <squaret2=%rbx,<c2=%r9
adc %rbx,%r9
# qhasm: carry? c3 += squaret3 + carry
# asm 1: adc <squaret3=int64#15,<c3=int64#8
# asm 2: adc <squaret3=%rbp,<c3=%r10
adc %rbp,%r10
# qhasm: carry? squarer4 += squarerax + carry
# asm 1: adc <squarerax=int64#7,<squarer4=int64#9
# asm 2: adc <squarerax=%rax,<squarer4=%r11
adc %rax,%r11
# qhasm: carry? squarer5 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer5=int64#10
# asm 2: adc <squarerdx=%rdx,<squarer5=%r12
adc %rdx,%r12
# qhasm: carry? squarer6 += 0 + carry
# asm 1: adc $0,<squarer6=int64#11
# asm 2: adc $0,<squarer6=%r13
adc $0,%r13
# qhasm: squarer7 += 0 + carry
# asm 1: adc $0,<squarer7=int64#4
# asm 2: adc $0,<squarer7=%rcx
adc $0,%rcx
# qhasm: squarerax = *(uint64 *)(pp + 88)
# asm 1: movq 88(<pp=int64#2),>squarerax=int64#7
# asm 2: movq 88(<pp=%rsi),>squarerax=%rax
movq 88(%rsi),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 88)
# asm 1: mulq 88(<pp=int64#2)
# asm 2: mulq 88(<pp=%rsi)
mulq 88(%rsi)
# qhasm: carry? squarer6 += squarerax
# asm 1: add <squarerax=int64#7,<squarer6=int64#11
# asm 2: add <squarerax=%rax,<squarer6=%r13
add %rax,%r13
# qhasm: squarer7 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer7=int64#4
# asm 2: adc <squarerdx=%rdx,<squarer7=%rcx
adc %rdx,%rcx
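# Reduce the square of Z1 by folding the high limbs back into c0..c3
# via multiplication by 38, as above.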
# qhasm: squarerax = squarer4
# asm 1: mov <squarer4=int64#9,>squarerax=int64#7
# asm 2: mov <squarer4=%r11,>squarerax=%rax
mov %r11,%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)&CRYPTO_NAMESPACE(38)
mulq CRYPTO_NAMESPACE(38)(%rip)
# qhasm: squarer4 = squarerax
# asm 1: mov <squarerax=int64#7,>squarer4=int64#9
# asm 2: mov <squarerax=%rax,>squarer4=%r11
mov %rax,%r11
# qhasm: squarerax = squarer5
# asm 1: mov <squarer5=int64#10,>squarerax=int64#7
# asm 2: mov <squarer5=%r12,>squarerax=%rax
mov %r12,%rax
# qhasm: squarer5 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squarer5=int64#10
# asm 2: mov <squarerdx=%rdx,>squarer5=%r12
mov %rdx,%r12
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)&CRYPTO_NAMESPACE(38)
mulq CRYPTO_NAMESPACE(38)(%rip)
# qhasm: carry? squarer5 += squarerax
# asm 1: add <squarerax=int64#7,<squarer5=int64#10
# asm 2: add <squarerax=%rax,<squarer5=%r12
add %rax,%r12
# qhasm: squarerax = squarer6
# asm 1: mov <squarer6=int64#11,>squarerax=int64#7
# asm 2: mov <squarer6=%r13,>squarerax=%rax
mov %r13,%rax
# qhasm: squarer6 = 0
# asm 1: mov $0,>squarer6=int64#11
# asm 2: mov $0,>squarer6=%r13
mov $0,%r13
# qhasm: squarer6 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer6=int64#11
# asm 2: adc <squarerdx=%rdx,<squarer6=%r13
adc %rdx,%r13
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)&CRYPTO_NAMESPACE(38)
mulq CRYPTO_NAMESPACE(38)(%rip)
# qhasm: carry? squarer6 += squarerax
# asm 1: add <squarerax=int64#7,<squarer6=int64#11
# asm 2: add <squarerax=%rax,<squarer6=%r13
add %rax,%r13
# qhasm: squarerax = squarer7
# asm 1: mov <squarer7=int64#4,>squarerax=int64#7
# asm 2: mov <squarer7=%rcx,>squarerax=%rax
mov %rcx,%rax
# qhasm: squarer7 = 0
# asm 1: mov $0,>squarer7=int64#4
# asm 2: mov $0,>squarer7=%rcx
mov $0,%rcx
# qhasm: squarer7 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer7=int64#4
# asm 2: adc <squarerdx=%rdx,<squarer7=%rcx
adc %rdx,%rcx
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)&CRYPTO_NAMESPACE(38)
mulq CRYPTO_NAMESPACE(38)(%rip)
# qhasm: carry? squarer7 += squarerax
# asm 1: add <squarerax=int64#7,<squarer7=int64#4
# asm 2: add <squarerax=%rax,<squarer7=%rcx
add %rax,%rcx
# qhasm: squarer8 = 0
# asm 1: mov $0,>squarer8=int64#7
# asm 2: mov $0,>squarer8=%rax
mov $0,%rax
# qhasm: squarer8 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer8=int64#7
# asm 2: adc <squarerdx=%rdx,<squarer8=%rax
adc %rdx,%rax
# qhasm: carry? c0 += squarer4
# asm 1: add <squarer4=int64#9,<c0=int64#12
# asm 2: add <squarer4=%r11,<c0=%r14
add %r11,%r14
# qhasm: carry? c1 += squarer5 + carry
# asm 1: adc <squarer5=int64#10,<c1=int64#5
# asm 2: adc <squarer5=%r12,<c1=%r8
adc %r12,%r8
# qhasm: carry? c2 += squarer6 + carry
# asm 1: adc <squarer6=int64#11,<c2=int64#6
# asm 2: adc <squarer6=%r13,<c2=%r9
adc %r13,%r9
# qhasm: carry? c3 += squarer7 + carry
# asm 1: adc <squarer7=int64#4,<c3=int64#8
# asm 2: adc <squarer7=%rcx,<c3=%r10
adc %rcx,%r10
# qhasm: squarezero = 0
# asm 1: mov $0,>squarezero=int64#3
# asm 2: mov $0,>squarezero=%rdx
mov $0,%rdx
# qhasm: squarer8 += squarezero + carry
# asm 1: adc <squarezero=int64#3,<squarer8=int64#7
# asm 2: adc <squarezero=%rdx,<squarer8=%rax
adc %rdx,%rax
# qhasm: squarer8 *= 38
# asm 1: imulq $38,<squarer8=int64#7,>squarer8=int64#4
# asm 2: imulq $38,<squarer8=%rax,>squarer8=%rcx
imulq $38,%rax,%rcx
# qhasm: carry? c0 += squarer8
# asm 1: add <squarer8=int64#4,<c0=int64#12
# asm 2: add <squarer8=%rcx,<c0=%r14
add %rcx,%r14
# qhasm: carry? c1 += squarezero + carry
# asm 1: adc <squarezero=int64#3,<c1=int64#5
# asm 2: adc <squarezero=%rdx,<c1=%r8
adc %rdx,%r8
# qhasm: carry? c2 += squarezero + carry
# asm 1: adc <squarezero=int64#3,<c2=int64#6
# asm 2: adc <squarezero=%rdx,<c2=%r9
adc %rdx,%r9
# qhasm: carry? c3 += squarezero + carry
# asm 1: adc <squarezero=int64#3,<c3=int64#8
# asm 2: adc <squarezero=%rdx,<c3=%r10
adc %rdx,%r10
# qhasm: squarezero += squarezero + carry
# asm 1: adc <squarezero=int64#3,<squarezero=int64#3
# asm 2: adc <squarezero=%rdx,<squarezero=%rdx
adc %rdx,%rdx
# qhasm: squarezero *= 38
# asm 1: imulq $38,<squarezero=int64#3,>squarezero=int64#3
# asm 2: imulq $38,<squarezero=%rdx,>squarezero=%rdx
imulq $38,%rdx,%rdx
# qhasm: c0 += squarezero
# asm 1: add <squarezero=int64#3,<c0=int64#12
# asm 2: add <squarezero=%rdx,<c0=%r14
add %rdx,%r14
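# Editorial note: c now holds a fully reduced square (the limbs squared
# above appear to be the field element at pp+64..88). The add/adc chain
# below doubles c; a carry out of the 256-bit doubling is folded back in
# by conditionally adding 38 (cmovae selects 0 or 38), with one more
# conditional add in case the fix-up itself carries.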
# qhasm: carry? c0 += c0
# asm 1: add <c0=int64#12,<c0=int64#12
# asm 2: add <c0=%r14,<c0=%r14
add %r14,%r14
# qhasm: carry? c1 += c1 + carry
# asm 1: adc <c1=int64#5,<c1=int64#5
# asm 2: adc <c1=%r8,<c1=%r8
adc %r8,%r8
# qhasm: carry? c2 += c2 + carry
# asm 1: adc <c2=int64#6,<c2=int64#6
# asm 2: adc <c2=%r9,<c2=%r9
adc %r9,%r9
# qhasm: carry? c3 += c3 + carry
# asm 1: adc <c3=int64#8,<c3=int64#8
# asm 2: adc <c3=%r10,<c3=%r10
adc %r10,%r10
# qhasm: addt0 = 0
# asm 1: mov $0,>addt0=int64#3
# asm 2: mov $0,>addt0=%rdx
mov $0,%rdx
# qhasm: addt1 = 38
# asm 1: mov $38,>addt1=int64#4
# asm 2: mov $38,>addt1=%rcx
mov $38,%rcx
# qhasm: addt1 = addt0 if !carry
# asm 1: cmovae <addt0=int64#3,<addt1=int64#4
# asm 2: cmovae <addt0=%rdx,<addt1=%rcx
cmovae %rdx,%rcx
# qhasm: carry? c0 += addt1
# asm 1: add <addt1=int64#4,<c0=int64#12
# asm 2: add <addt1=%rcx,<c0=%r14
add %rcx,%r14
# qhasm: carry? c1 += addt0 + carry
# asm 1: adc <addt0=int64#3,<c1=int64#5
# asm 2: adc <addt0=%rdx,<c1=%r8
adc %rdx,%r8
# qhasm: carry? c2 += addt0 + carry
# asm 1: adc <addt0=int64#3,<c2=int64#6
# asm 2: adc <addt0=%rdx,<c2=%r9
adc %rdx,%r9
# qhasm: carry? c3 += addt0 + carry
# asm 1: adc <addt0=int64#3,<c3=int64#8
# asm 2: adc <addt0=%rdx,<c3=%r10
adc %rdx,%r10
# qhasm: addt0 = addt1 if carry
# asm 1: cmovc <addt1=int64#4,<addt0=int64#3
# asm 2: cmovc <addt1=%rcx,<addt0=%rdx
cmovc %rcx,%rdx
# qhasm: c0 += addt0
# asm 1: add <addt0=int64#3,<c0=int64#12
# asm 2: add <addt0=%rdx,<c0=%r14
add %rdx,%r14
# qhasm: c0_stack = c0
# asm 1: movq <c0=int64#12,>c0_stack=stack64#16
# asm 2: movq <c0=%r14,>c0_stack=120(%rsp)
movq %r14,120(%rsp)
# qhasm: c1_stack = c1
# asm 1: movq <c1=int64#5,>c1_stack=stack64#17
# asm 2: movq <c1=%r8,>c1_stack=128(%rsp)
movq %r8,128(%rsp)
# qhasm: c2_stack = c2
# asm 1: movq <c2=int64#6,>c2_stack=stack64#18
# asm 2: movq <c2=%r9,>c2_stack=136(%rsp)
movq %r9,136(%rsp)
# qhasm: c3_stack = c3
# asm 1: movq <c3=int64#8,>c3_stack=stack64#19
# asm 2: movq <c3=%r10,>c3_stack=144(%rsp)
movq %r10,144(%rsp)
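# Editorial note: with c spilled to the stack, the next block computes
# d = 0 - a (negation mod p of the value in a0_stack..a3_stack). A borrow
# out of the sbbq chain is repaired by conditionally subtracting 38, and
# a second conditional subtract catches a borrow from the fix-up itself.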
# qhasm: d0 = 0
# asm 1: mov $0,>d0=int64#3
# asm 2: mov $0,>d0=%rdx
mov $0,%rdx
# qhasm: d1 = 0
# asm 1: mov $0,>d1=int64#4
# asm 2: mov $0,>d1=%rcx
mov $0,%rcx
# qhasm: d2 = 0
# asm 1: mov $0,>d2=int64#5
# asm 2: mov $0,>d2=%r8
mov $0,%r8
# qhasm: d3 = 0
# asm 1: mov $0,>d3=int64#6
# asm 2: mov $0,>d3=%r9
mov $0,%r9
# qhasm: carry? d0 -= a0_stack
# asm 1: subq <a0_stack=stack64#8,<d0=int64#3
# asm 2: subq <a0_stack=56(%rsp),<d0=%rdx
subq 56(%rsp),%rdx
# qhasm: carry? d1 -= a1_stack - carry
# asm 1: sbbq <a1_stack=stack64#9,<d1=int64#4
# asm 2: sbbq <a1_stack=64(%rsp),<d1=%rcx
sbbq 64(%rsp),%rcx
# qhasm: carry? d2 -= a2_stack - carry
# asm 1: sbbq <a2_stack=stack64#10,<d2=int64#5
# asm 2: sbbq <a2_stack=72(%rsp),<d2=%r8
sbbq 72(%rsp),%r8
# qhasm: carry? d3 -= a3_stack - carry
# asm 1: sbbq <a3_stack=stack64#11,<d3=int64#6
# asm 2: sbbq <a3_stack=80(%rsp),<d3=%r9
sbbq 80(%rsp),%r9
# qhasm: subt0 = 0
# asm 1: mov $0,>subt0=int64#7
# asm 2: mov $0,>subt0=%rax
mov $0,%rax
# qhasm: subt1 = 38
# asm 1: mov $38,>subt1=int64#8
# asm 2: mov $38,>subt1=%r10
mov $38,%r10
# qhasm: subt1 = subt0 if !carry
# asm 1: cmovae <subt0=int64#7,<subt1=int64#8
# asm 2: cmovae <subt0=%rax,<subt1=%r10
cmovae %rax,%r10
# qhasm: carry? d0 -= subt1
# asm 1: sub <subt1=int64#8,<d0=int64#3
# asm 2: sub <subt1=%r10,<d0=%rdx
sub %r10,%rdx
# qhasm: carry? d1 -= subt0 - carry
# asm 1: sbb <subt0=int64#7,<d1=int64#4
# asm 2: sbb <subt0=%rax,<d1=%rcx
sbb %rax,%rcx
# qhasm: carry? d2 -= subt0 - carry
# asm 1: sbb <subt0=int64#7,<d2=int64#5
# asm 2: sbb <subt0=%rax,<d2=%r8
sbb %rax,%r8
# qhasm: carry? d3 -= subt0 - carry
# asm 1: sbb <subt0=int64#7,<d3=int64#6
# asm 2: sbb <subt0=%rax,<d3=%r9
sbb %rax,%r9
# qhasm: subt0 = subt1 if carry
# asm 1: cmovc <subt1=int64#8,<subt0=int64#7
# asm 2: cmovc <subt1=%r10,<subt0=%rax
cmovc %r10,%rax
# qhasm: d0 -= subt0
# asm 1: sub <subt0=int64#7,<d0=int64#3
# asm 2: sub <subt0=%rax,<d0=%rdx
sub %rax,%rdx
# qhasm: d0_stack = d0
# asm 1: movq <d0=int64#3,>d0_stack=stack64#8
# asm 2: movq <d0=%rdx,>d0_stack=56(%rsp)
movq %rdx,56(%rsp)
# qhasm: d1_stack = d1
# asm 1: movq <d1=int64#4,>d1_stack=stack64#9
# asm 2: movq <d1=%rcx,>d1_stack=64(%rsp)
movq %rcx,64(%rsp)
# qhasm: d2_stack = d2
# asm 1: movq <d2=int64#5,>d2_stack=stack64#10
# asm 2: movq <d2=%r8,>d2_stack=72(%rsp)
movq %r8,72(%rsp)
# qhasm: d3_stack = d3
# asm 1: movq <d3=int64#6,>d3_stack=stack64#11
# asm 2: movq <d3=%r9,>d3_stack=80(%rsp)
movq %r9,80(%rsp)
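# Editorial note: the same negation pattern follows for e = 0 - b, using
# the value in b0_stack..b3_stack; the result is spilled to
# e0_stack..e3_stack for the final rx accumulation.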
# qhasm: e0 = 0
# asm 1: mov $0,>e0=int64#7
# asm 2: mov $0,>e0=%rax
mov $0,%rax
# qhasm: e1 = 0
# asm 1: mov $0,>e1=int64#8
# asm 2: mov $0,>e1=%r10
mov $0,%r10
# qhasm: e2 = 0
# asm 1: mov $0,>e2=int64#9
# asm 2: mov $0,>e2=%r11
mov $0,%r11
# qhasm: e3 = 0
# asm 1: mov $0,>e3=int64#10
# asm 2: mov $0,>e3=%r12
mov $0,%r12
# qhasm: carry? e0 -= b0_stack
# asm 1: subq <b0_stack=stack64#12,<e0=int64#7
# asm 2: subq <b0_stack=88(%rsp),<e0=%rax
subq 88(%rsp),%rax
# qhasm: carry? e1 -= b1_stack - carry
# asm 1: sbbq <b1_stack=stack64#13,<e1=int64#8
# asm 2: sbbq <b1_stack=96(%rsp),<e1=%r10
sbbq 96(%rsp),%r10
# qhasm: carry? e2 -= b2_stack - carry
# asm 1: sbbq <b2_stack=stack64#14,<e2=int64#9
# asm 2: sbbq <b2_stack=104(%rsp),<e2=%r11
sbbq 104(%rsp),%r11
# qhasm: carry? e3 -= b3_stack - carry
# asm 1: sbbq <b3_stack=stack64#15,<e3=int64#10
# asm 2: sbbq <b3_stack=112(%rsp),<e3=%r12
sbbq 112(%rsp),%r12
# qhasm: subt0 = 0
# asm 1: mov $0,>subt0=int64#11
# asm 2: mov $0,>subt0=%r13
mov $0,%r13
# qhasm: subt1 = 38
# asm 1: mov $38,>subt1=int64#12
# asm 2: mov $38,>subt1=%r14
mov $38,%r14
# qhasm: subt1 = subt0 if !carry
# asm 1: cmovae <subt0=int64#11,<subt1=int64#12
# asm 2: cmovae <subt0=%r13,<subt1=%r14
cmovae %r13,%r14
# qhasm: carry? e0 -= subt1
# asm 1: sub <subt1=int64#12,<e0=int64#7
# asm 2: sub <subt1=%r14,<e0=%rax
sub %r14,%rax
# qhasm: carry? e1 -= subt0 - carry
# asm 1: sbb <subt0=int64#11,<e1=int64#8
# asm 2: sbb <subt0=%r13,<e1=%r10
sbb %r13,%r10
# qhasm: carry? e2 -= subt0 - carry
# asm 1: sbb <subt0=int64#11,<e2=int64#9
# asm 2: sbb <subt0=%r13,<e2=%r11
sbb %r13,%r11
# qhasm: carry? e3 -= subt0 - carry
# asm 1: sbb <subt0=int64#11,<e3=int64#10
# asm 2: sbb <subt0=%r13,<e3=%r12
sbb %r13,%r12
# qhasm: subt0 = subt1 if carry
# asm 1: cmovc <subt1=int64#12,<subt0=int64#11
# asm 2: cmovc <subt1=%r14,<subt0=%r13
cmovc %r14,%r13
# qhasm: e0 -= subt0
# asm 1: sub <subt0=int64#11,<e0=int64#7
# asm 2: sub <subt0=%r13,<e0=%rax
sub %r13,%rax
# qhasm: e0_stack = e0
# asm 1: movq <e0=int64#7,>e0_stack=stack64#20
# asm 2: movq <e0=%rax,>e0_stack=152(%rsp)
movq %rax,152(%rsp)
# qhasm: e1_stack = e1
# asm 1: movq <e1=int64#8,>e1_stack=stack64#21
# asm 2: movq <e1=%r10,>e1_stack=160(%rsp)
movq %r10,160(%rsp)
# qhasm: e2_stack = e2
# asm 1: movq <e2=int64#9,>e2_stack=stack64#22
# asm 2: movq <e2=%r11,>e2_stack=168(%rsp)
movq %r11,168(%rsp)
# qhasm: e3_stack = e3
# asm 1: movq <e3=int64#10,>e3_stack=stack64#23
# asm 2: movq <e3=%r12,>e3_stack=176(%rsp)
movq %r12,176(%rsp)
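# Editorial note: rz = d + b (mod p): a 256-bit add, then the usual
# conditional add-38 carry fold (2^256 = 38 mod p), with a second
# cmovc-guarded add for a carry produced by the fix-up itself. The
# result is written to rp+32..56.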
# qhasm: rz0 = d0
# asm 1: mov <d0=int64#3,>rz0=int64#7
# asm 2: mov <d0=%rdx,>rz0=%rax
mov %rdx,%rax
# qhasm: rz1 = d1
# asm 1: mov <d1=int64#4,>rz1=int64#8
# asm 2: mov <d1=%rcx,>rz1=%r10
mov %rcx,%r10
# qhasm: rz2 = d2
# asm 1: mov <d2=int64#5,>rz2=int64#9
# asm 2: mov <d2=%r8,>rz2=%r11
mov %r8,%r11
# qhasm: rz3 = d3
# asm 1: mov <d3=int64#6,>rz3=int64#10
# asm 2: mov <d3=%r9,>rz3=%r12
mov %r9,%r12
# qhasm: carry? rz0 += b0_stack
# asm 1: addq <b0_stack=stack64#12,<rz0=int64#7
# asm 2: addq <b0_stack=88(%rsp),<rz0=%rax
addq 88(%rsp),%rax
# qhasm: carry? rz1 += b1_stack + carry
# asm 1: adcq <b1_stack=stack64#13,<rz1=int64#8
# asm 2: adcq <b1_stack=96(%rsp),<rz1=%r10
adcq 96(%rsp),%r10
# qhasm: carry? rz2 += b2_stack + carry
# asm 1: adcq <b2_stack=stack64#14,<rz2=int64#9
# asm 2: adcq <b2_stack=104(%rsp),<rz2=%r11
adcq 104(%rsp),%r11
# qhasm: carry? rz3 += b3_stack + carry
# asm 1: adcq <b3_stack=stack64#15,<rz3=int64#10
# asm 2: adcq <b3_stack=112(%rsp),<rz3=%r12
adcq 112(%rsp),%r12
# qhasm: addt0 = 0
# asm 1: mov $0,>addt0=int64#11
# asm 2: mov $0,>addt0=%r13
mov $0,%r13
# qhasm: addt1 = 38
# asm 1: mov $38,>addt1=int64#12
# asm 2: mov $38,>addt1=%r14
mov $38,%r14
# qhasm: addt1 = addt0 if !carry
# asm 1: cmovae <addt0=int64#11,<addt1=int64#12
# asm 2: cmovae <addt0=%r13,<addt1=%r14
cmovae %r13,%r14
# qhasm: carry? rz0 += addt1
# asm 1: add <addt1=int64#12,<rz0=int64#7
# asm 2: add <addt1=%r14,<rz0=%rax
add %r14,%rax
# qhasm: carry? rz1 += addt0 + carry
# asm 1: adc <addt0=int64#11,<rz1=int64#8
# asm 2: adc <addt0=%r13,<rz1=%r10
adc %r13,%r10
# qhasm: carry? rz2 += addt0 + carry
# asm 1: adc <addt0=int64#11,<rz2=int64#9
# asm 2: adc <addt0=%r13,<rz2=%r11
adc %r13,%r11
# qhasm: carry? rz3 += addt0 + carry
# asm 1: adc <addt0=int64#11,<rz3=int64#10
# asm 2: adc <addt0=%r13,<rz3=%r12
adc %r13,%r12
# qhasm: addt0 = addt1 if carry
# asm 1: cmovc <addt1=int64#12,<addt0=int64#11
# asm 2: cmovc <addt1=%r14,<addt0=%r13
cmovc %r14,%r13
# qhasm: rz0 += addt0
# asm 1: add <addt0=int64#11,<rz0=int64#7
# asm 2: add <addt0=%r13,<rz0=%rax
add %r13,%rax
# qhasm: *(uint64 *) (rp + 32) = rz0
# asm 1: movq <rz0=int64#7,32(<rp=int64#1)
# asm 2: movq <rz0=%rax,32(<rp=%rdi)
movq %rax,32(%rdi)
# qhasm: *(uint64 *) (rp + 40) = rz1
# asm 1: movq <rz1=int64#8,40(<rp=int64#1)
# asm 2: movq <rz1=%r10,40(<rp=%rdi)
movq %r10,40(%rdi)
# qhasm: *(uint64 *) (rp + 48) = rz2
# asm 1: movq <rz2=int64#9,48(<rp=int64#1)
# asm 2: movq <rz2=%r11,48(<rp=%rdi)
movq %r11,48(%rdi)
# qhasm: *(uint64 *) (rp + 56) = rz3
# asm 1: movq <rz3=int64#10,56(<rp=int64#1)
# asm 2: movq <rz3=%r12,56(<rp=%rdi)
movq %r12,56(%rdi)
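# Editorial note: next, d -= b (mod p), with the conditional
# subtract-38 borrow fix-up; the result goes to rp+64..88.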
# qhasm: carry? d0 -= b0_stack
# asm 1: subq <b0_stack=stack64#12,<d0=int64#3
# asm 2: subq <b0_stack=88(%rsp),<d0=%rdx
subq 88(%rsp),%rdx
# qhasm: carry? d1 -= b1_stack - carry
# asm 1: sbbq <b1_stack=stack64#13,<d1=int64#4
# asm 2: sbbq <b1_stack=96(%rsp),<d1=%rcx
sbbq 96(%rsp),%rcx
# qhasm: carry? d2 -= b2_stack - carry
# asm 1: sbbq <b2_stack=stack64#14,<d2=int64#5
# asm 2: sbbq <b2_stack=104(%rsp),<d2=%r8
sbbq 104(%rsp),%r8
# qhasm: carry? d3 -= b3_stack - carry
# asm 1: sbbq <b3_stack=stack64#15,<d3=int64#6
# asm 2: sbbq <b3_stack=112(%rsp),<d3=%r9
sbbq 112(%rsp),%r9
# qhasm: subt0 = 0
# asm 1: mov $0,>subt0=int64#11
# asm 2: mov $0,>subt0=%r13
mov $0,%r13
# qhasm: subt1 = 38
# asm 1: mov $38,>subt1=int64#12
# asm 2: mov $38,>subt1=%r14
mov $38,%r14
# qhasm: subt1 = subt0 if !carry
# asm 1: cmovae <subt0=int64#11,<subt1=int64#12
# asm 2: cmovae <subt0=%r13,<subt1=%r14
cmovae %r13,%r14
# qhasm: carry? d0 -= subt1
# asm 1: sub <subt1=int64#12,<d0=int64#3
# asm 2: sub <subt1=%r14,<d0=%rdx
sub %r14,%rdx
# qhasm: carry? d1 -= subt0 - carry
# asm 1: sbb <subt0=int64#11,<d1=int64#4
# asm 2: sbb <subt0=%r13,<d1=%rcx
sbb %r13,%rcx
# qhasm: carry? d2 -= subt0 - carry
# asm 1: sbb <subt0=int64#11,<d2=int64#5
# asm 2: sbb <subt0=%r13,<d2=%r8
sbb %r13,%r8
# qhasm: carry? d3 -= subt0 - carry
# asm 1: sbb <subt0=int64#11,<d3=int64#6
# asm 2: sbb <subt0=%r13,<d3=%r9
sbb %r13,%r9
# qhasm: subt0 = subt1 if carry
# asm 1: cmovc <subt1=int64#12,<subt0=int64#11
# asm 2: cmovc <subt1=%r14,<subt0=%r13
cmovc %r14,%r13
# qhasm: d0 -= subt0
# asm 1: sub <subt0=int64#11,<d0=int64#3
# asm 2: sub <subt0=%r13,<d0=%rdx
sub %r13,%rdx
# qhasm: *(uint64 *)(rp + 64) = d0
# asm 1: movq <d0=int64#3,64(<rp=int64#1)
# asm 2: movq <d0=%rdx,64(<rp=%rdi)
movq %rdx,64(%rdi)
# qhasm: *(uint64 *)(rp + 72) = d1
# asm 1: movq <d1=int64#4,72(<rp=int64#1)
# asm 2: movq <d1=%rcx,72(<rp=%rdi)
movq %rcx,72(%rdi)
# qhasm: *(uint64 *)(rp + 80) = d2
# asm 1: movq <d2=int64#5,80(<rp=int64#1)
# asm 2: movq <d2=%r8,80(<rp=%rdi)
movq %r8,80(%rdi)
# qhasm: *(uint64 *)(rp + 88) = d3
# asm 1: movq <d3=int64#6,88(<rp=int64#1)
# asm 2: movq <d3=%r9,88(<rp=%rdi)
movq %r9,88(%rdi)
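# Editorial note: now rz -= c (mod p), with the same conditional
# subtract-38 borrow fix-up; the result goes to rp+96..120.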
# qhasm: carry? rz0 -= c0_stack
# asm 1: subq <c0_stack=stack64#16,<rz0=int64#7
# asm 2: subq <c0_stack=120(%rsp),<rz0=%rax
subq 120(%rsp),%rax
# qhasm: carry? rz1 -= c1_stack - carry
# asm 1: sbbq <c1_stack=stack64#17,<rz1=int64#8
# asm 2: sbbq <c1_stack=128(%rsp),<rz1=%r10
sbbq 128(%rsp),%r10
# qhasm: carry? rz2 -= c2_stack - carry
# asm 1: sbbq <c2_stack=stack64#18,<rz2=int64#9
# asm 2: sbbq <c2_stack=136(%rsp),<rz2=%r11
sbbq 136(%rsp),%r11
# qhasm: carry? rz3 -= c3_stack - carry
# asm 1: sbbq <c3_stack=stack64#19,<rz3=int64#10
# asm 2: sbbq <c3_stack=144(%rsp),<rz3=%r12
sbbq 144(%rsp),%r12
# qhasm: subt0 = 0
# asm 1: mov $0,>subt0=int64#3
# asm 2: mov $0,>subt0=%rdx
mov $0,%rdx
# qhasm: subt1 = 38
# asm 1: mov $38,>subt1=int64#4
# asm 2: mov $38,>subt1=%rcx
mov $38,%rcx
# qhasm: subt1 = subt0 if !carry
# asm 1: cmovae <subt0=int64#3,<subt1=int64#4
# asm 2: cmovae <subt0=%rdx,<subt1=%rcx
cmovae %rdx,%rcx
# qhasm: carry? rz0 -= subt1
# asm 1: sub <subt1=int64#4,<rz0=int64#7
# asm 2: sub <subt1=%rcx,<rz0=%rax
sub %rcx,%rax
# qhasm: carry? rz1 -= subt0 - carry
# asm 1: sbb <subt0=int64#3,<rz1=int64#8
# asm 2: sbb <subt0=%rdx,<rz1=%r10
sbb %rdx,%r10
# qhasm: carry? rz2 -= subt0 - carry
# asm 1: sbb <subt0=int64#3,<rz2=int64#9
# asm 2: sbb <subt0=%rdx,<rz2=%r11
sbb %rdx,%r11
# qhasm: carry? rz3 -= subt0 - carry
# asm 1: sbb <subt0=int64#3,<rz3=int64#10
# asm 2: sbb <subt0=%rdx,<rz3=%r12
sbb %rdx,%r12
# qhasm: subt0 = subt1 if carry
# asm 1: cmovc <subt1=int64#4,<subt0=int64#3
# asm 2: cmovc <subt1=%rcx,<subt0=%rdx
cmovc %rcx,%rdx
# qhasm: rz0 -= subt0
# asm 1: sub <subt0=int64#3,<rz0=int64#7
# asm 2: sub <subt0=%rdx,<rz0=%rax
sub %rdx,%rax
# qhasm: *(uint64 *) (rp + 96) = rz0
# asm 1: movq <rz0=int64#7,96(<rp=int64#1)
# asm 2: movq <rz0=%rax,96(<rp=%rdi)
movq %rax,96(%rdi)
# qhasm: *(uint64 *) (rp + 104) = rz1
# asm 1: movq <rz1=int64#8,104(<rp=int64#1)
# asm 2: movq <rz1=%r10,104(<rp=%rdi)
movq %r10,104(%rdi)
# qhasm: *(uint64 *) (rp + 112) = rz2
# asm 1: movq <rz2=int64#9,112(<rp=int64#1)
# asm 2: movq <rz2=%r11,112(<rp=%rdi)
movq %r11,112(%rdi)
# qhasm: *(uint64 *) (rp + 120) = rz3
# asm 1: movq <rz3=int64#10,120(<rp=int64#1)
# asm 2: movq <rz3=%r12,120(<rp=%rdi)
movq %r12,120(%rdi)
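# Editorial note: rx is computed as the sum of the field elements at
# pp+0..24 and pp+32..56, folding the carry with the conditional add-38
# trick. The loads below are the last reads through pp (%rsi), so that
# register is reused as scratch afterwards.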
# qhasm: rx0 = *(uint64 *)(pp + 0)
# asm 1: movq 0(<pp=int64#2),>rx0=int64#3
# asm 2: movq 0(<pp=%rsi),>rx0=%rdx
movq 0(%rsi),%rdx
# qhasm: rx1 = *(uint64 *)(pp + 8)
# asm 1: movq 8(<pp=int64#2),>rx1=int64#4
# asm 2: movq 8(<pp=%rsi),>rx1=%rcx
movq 8(%rsi),%rcx
# qhasm: rx2 = *(uint64 *)(pp + 16)
# asm 1: movq 16(<pp=int64#2),>rx2=int64#5
# asm 2: movq 16(<pp=%rsi),>rx2=%r8
movq 16(%rsi),%r8
# qhasm: rx3 = *(uint64 *)(pp + 24)
# asm 1: movq 24(<pp=int64#2),>rx3=int64#6
# asm 2: movq 24(<pp=%rsi),>rx3=%r9
movq 24(%rsi),%r9
# qhasm: carry? rx0 += *(uint64 *)(pp + 32)
# asm 1: addq 32(<pp=int64#2),<rx0=int64#3
# asm 2: addq 32(<pp=%rsi),<rx0=%rdx
addq 32(%rsi),%rdx
# qhasm: carry? rx1 += *(uint64 *)(pp + 40) + carry
# asm 1: adcq 40(<pp=int64#2),<rx1=int64#4
# asm 2: adcq 40(<pp=%rsi),<rx1=%rcx
adcq 40(%rsi),%rcx
# qhasm: carry? rx2 += *(uint64 *)(pp + 48) + carry
# asm 1: adcq 48(<pp=int64#2),<rx2=int64#5
# asm 2: adcq 48(<pp=%rsi),<rx2=%r8
adcq 48(%rsi),%r8
# qhasm: carry? rx3 += *(uint64 *)(pp + 56) + carry
# asm 1: adcq 56(<pp=int64#2),<rx3=int64#6
# asm 2: adcq 56(<pp=%rsi),<rx3=%r9
adcq 56(%rsi),%r9
# qhasm: addt0 = 0
# asm 1: mov $0,>addt0=int64#2
# asm 2: mov $0,>addt0=%rsi
mov $0,%rsi
# qhasm: addt1 = 38
# asm 1: mov $38,>addt1=int64#7
# asm 2: mov $38,>addt1=%rax
mov $38,%rax
# qhasm: addt1 = addt0 if !carry
# asm 1: cmovae <addt0=int64#2,<addt1=int64#7
# asm 2: cmovae <addt0=%rsi,<addt1=%rax
cmovae %rsi,%rax
# qhasm: carry? rx0 += addt1
# asm 1: add <addt1=int64#7,<rx0=int64#3
# asm 2: add <addt1=%rax,<rx0=%rdx
add %rax,%rdx
# qhasm: carry? rx1 += addt0 + carry
# asm 1: adc <addt0=int64#2,<rx1=int64#4
# asm 2: adc <addt0=%rsi,<rx1=%rcx
adc %rsi,%rcx
# qhasm: carry? rx2 += addt0 + carry
# asm 1: adc <addt0=int64#2,<rx2=int64#5
# asm 2: adc <addt0=%rsi,<rx2=%r8
adc %rsi,%r8
# qhasm: carry? rx3 += addt0 + carry
# asm 1: adc <addt0=int64#2,<rx3=int64#6
# asm 2: adc <addt0=%rsi,<rx3=%r9
adc %rsi,%r9
# qhasm: addt0 = addt1 if carry
# asm 1: cmovc <addt1=int64#7,<addt0=int64#2
# asm 2: cmovc <addt1=%rax,<addt0=%rsi
cmovc %rax,%rsi
# qhasm: rx0 += addt0
# asm 1: add <addt0=int64#2,<rx0=int64#3
# asm 2: add <addt0=%rsi,<rx0=%rdx
add %rsi,%rdx
# qhasm: rx0_stack = rx0
# asm 1: movq <rx0=int64#3,>rx0_stack=stack64#12
# asm 2: movq <rx0=%rdx,>rx0_stack=88(%rsp)
movq %rdx,88(%rsp)
# qhasm: rx1_stack = rx1
# asm 1: movq <rx1=int64#4,>rx1_stack=stack64#13
# asm 2: movq <rx1=%rcx,>rx1_stack=96(%rsp)
movq %rcx,96(%rsp)
# qhasm: rx2_stack = rx2
# asm 1: movq <rx2=int64#5,>rx2_stack=stack64#14
# asm 2: movq <rx2=%r8,>rx2_stack=104(%rsp)
movq %r8,104(%rsp)
# qhasm: rx3_stack = rx3
# asm 1: movq <rx3=int64#6,>rx3_stack=stack64#15
# asm 2: movq <rx3=%r9,>rx3_stack=112(%rsp)
movq %r9,112(%rsp)
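# Editorial note: square rx. The mulq's below form the off-diagonal
# products rx_i*rx_j (i > j), the add/adc chain doubles them, and the
# diagonal squares rx_i^2 are then added in, before the same 38-based
# reduction as above.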
# qhasm: squarer7 = 0
# asm 1: mov $0,>squarer7=int64#2
# asm 2: mov $0,>squarer7=%rsi
mov $0,%rsi
# qhasm: squarerax = rx1_stack
# asm 1: movq <rx1_stack=stack64#13,>squarerax=int64#7
# asm 2: movq <rx1_stack=96(%rsp),>squarerax=%rax
movq 96(%rsp),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * rx0_stack
# asm 1: mulq <rx0_stack=stack64#12
# asm 2: mulq <rx0_stack=88(%rsp)
mulq 88(%rsp)
# qhasm: rx1 = squarerax
# asm 1: mov <squarerax=int64#7,>rx1=int64#4
# asm 2: mov <squarerax=%rax,>rx1=%rcx
mov %rax,%rcx
# qhasm: rx2 = squarerdx
# asm 1: mov <squarerdx=int64#3,>rx2=int64#5
# asm 2: mov <squarerdx=%rdx,>rx2=%r8
mov %rdx,%r8
# qhasm: squarerax = rx2_stack
# asm 1: movq <rx2_stack=stack64#14,>squarerax=int64#7
# asm 2: movq <rx2_stack=104(%rsp),>squarerax=%rax
movq 104(%rsp),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * rx1_stack
# asm 1: mulq <rx1_stack=stack64#13
# asm 2: mulq <rx1_stack=96(%rsp)
mulq 96(%rsp)
# qhasm: rx3 = squarerax
# asm 1: mov <squarerax=int64#7,>rx3=int64#6
# asm 2: mov <squarerax=%rax,>rx3=%r9
mov %rax,%r9
# qhasm: squarer4 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squarer4=int64#8
# asm 2: mov <squarerdx=%rdx,>squarer4=%r10
mov %rdx,%r10
# qhasm: squarerax = rx3_stack
# asm 1: movq <rx3_stack=stack64#15,>squarerax=int64#7
# asm 2: movq <rx3_stack=112(%rsp),>squarerax=%rax
movq 112(%rsp),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * rx2_stack
# asm 1: mulq <rx2_stack=stack64#14
# asm 2: mulq <rx2_stack=104(%rsp)
mulq 104(%rsp)
# qhasm: squarer5 = squarerax
# asm 1: mov <squarerax=int64#7,>squarer5=int64#9
# asm 2: mov <squarerax=%rax,>squarer5=%r11
mov %rax,%r11
# qhasm: squarer6 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squarer6=int64#10
# asm 2: mov <squarerdx=%rdx,>squarer6=%r12
mov %rdx,%r12
# qhasm: squarerax = rx2_stack
# asm 1: movq <rx2_stack=stack64#14,>squarerax=int64#7
# asm 2: movq <rx2_stack=104(%rsp),>squarerax=%rax
movq 104(%rsp),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * rx0_stack
# asm 1: mulq <rx0_stack=stack64#12
# asm 2: mulq <rx0_stack=88(%rsp)
mulq 88(%rsp)
# qhasm: carry? rx2 += squarerax
# asm 1: add <squarerax=int64#7,<rx2=int64#5
# asm 2: add <squarerax=%rax,<rx2=%r8
add %rax,%r8
# qhasm: carry? rx3 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<rx3=int64#6
# asm 2: adc <squarerdx=%rdx,<rx3=%r9
adc %rdx,%r9
# qhasm: squarer4 += 0 + carry
# asm 1: adc $0,<squarer4=int64#8
# asm 2: adc $0,<squarer4=%r10
adc $0,%r10
# qhasm: squarerax = rx3_stack
# asm 1: movq <rx3_stack=stack64#15,>squarerax=int64#7
# asm 2: movq <rx3_stack=112(%rsp),>squarerax=%rax
movq 112(%rsp),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * rx1_stack
# asm 1: mulq <rx1_stack=stack64#13
# asm 2: mulq <rx1_stack=96(%rsp)
mulq 96(%rsp)
# qhasm: carry? squarer4 += squarerax
# asm 1: add <squarerax=int64#7,<squarer4=int64#8
# asm 2: add <squarerax=%rax,<squarer4=%r10
add %rax,%r10
# qhasm: carry? squarer5 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer5=int64#9
# asm 2: adc <squarerdx=%rdx,<squarer5=%r11
adc %rdx,%r11
# qhasm: squarer6 += 0 + carry
# asm 1: adc $0,<squarer6=int64#10
# asm 2: adc $0,<squarer6=%r12
adc $0,%r12
# qhasm: squarerax = rx3_stack
# asm 1: movq <rx3_stack=stack64#15,>squarerax=int64#7
# asm 2: movq <rx3_stack=112(%rsp),>squarerax=%rax
movq 112(%rsp),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * rx0_stack
# asm 1: mulq <rx0_stack=stack64#12
# asm 2: mulq <rx0_stack=88(%rsp)
mulq 88(%rsp)
# qhasm: carry? rx3 += squarerax
# asm 1: add <squarerax=int64#7,<rx3=int64#6
# asm 2: add <squarerax=%rax,<rx3=%r9
add %rax,%r9
# qhasm: carry? squarer4 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer4=int64#8
# asm 2: adc <squarerdx=%rdx,<squarer4=%r10
adc %rdx,%r10
# qhasm: carry? squarer5 += 0 + carry
# asm 1: adc $0,<squarer5=int64#9
# asm 2: adc $0,<squarer5=%r11
adc $0,%r11
# qhasm: carry? squarer6 += 0 + carry
# asm 1: adc $0,<squarer6=int64#10
# asm 2: adc $0,<squarer6=%r12
adc $0,%r12
# qhasm: squarer7 += 0 + carry
# asm 1: adc $0,<squarer7=int64#2
# asm 2: adc $0,<squarer7=%rsi
adc $0,%rsi
# qhasm: carry? rx1 += rx1
# asm 1: add <rx1=int64#4,<rx1=int64#4
# asm 2: add <rx1=%rcx,<rx1=%rcx
add %rcx,%rcx
# qhasm: carry? rx2 += rx2 + carry
# asm 1: adc <rx2=int64#5,<rx2=int64#5
# asm 2: adc <rx2=%r8,<rx2=%r8
adc %r8,%r8
# qhasm: carry? rx3 += rx3 + carry
# asm 1: adc <rx3=int64#6,<rx3=int64#6
# asm 2: adc <rx3=%r9,<rx3=%r9
adc %r9,%r9
# qhasm: carry? squarer4 += squarer4 + carry
# asm 1: adc <squarer4=int64#8,<squarer4=int64#8
# asm 2: adc <squarer4=%r10,<squarer4=%r10
adc %r10,%r10
# qhasm: carry? squarer5 += squarer5 + carry
# asm 1: adc <squarer5=int64#9,<squarer5=int64#9
# asm 2: adc <squarer5=%r11,<squarer5=%r11
adc %r11,%r11
# qhasm: carry? squarer6 += squarer6 + carry
# asm 1: adc <squarer6=int64#10,<squarer6=int64#10
# asm 2: adc <squarer6=%r12,<squarer6=%r12
adc %r12,%r12
# qhasm: squarer7 += squarer7 + carry
# asm 1: adc <squarer7=int64#2,<squarer7=int64#2
# asm 2: adc <squarer7=%rsi,<squarer7=%rsi
adc %rsi,%rsi
# qhasm: squarerax = rx0_stack
# asm 1: movq <rx0_stack=stack64#12,>squarerax=int64#7
# asm 2: movq <rx0_stack=88(%rsp),>squarerax=%rax
movq 88(%rsp),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * rx0_stack
# asm 1: mulq <rx0_stack=stack64#12
# asm 2: mulq <rx0_stack=88(%rsp)
mulq 88(%rsp)
# qhasm: rx0 = squarerax
# asm 1: mov <squarerax=int64#7,>rx0=int64#11
# asm 2: mov <squarerax=%rax,>rx0=%r13
mov %rax,%r13
# qhasm: squaret1 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squaret1=int64#12
# asm 2: mov <squarerdx=%rdx,>squaret1=%r14
mov %rdx,%r14
# qhasm: squarerax = rx1_stack
# asm 1: movq <rx1_stack=stack64#13,>squarerax=int64#7
# asm 2: movq <rx1_stack=96(%rsp),>squarerax=%rax
movq 96(%rsp),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * rx1_stack
# asm 1: mulq <rx1_stack=stack64#13
# asm 2: mulq <rx1_stack=96(%rsp)
mulq 96(%rsp)
# qhasm: squaret2 = squarerax
# asm 1: mov <squarerax=int64#7,>squaret2=int64#13
# asm 2: mov <squarerax=%rax,>squaret2=%r15
mov %rax,%r15
# qhasm: squaret3 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squaret3=int64#14
# asm 2: mov <squarerdx=%rdx,>squaret3=%rbx
mov %rdx,%rbx
# qhasm: squarerax = rx2_stack
# asm 1: movq <rx2_stack=stack64#14,>squarerax=int64#7
# asm 2: movq <rx2_stack=104(%rsp),>squarerax=%rax
movq 104(%rsp),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * rx2_stack
# asm 1: mulq <rx2_stack=stack64#14
# asm 2: mulq <rx2_stack=104(%rsp)
mulq 104(%rsp)
# qhasm: carry? rx1 += squaret1
# asm 1: add <squaret1=int64#12,<rx1=int64#4
# asm 2: add <squaret1=%r14,<rx1=%rcx
add %r14,%rcx
# qhasm: carry? rx2 += squaret2 + carry
# asm 1: adc <squaret2=int64#13,<rx2=int64#5
# asm 2: adc <squaret2=%r15,<rx2=%r8
adc %r15,%r8
# qhasm: carry? rx3 += squaret3 + carry
# asm 1: adc <squaret3=int64#14,<rx3=int64#6
# asm 2: adc <squaret3=%rbx,<rx3=%r9
adc %rbx,%r9
# qhasm: carry? squarer4 += squarerax + carry
# asm 1: adc <squarerax=int64#7,<squarer4=int64#8
# asm 2: adc <squarerax=%rax,<squarer4=%r10
adc %rax,%r10
# qhasm: carry? squarer5 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer5=int64#9
# asm 2: adc <squarerdx=%rdx,<squarer5=%r11
adc %rdx,%r11
# qhasm: carry? squarer6 += 0 + carry
# asm 1: adc $0,<squarer6=int64#10
# asm 2: adc $0,<squarer6=%r12
adc $0,%r12
# qhasm: squarer7 += 0 + carry
# asm 1: adc $0,<squarer7=int64#2
# asm 2: adc $0,<squarer7=%rsi
adc $0,%rsi
# qhasm: squarerax = rx3_stack
# asm 1: movq <rx3_stack=stack64#15,>squarerax=int64#7
# asm 2: movq <rx3_stack=112(%rsp),>squarerax=%rax
movq 112(%rsp),%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * rx3_stack
# asm 1: mulq <rx3_stack=stack64#15
# asm 2: mulq <rx3_stack=112(%rsp)
mulq 112(%rsp)
# qhasm: carry? squarer6 += squarerax
# asm 1: add <squarerax=int64#7,<squarer6=int64#10
# asm 2: add <squarerax=%rax,<squarer6=%r12
add %rax,%r12
# qhasm: squarer7 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer7=int64#2
# asm 2: adc <squarerdx=%rdx,<squarer7=%rsi
adc %rdx,%rsi
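# Editorial note: reduce the 512-bit square mod p exactly as before:
# multiply the high limbs squarer4..squarer7 by 38 and fold them into
# rx0..rx3, with squarer8 catching the top carry.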
# qhasm: squarerax = squarer4
# asm 1: mov <squarer4=int64#8,>squarerax=int64#7
# asm 2: mov <squarer4=%r10,>squarerax=%rax
mov %r10,%rax
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)&CRYPTO_NAMESPACE(38)
mulq CRYPTO_NAMESPACE(38)(%rip)
# qhasm: squarer4 = squarerax
# asm 1: mov <squarerax=int64#7,>squarer4=int64#8
# asm 2: mov <squarerax=%rax,>squarer4=%r10
mov %rax,%r10
# qhasm: squarerax = squarer5
# asm 1: mov <squarer5=int64#9,>squarerax=int64#7
# asm 2: mov <squarer5=%r11,>squarerax=%rax
mov %r11,%rax
# qhasm: squarer5 = squarerdx
# asm 1: mov <squarerdx=int64#3,>squarer5=int64#9
# asm 2: mov <squarerdx=%rdx,>squarer5=%r11
mov %rdx,%r11
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)&CRYPTO_NAMESPACE(38)
mulq CRYPTO_NAMESPACE(38)(%rip)
# qhasm: carry? squarer5 += squarerax
# asm 1: add <squarerax=int64#7,<squarer5=int64#9
# asm 2: add <squarerax=%rax,<squarer5=%r11
add %rax,%r11
# qhasm: squarerax = squarer6
# asm 1: mov <squarer6=int64#10,>squarerax=int64#7
# asm 2: mov <squarer6=%r12,>squarerax=%rax
mov %r12,%rax
# qhasm: squarer6 = 0
# asm 1: mov $0,>squarer6=int64#10
# asm 2: mov $0,>squarer6=%r12
mov $0,%r12
# qhasm: squarer6 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer6=int64#10
# asm 2: adc <squarerdx=%rdx,<squarer6=%r12
adc %rdx,%r12
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)&CRYPTO_NAMESPACE(38)
mulq CRYPTO_NAMESPACE(38)(%rip)
# qhasm: carry? squarer6 += squarerax
# asm 1: add <squarerax=int64#7,<squarer6=int64#10
# asm 2: add <squarerax=%rax,<squarer6=%r12
add %rax,%r12
# qhasm: squarerax = squarer7
# asm 1: mov <squarer7=int64#2,>squarerax=int64#7
# asm 2: mov <squarer7=%rsi,>squarerax=%rax
mov %rsi,%rax
# qhasm: squarer7 = 0
# asm 1: mov $0,>squarer7=int64#2
# asm 2: mov $0,>squarer7=%rsi
mov $0,%rsi
# qhasm: squarer7 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer7=int64#2
# asm 2: adc <squarerdx=%rdx,<squarer7=%rsi
adc %rdx,%rsi
# qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)&CRYPTO_NAMESPACE(38)
mulq CRYPTO_NAMESPACE(38)(%rip)
# qhasm: carry? squarer7 += squarerax
# asm 1: add <squarerax=int64#7,<squarer7=int64#2
# asm 2: add <squarerax=%rax,<squarer7=%rsi
add %rax,%rsi
# qhasm: squarer8 = 0
# asm 1: mov $0,>squarer8=int64#7
# asm 2: mov $0,>squarer8=%rax
mov $0,%rax
# qhasm: squarer8 += squarerdx + carry
# asm 1: adc <squarerdx=int64#3,<squarer8=int64#7
# asm 2: adc <squarerdx=%rdx,<squarer8=%rax
adc %rdx,%rax
# qhasm: carry? rx0 += squarer4
# asm 1: add <squarer4=int64#8,<rx0=int64#11
# asm 2: add <squarer4=%r10,<rx0=%r13
add %r10,%r13
# qhasm: carry? rx1 += squarer5 + carry
# asm 1: adc <squarer5=int64#9,<rx1=int64#4
# asm 2: adc <squarer5=%r11,<rx1=%rcx
adc %r11,%rcx
# qhasm: carry? rx2 += squarer6 + carry
# asm 1: adc <squarer6=int64#10,<rx2=int64#5
# asm 2: adc <squarer6=%r12,<rx2=%r8
adc %r12,%r8
# qhasm: carry? rx3 += squarer7 + carry
# asm 1: adc <squarer7=int64#2,<rx3=int64#6
# asm 2: adc <squarer7=%rsi,<rx3=%r9
adc %rsi,%r9
# qhasm: squarezero = 0
# asm 1: mov $0,>squarezero=int64#2
# asm 2: mov $0,>squarezero=%rsi
mov $0,%rsi
# qhasm: squarer8 += squarezero + carry
# asm 1: adc <squarezero=int64#2,<squarer8=int64#7
# asm 2: adc <squarezero=%rsi,<squarer8=%rax
adc %rsi,%rax
# qhasm: squarer8 *= 38
# asm 1: imulq $38,<squarer8=int64#7,>squarer8=int64#3
# asm 2: imulq $38,<squarer8=%rax,>squarer8=%rdx
imulq $38,%rax,%rdx
# qhasm: carry? rx0 += squarer8
# asm 1: add <squarer8=int64#3,<rx0=int64#11
# asm 2: add <squarer8=%rdx,<rx0=%r13
add %rdx,%r13
# qhasm: carry? rx1 += squarezero + carry
# asm 1: adc <squarezero=int64#2,<rx1=int64#4
# asm 2: adc <squarezero=%rsi,<rx1=%rcx
adc %rsi,%rcx
# qhasm: carry? rx2 += squarezero + carry
# asm 1: adc <squarezero=int64#2,<rx2=int64#5
# asm 2: adc <squarezero=%rsi,<rx2=%r8
adc %rsi,%r8
# qhasm: carry? rx3 += squarezero + carry
# asm 1: adc <squarezero=int64#2,<rx3=int64#6
# asm 2: adc <squarezero=%rsi,<rx3=%r9
adc %rsi,%r9
# qhasm: squarezero += squarezero + carry
# asm 1: adc <squarezero=int64#2,<squarezero=int64#2
# asm 2: adc <squarezero=%rsi,<squarezero=%rsi
adc %rsi,%rsi
# qhasm: squarezero *= 38
# asm 1: imulq $38,<squarezero=int64#2,>squarezero=int64#2
# asm 2: imulq $38,<squarezero=%rsi,>squarezero=%rsi
imulq $38,%rsi,%rsi
# qhasm: rx0 += squarezero
# asm 1: add <squarezero=int64#2,<rx0=int64#11
# asm 2: add <squarezero=%rsi,<rx0=%r13
add %rsi,%r13
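# Editorial note: rx now holds the reduced square. The spilled d and
# then e are added in, each a 256-bit add followed by the conditional
# add-38 carry fold; the final rx is written to rp+0..24.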
# qhasm: carry? rx0 += d0_stack
# asm 1: addq <d0_stack=stack64#8,<rx0=int64#11
# asm 2: addq <d0_stack=56(%rsp),<rx0=%r13
addq 56(%rsp),%r13
# qhasm: carry? rx1 += d1_stack + carry
# asm 1: adcq <d1_stack=stack64#9,<rx1=int64#4
# asm 2: adcq <d1_stack=64(%rsp),<rx1=%rcx
adcq 64(%rsp),%rcx
# qhasm: carry? rx2 += d2_stack + carry
# asm 1: adcq <d2_stack=stack64#10,<rx2=int64#5
# asm 2: adcq <d2_stack=72(%rsp),<rx2=%r8
adcq 72(%rsp),%r8
# qhasm: carry? rx3 += d3_stack + carry
# asm 1: adcq <d3_stack=stack64#11,<rx3=int64#6
# asm 2: adcq <d3_stack=80(%rsp),<rx3=%r9
adcq 80(%rsp),%r9
# qhasm: addt0 = 0
# asm 1: mov $0,>addt0=int64#2
# asm 2: mov $0,>addt0=%rsi
mov $0,%rsi
# qhasm: addt1 = 38
# asm 1: mov $38,>addt1=int64#3
# asm 2: mov $38,>addt1=%rdx
mov $38,%rdx
# qhasm: addt1 = addt0 if !carry
# asm 1: cmovae <addt0=int64#2,<addt1=int64#3
# asm 2: cmovae <addt0=%rsi,<addt1=%rdx
cmovae %rsi,%rdx
# qhasm: carry? rx0 += addt1
# asm 1: add <addt1=int64#3,<rx0=int64#11
# asm 2: add <addt1=%rdx,<rx0=%r13
add %rdx,%r13
# qhasm: carry? rx1 += addt0 + carry
# asm 1: adc <addt0=int64#2,<rx1=int64#4
# asm 2: adc <addt0=%rsi,<rx1=%rcx
adc %rsi,%rcx
# qhasm: carry? rx2 += addt0 + carry
# asm 1: adc <addt0=int64#2,<rx2=int64#5
# asm 2: adc <addt0=%rsi,<rx2=%r8
adc %rsi,%r8
# qhasm: carry? rx3 += addt0 + carry
# asm 1: adc <addt0=int64#2,<rx3=int64#6
# asm 2: adc <addt0=%rsi,<rx3=%r9
adc %rsi,%r9
# qhasm: addt0 = addt1 if carry
# asm 1: cmovc <addt1=int64#3,<addt0=int64#2
# asm 2: cmovc <addt1=%rdx,<addt0=%rsi
cmovc %rdx,%rsi
# qhasm: rx0 += addt0
# asm 1: add <addt0=int64#2,<rx0=int64#11
# asm 2: add <addt0=%rsi,<rx0=%r13
add %rsi,%r13
# qhasm: carry? rx0 += e0_stack
# asm 1: addq <e0_stack=stack64#20,<rx0=int64#11
# asm 2: addq <e0_stack=152(%rsp),<rx0=%r13
addq 152(%rsp),%r13
# qhasm: carry? rx1 += e1_stack + carry
# asm 1: adcq <e1_stack=stack64#21,<rx1=int64#4
# asm 2: adcq <e1_stack=160(%rsp),<rx1=%rcx
adcq 160(%rsp),%rcx
# qhasm: carry? rx2 += e2_stack + carry
# asm 1: adcq <e2_stack=stack64#22,<rx2=int64#5
# asm 2: adcq <e2_stack=168(%rsp),<rx2=%r8
adcq 168(%rsp),%r8
# qhasm: carry? rx3 += e3_stack + carry
# asm 1: adcq <e3_stack=stack64#23,<rx3=int64#6
# asm 2: adcq <e3_stack=176(%rsp),<rx3=%r9
adcq 176(%rsp),%r9
# qhasm: addt0 = 0
# asm 1: mov $0,>addt0=int64#2
# asm 2: mov $0,>addt0=%rsi
mov $0,%rsi
# qhasm: addt1 = 38
# asm 1: mov $38,>addt1=int64#3
# asm 2: mov $38,>addt1=%rdx
mov $38,%rdx
# qhasm: addt1 = addt0 if !carry
# asm 1: cmovae <addt0=int64#2,<addt1=int64#3
# asm 2: cmovae <addt0=%rsi,<addt1=%rdx
cmovae %rsi,%rdx
# qhasm: carry? rx0 += addt1
# asm 1: add <addt1=int64#3,<rx0=int64#11
# asm 2: add <addt1=%rdx,<rx0=%r13
add %rdx,%r13
# qhasm: carry? rx1 += addt0 + carry
# asm 1: adc <addt0=int64#2,<rx1=int64#4
# asm 2: adc <addt0=%rsi,<rx1=%rcx
adc %rsi,%rcx
# qhasm: carry? rx2 += addt0 + carry
# asm 1: adc <addt0=int64#2,<rx2=int64#5
# asm 2: adc <addt0=%rsi,<rx2=%r8
adc %rsi,%r8
# qhasm: carry? rx3 += addt0 + carry
# asm 1: adc <addt0=int64#2,<rx3=int64#6
# asm 2: adc <addt0=%rsi,<rx3=%r9
adc %rsi,%r9
# qhasm: addt0 = addt1 if carry
# asm 1: cmovc <addt1=int64#3,<addt0=int64#2
# asm 2: cmovc <addt1=%rdx,<addt0=%rsi
cmovc %rdx,%rsi
# qhasm: rx0 += addt0
# asm 1: add <addt0=int64#2,<rx0=int64#11
# asm 2: add <addt0=%rsi,<rx0=%r13
add %rsi,%r13
# qhasm: *(uint64 *)(rp + 0) = rx0
# asm 1: movq <rx0=int64#11,0(<rp=int64#1)
# asm 2: movq <rx0=%r13,0(<rp=%rdi)
movq %r13,0(%rdi)
# qhasm: *(uint64 *)(rp + 8) = rx1
# asm 1: movq <rx1=int64#4,8(<rp=int64#1)
# asm 2: movq <rx1=%rcx,8(<rp=%rdi)
movq %rcx,8(%rdi)
# qhasm: *(uint64 *)(rp + 16) = rx2
# asm 1: movq <rx2=int64#5,16(<rp=int64#1)
# asm 2: movq <rx2=%r8,16(<rp=%rdi)
movq %r8,16(%rdi)
# qhasm: *(uint64 *)(rp + 24) = rx3
# asm 1: movq <rx3=int64#6,24(<rp=int64#1)
# asm 2: movq <rx3=%r9,24(<rp=%rdi)
movq %r9,24(%rdi)
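# Editorial note: epilogue; restore the caller's registers saved in the
# prologue, unwind the stack frame, and return.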
# qhasm: caller1 = caller1_stack
# asm 1: movq <caller1_stack=stack64#1,>caller1=int64#9
# asm 2: movq <caller1_stack=0(%rsp),>caller1=%r11
movq 0(%rsp),%r11
# qhasm: caller2 = caller2_stack
# asm 1: movq <caller2_stack=stack64#2,>caller2=int64#10
# asm 2: movq <caller2_stack=8(%rsp),>caller2=%r12
movq 8(%rsp),%r12
# qhasm: caller3 = caller3_stack
# asm 1: movq <caller3_stack=stack64#3,>caller3=int64#11
# asm 2: movq <caller3_stack=16(%rsp),>caller3=%r13
movq 16(%rsp),%r13
# qhasm: caller4 = caller4_stack
# asm 1: movq <caller4_stack=stack64#4,>caller4=int64#12
# asm 2: movq <caller4_stack=24(%rsp),>caller4=%r14
movq 24(%rsp),%r14
# qhasm: caller5 = caller5_stack
# asm 1: movq <caller5_stack=stack64#5,>caller5=int64#13
# asm 2: movq <caller5_stack=32(%rsp),>caller5=%r15
movq 32(%rsp),%r15
# qhasm: caller6 = caller6_stack
# asm 1: movq <caller6_stack=stack64#6,>caller6=int64#14
# asm 2: movq <caller6_stack=40(%rsp),>caller6=%rbx
movq 40(%rsp),%rbx
# qhasm: caller7 = caller7_stack
# asm 1: movq <caller7_stack=stack64#7,>caller7=int64#15
# asm 2: movq <caller7_stack=48(%rsp),>caller7=%rbp
movq 48(%rsp),%rbp
# qhasm: leave
add %r11,%rsp
mov %rdi,%rax
mov %rsi,%rdx
ret