- # qhasm: int64 rp
- # qhasm: int64 pp
- # qhasm: input rp
- # qhasm: input pp
- # qhasm: int64 a0
- # qhasm: int64 a1
- # qhasm: int64 a2
- # qhasm: int64 a3
- # qhasm: int64 a4
- # qhasm: stack64 a0_stack
- # qhasm: stack64 a1_stack
- # qhasm: stack64 a2_stack
- # qhasm: stack64 a3_stack
- # qhasm: stack64 a4_stack
- # qhasm: int64 b0
- # qhasm: int64 b1
- # qhasm: int64 b2
- # qhasm: int64 b3
- # qhasm: int64 b4
- # qhasm: stack64 b0_stack
- # qhasm: stack64 b1_stack
- # qhasm: stack64 b2_stack
- # qhasm: stack64 b3_stack
- # qhasm: stack64 b4_stack
- # qhasm: int64 c0
- # qhasm: int64 c1
- # qhasm: int64 c2
- # qhasm: int64 c3
- # qhasm: int64 c4
- # qhasm: stack64 c0_stack
- # qhasm: stack64 c1_stack
- # qhasm: stack64 c2_stack
- # qhasm: stack64 c3_stack
- # qhasm: stack64 c4_stack
- # qhasm: int64 d0
- # qhasm: int64 d1
- # qhasm: int64 d2
- # qhasm: int64 d3
- # qhasm: int64 d4
- # qhasm: stack64 d0_stack
- # qhasm: stack64 d1_stack
- # qhasm: stack64 d2_stack
- # qhasm: stack64 d3_stack
- # qhasm: stack64 d4_stack
- # qhasm: int64 e0
- # qhasm: int64 e1
- # qhasm: int64 e2
- # qhasm: int64 e3
- # qhasm: int64 e4
- # qhasm: stack64 e0_stack
- # qhasm: stack64 e1_stack
- # qhasm: stack64 e2_stack
- # qhasm: stack64 e3_stack
- # qhasm: stack64 e4_stack
- # qhasm: int64 rx0
- # qhasm: int64 rx1
- # qhasm: int64 rx2
- # qhasm: int64 rx3
- # qhasm: int64 rx4
- # qhasm: stack64 rx0_stack
- # qhasm: stack64 rx1_stack
- # qhasm: stack64 rx2_stack
- # qhasm: stack64 rx3_stack
- # qhasm: stack64 rx4_stack
- # qhasm: int64 ry0
- # qhasm: int64 ry1
- # qhasm: int64 ry2
- # qhasm: int64 ry3
- # qhasm: int64 ry4
- # qhasm: int64 rz0
- # qhasm: int64 rz1
- # qhasm: int64 rz2
- # qhasm: int64 rz3
- # qhasm: int64 rz4
- # qhasm: int64 rt0
- # qhasm: int64 rt1
- # qhasm: int64 rt2
- # qhasm: int64 rt3
- # qhasm: int64 rt4
- # qhasm: int64 mulr01
- # qhasm: int64 mulr11
- # qhasm: int64 mulr21
- # qhasm: int64 mulr31
- # qhasm: int64 mulr41
- # qhasm: int64 mulrax
- # qhasm: int64 mulrdx
- # qhasm: int64 mult
- # qhasm: int64 mulredmask
- # qhasm: stack64 mulx219_stack
- # qhasm: stack64 mulx319_stack
- # qhasm: stack64 mulx419_stack
- # qhasm: int64 squarer01
- # qhasm: int64 squarer11
- # qhasm: int64 squarer21
- # qhasm: int64 squarer31
- # qhasm: int64 squarer41
- # qhasm: int64 squarerax
- # qhasm: int64 squarerdx
- # qhasm: int64 squaret
- # qhasm: int64 squareredmask
- # qhasm: int64 caller1
- # qhasm: int64 caller2
- # qhasm: int64 caller3
- # qhasm: int64 caller4
- # qhasm: int64 caller5
- # qhasm: int64 caller6
- # qhasm: int64 caller7
- # qhasm: caller caller1
- # qhasm: caller caller2
- # qhasm: caller caller3
- # qhasm: caller caller4
- # qhasm: caller caller5
- # qhasm: caller caller6
- # qhasm: caller caller7
- # qhasm: stack64 caller1_stack
- # qhasm: stack64 caller2_stack
- # qhasm: stack64 caller3_stack
- # qhasm: stack64 caller4_stack
- # qhasm: stack64 caller5_stack
- # qhasm: stack64 caller6_stack
- # qhasm: stack64 caller7_stack
- # qhasm: enter CRYPTO_NAMESPACE(batch_ge25519_dbl_p1p1)
- .text
- .p2align 5
- .globl _CRYPTO_NAMESPACE(batch_ge25519_dbl_p1p1)
- .globl CRYPTO_NAMESPACE(batch_ge25519_dbl_p1p1)
- _CRYPTO_NAMESPACE(batch_ge25519_dbl_p1p1):
- CRYPTO_NAMESPACE(batch_ge25519_dbl_p1p1):
- mov %rsp,%r11
- and $31,%r11
- add $224,%r11
- sub %r11,%rsp
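- # Prologue sketch: %r11 is set to (original %rsp mod 32) + 224, so the
- # subtraction reserves 224 bytes of scratch space while leaving %rsp
- # 32-byte aligned; the adjustment value is then saved in the first stack
- # slot below, presumably so it can be added back to %rsp on return.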
- # qhasm: caller1_stack = caller1
- # asm 1: movq <caller1=int64#9,>caller1_stack=stack64#1
- # asm 2: movq <caller1=%r11,>caller1_stack=0(%rsp)
- movq %r11,0(%rsp)
- # qhasm: caller2_stack = caller2
- # asm 1: movq <caller2=int64#10,>caller2_stack=stack64#2
- # asm 2: movq <caller2=%r12,>caller2_stack=8(%rsp)
- movq %r12,8(%rsp)
- # qhasm: caller3_stack = caller3
- # asm 1: movq <caller3=int64#11,>caller3_stack=stack64#3
- # asm 2: movq <caller3=%r13,>caller3_stack=16(%rsp)
- movq %r13,16(%rsp)
- # qhasm: caller4_stack = caller4
- # asm 1: movq <caller4=int64#12,>caller4_stack=stack64#4
- # asm 2: movq <caller4=%r14,>caller4_stack=24(%rsp)
- movq %r14,24(%rsp)
- # qhasm: caller5_stack = caller5
- # asm 1: movq <caller5=int64#13,>caller5_stack=stack64#5
- # asm 2: movq <caller5=%r15,>caller5_stack=32(%rsp)
- movq %r15,32(%rsp)
- # qhasm: caller6_stack = caller6
- # asm 1: movq <caller6=int64#14,>caller6_stack=stack64#6
- # asm 2: movq <caller6=%rbx,>caller6_stack=40(%rsp)
- movq %rbx,40(%rsp)
- # qhasm: caller7_stack = caller7
- # asm 1: movq <caller7=int64#15,>caller7_stack=stack64#7
- # asm 2: movq <caller7=%rbp,>caller7_stack=48(%rsp)
- movq %rbp,48(%rsp)
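- # With the callee-saved registers spilled, the routine squares three of the
- # input's field elements in turn: the 5x51-bit limb vectors at pp+0, pp+40
- # and pp+80 (presumably X, Y and Z of the point being doubled). Each squaring
- # follows the same schoolbook pattern: cross products are doubled via shl $1
- # or folded in with factors 19/38 (using 2^255 = 19 mod 2^255-19),
- # accumulated into five 128-bit columns, and then reduced back to 51-bit
- # limbs before being saved to the stack.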
- # qhasm: squarerax = *(uint64 *)(pp + 0)
- # asm 1: movq 0(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 0(<pp=%rsi),>squarerax=%rax
- movq 0(%rsi),%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 0)
- # asm 1: mulq 0(<pp=int64#2)
- # asm 2: mulq 0(<pp=%rsi)
- mulq 0(%rsi)
- # qhasm: a0 = squarerax
- # asm 1: mov <squarerax=int64#7,>a0=int64#4
- # asm 2: mov <squarerax=%rax,>a0=%rcx
- mov %rax,%rcx
- # qhasm: squarer01 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer01=int64#5
- # asm 2: mov <squarerdx=%rdx,>squarer01=%r8
- mov %rdx,%r8
- # qhasm: squarerax = *(uint64 *)(pp + 0)
- # asm 1: movq 0(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 0(<pp=%rsi),>squarerax=%rax
- movq 0(%rsi),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 8)
- # asm 1: mulq 8(<pp=int64#2)
- # asm 2: mulq 8(<pp=%rsi)
- mulq 8(%rsi)
- # qhasm: a1 = squarerax
- # asm 1: mov <squarerax=int64#7,>a1=int64#6
- # asm 2: mov <squarerax=%rax,>a1=%r9
- mov %rax,%r9
- # qhasm: squarer11 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer11=int64#8
- # asm 2: mov <squarerdx=%rdx,>squarer11=%r10
- mov %rdx,%r10
- # qhasm: squarerax = *(uint64 *)(pp + 0)
- # asm 1: movq 0(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 0(<pp=%rsi),>squarerax=%rax
- movq 0(%rsi),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 16)
- # asm 1: mulq 16(<pp=int64#2)
- # asm 2: mulq 16(<pp=%rsi)
- mulq 16(%rsi)
- # qhasm: a2 = squarerax
- # asm 1: mov <squarerax=int64#7,>a2=int64#9
- # asm 2: mov <squarerax=%rax,>a2=%r11
- mov %rax,%r11
- # qhasm: squarer21 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer21=int64#10
- # asm 2: mov <squarerdx=%rdx,>squarer21=%r12
- mov %rdx,%r12
- # qhasm: squarerax = *(uint64 *)(pp + 0)
- # asm 1: movq 0(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 0(<pp=%rsi),>squarerax=%rax
- movq 0(%rsi),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 24)
- # asm 1: mulq 24(<pp=int64#2)
- # asm 2: mulq 24(<pp=%rsi)
- mulq 24(%rsi)
- # qhasm: a3 = squarerax
- # asm 1: mov <squarerax=int64#7,>a3=int64#11
- # asm 2: mov <squarerax=%rax,>a3=%r13
- mov %rax,%r13
- # qhasm: squarer31 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer31=int64#12
- # asm 2: mov <squarerdx=%rdx,>squarer31=%r14
- mov %rdx,%r14
- # qhasm: squarerax = *(uint64 *)(pp + 0)
- # asm 1: movq 0(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 0(<pp=%rsi),>squarerax=%rax
- movq 0(%rsi),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 32)
- # asm 1: mulq 32(<pp=int64#2)
- # asm 2: mulq 32(<pp=%rsi)
- mulq 32(%rsi)
- # qhasm: a4 = squarerax
- # asm 1: mov <squarerax=int64#7,>a4=int64#13
- # asm 2: mov <squarerax=%rax,>a4=%r15
- mov %rax,%r15
- # qhasm: squarer41 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer41=int64#14
- # asm 2: mov <squarerdx=%rdx,>squarer41=%rbx
- mov %rdx,%rbx
- # qhasm: squarerax = *(uint64 *)(pp + 8)
- # asm 1: movq 8(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 8(<pp=%rsi),>squarerax=%rax
- movq 8(%rsi),%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 8)
- # asm 1: mulq 8(<pp=int64#2)
- # asm 2: mulq 8(<pp=%rsi)
- mulq 8(%rsi)
- # qhasm: carry? a2 += squarerax
- # asm 1: add <squarerax=int64#7,<a2=int64#9
- # asm 2: add <squarerax=%rax,<a2=%r11
- add %rax,%r11
- # qhasm: squarer21 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer21=int64#10
- # asm 2: adc <squarerdx=%rdx,<squarer21=%r12
- adc %rdx,%r12
- # qhasm: squarerax = *(uint64 *)(pp + 8)
- # asm 1: movq 8(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 8(<pp=%rsi),>squarerax=%rax
- movq 8(%rsi),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 16)
- # asm 1: mulq 16(<pp=int64#2)
- # asm 2: mulq 16(<pp=%rsi)
- mulq 16(%rsi)
- # qhasm: carry? a3 += squarerax
- # asm 1: add <squarerax=int64#7,<a3=int64#11
- # asm 2: add <squarerax=%rax,<a3=%r13
- add %rax,%r13
- # qhasm: squarer31 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer31=int64#12
- # asm 2: adc <squarerdx=%rdx,<squarer31=%r14
- adc %rdx,%r14
- # qhasm: squarerax = *(uint64 *)(pp + 8)
- # asm 1: movq 8(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 8(<pp=%rsi),>squarerax=%rax
- movq 8(%rsi),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 24)
- # asm 1: mulq 24(<pp=int64#2)
- # asm 2: mulq 24(<pp=%rsi)
- mulq 24(%rsi)
- # qhasm: carry? a4 += squarerax
- # asm 1: add <squarerax=int64#7,<a4=int64#13
- # asm 2: add <squarerax=%rax,<a4=%r15
- add %rax,%r15
- # qhasm: squarer41 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer41=int64#14
- # asm 2: adc <squarerdx=%rdx,<squarer41=%rbx
- adc %rdx,%rbx
- # qhasm: squarerax = *(uint64 *)(pp + 8)
- # asm 1: movq 8(<pp=int64#2),>squarerax=int64#3
- # asm 2: movq 8(<pp=%rsi),>squarerax=%rdx
- movq 8(%rsi),%rdx
- # qhasm: squarerax *= 38
- # asm 1: imulq $38,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $38,<squarerax=%rdx,>squarerax=%rax
- imulq $38,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 32)
- # asm 1: mulq 32(<pp=int64#2)
- # asm 2: mulq 32(<pp=%rsi)
- mulq 32(%rsi)
- # qhasm: carry? a0 += squarerax
- # asm 1: add <squarerax=int64#7,<a0=int64#4
- # asm 2: add <squarerax=%rax,<a0=%rcx
- add %rax,%rcx
- # qhasm: squarer01 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer01=int64#5
- # asm 2: adc <squarerdx=%rdx,<squarer01=%r8
- adc %rdx,%r8
- # qhasm: squarerax = *(uint64 *)(pp + 16)
- # asm 1: movq 16(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 16(<pp=%rsi),>squarerax=%rax
- movq 16(%rsi),%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 16)
- # asm 1: mulq 16(<pp=int64#2)
- # asm 2: mulq 16(<pp=%rsi)
- mulq 16(%rsi)
- # qhasm: carry? a4 += squarerax
- # asm 1: add <squarerax=int64#7,<a4=int64#13
- # asm 2: add <squarerax=%rax,<a4=%r15
- add %rax,%r15
- # qhasm: squarer41 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer41=int64#14
- # asm 2: adc <squarerdx=%rdx,<squarer41=%rbx
- adc %rdx,%rbx
- # qhasm: squarerax = *(uint64 *)(pp + 16)
- # asm 1: movq 16(<pp=int64#2),>squarerax=int64#3
- # asm 2: movq 16(<pp=%rsi),>squarerax=%rdx
- movq 16(%rsi),%rdx
- # qhasm: squarerax *= 38
- # asm 1: imulq $38,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $38,<squarerax=%rdx,>squarerax=%rax
- imulq $38,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 24)
- # asm 1: mulq 24(<pp=int64#2)
- # asm 2: mulq 24(<pp=%rsi)
- mulq 24(%rsi)
- # qhasm: carry? a0 += squarerax
- # asm 1: add <squarerax=int64#7,<a0=int64#4
- # asm 2: add <squarerax=%rax,<a0=%rcx
- add %rax,%rcx
- # qhasm: squarer01 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer01=int64#5
- # asm 2: adc <squarerdx=%rdx,<squarer01=%r8
- adc %rdx,%r8
- # qhasm: squarerax = *(uint64 *)(pp + 16)
- # asm 1: movq 16(<pp=int64#2),>squarerax=int64#3
- # asm 2: movq 16(<pp=%rsi),>squarerax=%rdx
- movq 16(%rsi),%rdx
- # qhasm: squarerax *= 38
- # asm 1: imulq $38,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $38,<squarerax=%rdx,>squarerax=%rax
- imulq $38,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 32)
- # asm 1: mulq 32(<pp=int64#2)
- # asm 2: mulq 32(<pp=%rsi)
- mulq 32(%rsi)
- # qhasm: carry? a1 += squarerax
- # asm 1: add <squarerax=int64#7,<a1=int64#6
- # asm 2: add <squarerax=%rax,<a1=%r9
- add %rax,%r9
- # qhasm: squarer11 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer11=int64#8
- # asm 2: adc <squarerdx=%rdx,<squarer11=%r10
- adc %rdx,%r10
- # qhasm: squarerax = *(uint64 *)(pp + 24)
- # asm 1: movq 24(<pp=int64#2),>squarerax=int64#3
- # asm 2: movq 24(<pp=%rsi),>squarerax=%rdx
- movq 24(%rsi),%rdx
- # qhasm: squarerax *= 19
- # asm 1: imulq $19,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $19,<squarerax=%rdx,>squarerax=%rax
- imulq $19,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 24)
- # asm 1: mulq 24(<pp=int64#2)
- # asm 2: mulq 24(<pp=%rsi)
- mulq 24(%rsi)
- # qhasm: carry? a1 += squarerax
- # asm 1: add <squarerax=int64#7,<a1=int64#6
- # asm 2: add <squarerax=%rax,<a1=%r9
- add %rax,%r9
- # qhasm: squarer11 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer11=int64#8
- # asm 2: adc <squarerdx=%rdx,<squarer11=%r10
- adc %rdx,%r10
- # qhasm: squarerax = *(uint64 *)(pp + 24)
- # asm 1: movq 24(<pp=int64#2),>squarerax=int64#3
- # asm 2: movq 24(<pp=%rsi),>squarerax=%rdx
- movq 24(%rsi),%rdx
- # qhasm: squarerax *= 38
- # asm 1: imulq $38,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $38,<squarerax=%rdx,>squarerax=%rax
- imulq $38,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 32)
- # asm 1: mulq 32(<pp=int64#2)
- # asm 2: mulq 32(<pp=%rsi)
- mulq 32(%rsi)
- # qhasm: carry? a2 += squarerax
- # asm 1: add <squarerax=int64#7,<a2=int64#9
- # asm 2: add <squarerax=%rax,<a2=%r11
- add %rax,%r11
- # qhasm: squarer21 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer21=int64#10
- # asm 2: adc <squarerdx=%rdx,<squarer21=%r12
- adc %rdx,%r12
- # qhasm: squarerax = *(uint64 *)(pp + 32)
- # asm 1: movq 32(<pp=int64#2),>squarerax=int64#3
- # asm 2: movq 32(<pp=%rsi),>squarerax=%rdx
- movq 32(%rsi),%rdx
- # qhasm: squarerax *= 19
- # asm 1: imulq $19,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $19,<squarerax=%rdx,>squarerax=%rax
- imulq $19,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 32)
- # asm 1: mulq 32(<pp=int64#2)
- # asm 2: mulq 32(<pp=%rsi)
- mulq 32(%rsi)
- # qhasm: carry? a3 += squarerax
- # asm 1: add <squarerax=int64#7,<a3=int64#11
- # asm 2: add <squarerax=%rax,<a3=%r13
- add %rax,%r13
- # qhasm: squarer31 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer31=int64#12
- # asm 2: adc <squarerdx=%rdx,<squarer31=%r14
- adc %rdx,%r14
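- # The five 128-bit columns (low halves a0..a4, high halves squarer01..41)
- # are now reduced to 51-bit limbs; an informal sketch, with REDMASK51
- # assumed to be 2^51 - 1:
- #   carry_i = (high_i << 13) | (a_i >> 51);   a_i &= REDMASK51
- #   a_1 += carry_0, ..., a_4 += carry_3,      a_0 += 19 * carry_4
- # followed by one more plain carry pass, again folding the top carry back
- # into a_0 with a factor of 19.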
- # qhasm: squareredmask = *(uint64 *) &CRYPTO_NAMESPACE(batch_REDMASK51)
- # asm 1: movq CRYPTO_NAMESPACE(batch_REDMASK51),>squareredmask=int64#3
- # asm 2: movq CRYPTO_NAMESPACE(batch_REDMASK51),>squareredmask=%rdx
- movq CRYPTO_NAMESPACE(batch_REDMASK51)(%rip),%rdx
- # qhasm: squarer01 = (squarer01.a0) << 13
- # asm 1: shld $13,<a0=int64#4,<squarer01=int64#5
- # asm 2: shld $13,<a0=%rcx,<squarer01=%r8
- shld $13,%rcx,%r8
- # qhasm: a0 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<a0=int64#4
- # asm 2: and <squareredmask=%rdx,<a0=%rcx
- and %rdx,%rcx
- # qhasm: squarer11 = (squarer11.a1) << 13
- # asm 1: shld $13,<a1=int64#6,<squarer11=int64#8
- # asm 2: shld $13,<a1=%r9,<squarer11=%r10
- shld $13,%r9,%r10
- # qhasm: a1 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<a1=int64#6
- # asm 2: and <squareredmask=%rdx,<a1=%r9
- and %rdx,%r9
- # qhasm: a1 += squarer01
- # asm 1: add <squarer01=int64#5,<a1=int64#6
- # asm 2: add <squarer01=%r8,<a1=%r9
- add %r8,%r9
- # qhasm: squarer21 = (squarer21.a2) << 13
- # asm 1: shld $13,<a2=int64#9,<squarer21=int64#10
- # asm 2: shld $13,<a2=%r11,<squarer21=%r12
- shld $13,%r11,%r12
- # qhasm: a2 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<a2=int64#9
- # asm 2: and <squareredmask=%rdx,<a2=%r11
- and %rdx,%r11
- # qhasm: a2 += squarer11
- # asm 1: add <squarer11=int64#8,<a2=int64#9
- # asm 2: add <squarer11=%r10,<a2=%r11
- add %r10,%r11
- # qhasm: squarer31 = (squarer31.a3) << 13
- # asm 1: shld $13,<a3=int64#11,<squarer31=int64#12
- # asm 2: shld $13,<a3=%r13,<squarer31=%r14
- shld $13,%r13,%r14
- # qhasm: a3 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<a3=int64#11
- # asm 2: and <squareredmask=%rdx,<a3=%r13
- and %rdx,%r13
- # qhasm: a3 += squarer21
- # asm 1: add <squarer21=int64#10,<a3=int64#11
- # asm 2: add <squarer21=%r12,<a3=%r13
- add %r12,%r13
- # qhasm: squarer41 = (squarer41.a4) << 13
- # asm 1: shld $13,<a4=int64#13,<squarer41=int64#14
- # asm 2: shld $13,<a4=%r15,<squarer41=%rbx
- shld $13,%r15,%rbx
- # qhasm: a4 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<a4=int64#13
- # asm 2: and <squareredmask=%rdx,<a4=%r15
- and %rdx,%r15
- # qhasm: a4 += squarer31
- # asm 1: add <squarer31=int64#12,<a4=int64#13
- # asm 2: add <squarer31=%r14,<a4=%r15
- add %r14,%r15
- # qhasm: squarer41 = squarer41 * 19
- # asm 1: imulq $19,<squarer41=int64#14,>squarer41=int64#5
- # asm 2: imulq $19,<squarer41=%rbx,>squarer41=%r8
- imulq $19,%rbx,%r8
- # qhasm: a0 += squarer41
- # asm 1: add <squarer41=int64#5,<a0=int64#4
- # asm 2: add <squarer41=%r8,<a0=%rcx
- add %r8,%rcx
- # qhasm: squaret = a0
- # asm 1: mov <a0=int64#4,>squaret=int64#5
- # asm 2: mov <a0=%rcx,>squaret=%r8
- mov %rcx,%r8
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#5
- # asm 2: shr $51,<squaret=%r8
- shr $51,%r8
- # qhasm: squaret += a1
- # asm 1: add <a1=int64#6,<squaret=int64#5
- # asm 2: add <a1=%r9,<squaret=%r8
- add %r9,%r8
- # qhasm: a0 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<a0=int64#4
- # asm 2: and <squareredmask=%rdx,<a0=%rcx
- and %rdx,%rcx
- # qhasm: a1 = squaret
- # asm 1: mov <squaret=int64#5,>a1=int64#6
- # asm 2: mov <squaret=%r8,>a1=%r9
- mov %r8,%r9
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#5
- # asm 2: shr $51,<squaret=%r8
- shr $51,%r8
- # qhasm: squaret += a2
- # asm 1: add <a2=int64#9,<squaret=int64#5
- # asm 2: add <a2=%r11,<squaret=%r8
- add %r11,%r8
- # qhasm: a1 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<a1=int64#6
- # asm 2: and <squareredmask=%rdx,<a1=%r9
- and %rdx,%r9
- # qhasm: a2 = squaret
- # asm 1: mov <squaret=int64#5,>a2=int64#7
- # asm 2: mov <squaret=%r8,>a2=%rax
- mov %r8,%rax
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#5
- # asm 2: shr $51,<squaret=%r8
- shr $51,%r8
- # qhasm: squaret += a3
- # asm 1: add <a3=int64#11,<squaret=int64#5
- # asm 2: add <a3=%r13,<squaret=%r8
- add %r13,%r8
- # qhasm: a2 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<a2=int64#7
- # asm 2: and <squareredmask=%rdx,<a2=%rax
- and %rdx,%rax
- # qhasm: a3 = squaret
- # asm 1: mov <squaret=int64#5,>a3=int64#8
- # asm 2: mov <squaret=%r8,>a3=%r10
- mov %r8,%r10
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#5
- # asm 2: shr $51,<squaret=%r8
- shr $51,%r8
- # qhasm: squaret += a4
- # asm 1: add <a4=int64#13,<squaret=int64#5
- # asm 2: add <a4=%r15,<squaret=%r8
- add %r15,%r8
- # qhasm: a3 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<a3=int64#8
- # asm 2: and <squareredmask=%rdx,<a3=%r10
- and %rdx,%r10
- # qhasm: a4 = squaret
- # asm 1: mov <squaret=int64#5,>a4=int64#9
- # asm 2: mov <squaret=%r8,>a4=%r11
- mov %r8,%r11
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#5
- # asm 2: shr $51,<squaret=%r8
- shr $51,%r8
- # qhasm: squaret *= 19
- # asm 1: imulq $19,<squaret=int64#5,>squaret=int64#5
- # asm 2: imulq $19,<squaret=%r8,>squaret=%r8
- imulq $19,%r8,%r8
- # qhasm: a0 += squaret
- # asm 1: add <squaret=int64#5,<a0=int64#4
- # asm 2: add <squaret=%r8,<a0=%rcx
- add %r8,%rcx
- # qhasm: a4 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<a4=int64#9
- # asm 2: and <squareredmask=%rdx,<a4=%r11
- and %rdx,%r11
- # qhasm: a0_stack = a0
- # asm 1: movq <a0=int64#4,>a0_stack=stack64#8
- # asm 2: movq <a0=%rcx,>a0_stack=56(%rsp)
- movq %rcx,56(%rsp)
- # qhasm: a1_stack = a1
- # asm 1: movq <a1=int64#6,>a1_stack=stack64#9
- # asm 2: movq <a1=%r9,>a1_stack=64(%rsp)
- movq %r9,64(%rsp)
- # qhasm: a2_stack = a2
- # asm 1: movq <a2=int64#7,>a2_stack=stack64#10
- # asm 2: movq <a2=%rax,>a2_stack=72(%rsp)
- movq %rax,72(%rsp)
- # qhasm: a3_stack = a3
- # asm 1: movq <a3=int64#8,>a3_stack=stack64#11
- # asm 2: movq <a3=%r10,>a3_stack=80(%rsp)
- movq %r10,80(%rsp)
- # qhasm: a4_stack = a4
- # asm 1: movq <a4=int64#9,>a4_stack=stack64#12
- # asm 2: movq <a4=%r11,>a4_stack=88(%rsp)
- movq %r11,88(%rsp)
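- # Second squaring: the same multiply-and-reduce pattern is applied to the
- # limbs at pp+40..pp+72 (presumably Y), with the reduced result kept in
- # 96..128(%rsp).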
- # qhasm: squarerax = *(uint64 *)(pp + 40)
- # asm 1: movq 40(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 40(<pp=%rsi),>squarerax=%rax
- movq 40(%rsi),%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 40)
- # asm 1: mulq 40(<pp=int64#2)
- # asm 2: mulq 40(<pp=%rsi)
- mulq 40(%rsi)
- # qhasm: b0 = squarerax
- # asm 1: mov <squarerax=int64#7,>b0=int64#4
- # asm 2: mov <squarerax=%rax,>b0=%rcx
- mov %rax,%rcx
- # qhasm: squarer01 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer01=int64#5
- # asm 2: mov <squarerdx=%rdx,>squarer01=%r8
- mov %rdx,%r8
- # qhasm: squarerax = *(uint64 *)(pp + 40)
- # asm 1: movq 40(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 40(<pp=%rsi),>squarerax=%rax
- movq 40(%rsi),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 48)
- # asm 1: mulq 48(<pp=int64#2)
- # asm 2: mulq 48(<pp=%rsi)
- mulq 48(%rsi)
- # qhasm: b1 = squarerax
- # asm 1: mov <squarerax=int64#7,>b1=int64#6
- # asm 2: mov <squarerax=%rax,>b1=%r9
- mov %rax,%r9
- # qhasm: squarer11 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer11=int64#8
- # asm 2: mov <squarerdx=%rdx,>squarer11=%r10
- mov %rdx,%r10
- # qhasm: squarerax = *(uint64 *)(pp + 40)
- # asm 1: movq 40(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 40(<pp=%rsi),>squarerax=%rax
- movq 40(%rsi),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 56)
- # asm 1: mulq 56(<pp=int64#2)
- # asm 2: mulq 56(<pp=%rsi)
- mulq 56(%rsi)
- # qhasm: b2 = squarerax
- # asm 1: mov <squarerax=int64#7,>b2=int64#9
- # asm 2: mov <squarerax=%rax,>b2=%r11
- mov %rax,%r11
- # qhasm: squarer21 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer21=int64#10
- # asm 2: mov <squarerdx=%rdx,>squarer21=%r12
- mov %rdx,%r12
- # qhasm: squarerax = *(uint64 *)(pp + 40)
- # asm 1: movq 40(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 40(<pp=%rsi),>squarerax=%rax
- movq 40(%rsi),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 64)
- # asm 1: mulq 64(<pp=int64#2)
- # asm 2: mulq 64(<pp=%rsi)
- mulq 64(%rsi)
- # qhasm: b3 = squarerax
- # asm 1: mov <squarerax=int64#7,>b3=int64#11
- # asm 2: mov <squarerax=%rax,>b3=%r13
- mov %rax,%r13
- # qhasm: squarer31 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer31=int64#12
- # asm 2: mov <squarerdx=%rdx,>squarer31=%r14
- mov %rdx,%r14
- # qhasm: squarerax = *(uint64 *)(pp + 40)
- # asm 1: movq 40(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 40(<pp=%rsi),>squarerax=%rax
- movq 40(%rsi),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 72)
- # asm 1: mulq 72(<pp=int64#2)
- # asm 2: mulq 72(<pp=%rsi)
- mulq 72(%rsi)
- # qhasm: b4 = squarerax
- # asm 1: mov <squarerax=int64#7,>b4=int64#13
- # asm 2: mov <squarerax=%rax,>b4=%r15
- mov %rax,%r15
- # qhasm: squarer41 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer41=int64#14
- # asm 2: mov <squarerdx=%rdx,>squarer41=%rbx
- mov %rdx,%rbx
- # qhasm: squarerax = *(uint64 *)(pp + 48)
- # asm 1: movq 48(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 48(<pp=%rsi),>squarerax=%rax
- movq 48(%rsi),%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 48)
- # asm 1: mulq 48(<pp=int64#2)
- # asm 2: mulq 48(<pp=%rsi)
- mulq 48(%rsi)
- # qhasm: carry? b2 += squarerax
- # asm 1: add <squarerax=int64#7,<b2=int64#9
- # asm 2: add <squarerax=%rax,<b2=%r11
- add %rax,%r11
- # qhasm: squarer21 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer21=int64#10
- # asm 2: adc <squarerdx=%rdx,<squarer21=%r12
- adc %rdx,%r12
- # qhasm: squarerax = *(uint64 *)(pp + 48)
- # asm 1: movq 48(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 48(<pp=%rsi),>squarerax=%rax
- movq 48(%rsi),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 56)
- # asm 1: mulq 56(<pp=int64#2)
- # asm 2: mulq 56(<pp=%rsi)
- mulq 56(%rsi)
- # qhasm: carry? b3 += squarerax
- # asm 1: add <squarerax=int64#7,<b3=int64#11
- # asm 2: add <squarerax=%rax,<b3=%r13
- add %rax,%r13
- # qhasm: squarer31 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer31=int64#12
- # asm 2: adc <squarerdx=%rdx,<squarer31=%r14
- adc %rdx,%r14
- # qhasm: squarerax = *(uint64 *)(pp + 48)
- # asm 1: movq 48(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 48(<pp=%rsi),>squarerax=%rax
- movq 48(%rsi),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 64)
- # asm 1: mulq 64(<pp=int64#2)
- # asm 2: mulq 64(<pp=%rsi)
- mulq 64(%rsi)
- # qhasm: carry? b4 += squarerax
- # asm 1: add <squarerax=int64#7,<b4=int64#13
- # asm 2: add <squarerax=%rax,<b4=%r15
- add %rax,%r15
- # qhasm: squarer41 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer41=int64#14
- # asm 2: adc <squarerdx=%rdx,<squarer41=%rbx
- adc %rdx,%rbx
- # qhasm: squarerax = *(uint64 *)(pp + 48)
- # asm 1: movq 48(<pp=int64#2),>squarerax=int64#3
- # asm 2: movq 48(<pp=%rsi),>squarerax=%rdx
- movq 48(%rsi),%rdx
- # qhasm: squarerax *= 38
- # asm 1: imulq $38,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $38,<squarerax=%rdx,>squarerax=%rax
- imulq $38,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 72)
- # asm 1: mulq 72(<pp=int64#2)
- # asm 2: mulq 72(<pp=%rsi)
- mulq 72(%rsi)
- # qhasm: carry? b0 += squarerax
- # asm 1: add <squarerax=int64#7,<b0=int64#4
- # asm 2: add <squarerax=%rax,<b0=%rcx
- add %rax,%rcx
- # qhasm: squarer01 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer01=int64#5
- # asm 2: adc <squarerdx=%rdx,<squarer01=%r8
- adc %rdx,%r8
- # qhasm: squarerax = *(uint64 *)(pp + 56)
- # asm 1: movq 56(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 56(<pp=%rsi),>squarerax=%rax
- movq 56(%rsi),%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 56)
- # asm 1: mulq 56(<pp=int64#2)
- # asm 2: mulq 56(<pp=%rsi)
- mulq 56(%rsi)
- # qhasm: carry? b4 += squarerax
- # asm 1: add <squarerax=int64#7,<b4=int64#13
- # asm 2: add <squarerax=%rax,<b4=%r15
- add %rax,%r15
- # qhasm: squarer41 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer41=int64#14
- # asm 2: adc <squarerdx=%rdx,<squarer41=%rbx
- adc %rdx,%rbx
- # qhasm: squarerax = *(uint64 *)(pp + 56)
- # asm 1: movq 56(<pp=int64#2),>squarerax=int64#3
- # asm 2: movq 56(<pp=%rsi),>squarerax=%rdx
- movq 56(%rsi),%rdx
- # qhasm: squarerax *= 38
- # asm 1: imulq $38,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $38,<squarerax=%rdx,>squarerax=%rax
- imulq $38,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 64)
- # asm 1: mulq 64(<pp=int64#2)
- # asm 2: mulq 64(<pp=%rsi)
- mulq 64(%rsi)
- # qhasm: carry? b0 += squarerax
- # asm 1: add <squarerax=int64#7,<b0=int64#4
- # asm 2: add <squarerax=%rax,<b0=%rcx
- add %rax,%rcx
- # qhasm: squarer01 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer01=int64#5
- # asm 2: adc <squarerdx=%rdx,<squarer01=%r8
- adc %rdx,%r8
- # qhasm: squarerax = *(uint64 *)(pp + 56)
- # asm 1: movq 56(<pp=int64#2),>squarerax=int64#3
- # asm 2: movq 56(<pp=%rsi),>squarerax=%rdx
- movq 56(%rsi),%rdx
- # qhasm: squarerax *= 38
- # asm 1: imulq $38,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $38,<squarerax=%rdx,>squarerax=%rax
- imulq $38,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 72)
- # asm 1: mulq 72(<pp=int64#2)
- # asm 2: mulq 72(<pp=%rsi)
- mulq 72(%rsi)
- # qhasm: carry? b1 += squarerax
- # asm 1: add <squarerax=int64#7,<b1=int64#6
- # asm 2: add <squarerax=%rax,<b1=%r9
- add %rax,%r9
- # qhasm: squarer11 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer11=int64#8
- # asm 2: adc <squarerdx=%rdx,<squarer11=%r10
- adc %rdx,%r10
- # qhasm: squarerax = *(uint64 *)(pp + 64)
- # asm 1: movq 64(<pp=int64#2),>squarerax=int64#3
- # asm 2: movq 64(<pp=%rsi),>squarerax=%rdx
- movq 64(%rsi),%rdx
- # qhasm: squarerax *= 19
- # asm 1: imulq $19,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $19,<squarerax=%rdx,>squarerax=%rax
- imulq $19,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 64)
- # asm 1: mulq 64(<pp=int64#2)
- # asm 2: mulq 64(<pp=%rsi)
- mulq 64(%rsi)
- # qhasm: carry? b1 += squarerax
- # asm 1: add <squarerax=int64#7,<b1=int64#6
- # asm 2: add <squarerax=%rax,<b1=%r9
- add %rax,%r9
- # qhasm: squarer11 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer11=int64#8
- # asm 2: adc <squarerdx=%rdx,<squarer11=%r10
- adc %rdx,%r10
- # qhasm: squarerax = *(uint64 *)(pp + 64)
- # asm 1: movq 64(<pp=int64#2),>squarerax=int64#3
- # asm 2: movq 64(<pp=%rsi),>squarerax=%rdx
- movq 64(%rsi),%rdx
- # qhasm: squarerax *= 38
- # asm 1: imulq $38,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $38,<squarerax=%rdx,>squarerax=%rax
- imulq $38,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 72)
- # asm 1: mulq 72(<pp=int64#2)
- # asm 2: mulq 72(<pp=%rsi)
- mulq 72(%rsi)
- # qhasm: carry? b2 += squarerax
- # asm 1: add <squarerax=int64#7,<b2=int64#9
- # asm 2: add <squarerax=%rax,<b2=%r11
- add %rax,%r11
- # qhasm: squarer21 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer21=int64#10
- # asm 2: adc <squarerdx=%rdx,<squarer21=%r12
- adc %rdx,%r12
- # qhasm: squarerax = *(uint64 *)(pp + 72)
- # asm 1: movq 72(<pp=int64#2),>squarerax=int64#3
- # asm 2: movq 72(<pp=%rsi),>squarerax=%rdx
- movq 72(%rsi),%rdx
- # qhasm: squarerax *= 19
- # asm 1: imulq $19,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $19,<squarerax=%rdx,>squarerax=%rax
- imulq $19,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 72)
- # asm 1: mulq 72(<pp=int64#2)
- # asm 2: mulq 72(<pp=%rsi)
- mulq 72(%rsi)
- # qhasm: carry? b3 += squarerax
- # asm 1: add <squarerax=int64#7,<b3=int64#11
- # asm 2: add <squarerax=%rax,<b3=%r13
- add %rax,%r13
- # qhasm: squarer31 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer31=int64#12
- # asm 2: adc <squarerdx=%rdx,<squarer31=%r14
- adc %rdx,%r14
- # qhasm: squareredmask = *(uint64 *) &CRYPTO_NAMESPACE(batch_REDMASK51)
- # asm 1: movq CRYPTO_NAMESPACE(batch_REDMASK51),>squareredmask=int64#3
- # asm 2: movq CRYPTO_NAMESPACE(batch_REDMASK51),>squareredmask=%rdx
- movq CRYPTO_NAMESPACE(batch_REDMASK51)(%rip),%rdx
- # qhasm: squarer01 = (squarer01.b0) << 13
- # asm 1: shld $13,<b0=int64#4,<squarer01=int64#5
- # asm 2: shld $13,<b0=%rcx,<squarer01=%r8
- shld $13,%rcx,%r8
- # qhasm: b0 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<b0=int64#4
- # asm 2: and <squareredmask=%rdx,<b0=%rcx
- and %rdx,%rcx
- # qhasm: squarer11 = (squarer11.b1) << 13
- # asm 1: shld $13,<b1=int64#6,<squarer11=int64#8
- # asm 2: shld $13,<b1=%r9,<squarer11=%r10
- shld $13,%r9,%r10
- # qhasm: b1 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<b1=int64#6
- # asm 2: and <squareredmask=%rdx,<b1=%r9
- and %rdx,%r9
- # qhasm: b1 += squarer01
- # asm 1: add <squarer01=int64#5,<b1=int64#6
- # asm 2: add <squarer01=%r8,<b1=%r9
- add %r8,%r9
- # qhasm: squarer21 = (squarer21.b2) << 13
- # asm 1: shld $13,<b2=int64#9,<squarer21=int64#10
- # asm 2: shld $13,<b2=%r11,<squarer21=%r12
- shld $13,%r11,%r12
- # qhasm: b2 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<b2=int64#9
- # asm 2: and <squareredmask=%rdx,<b2=%r11
- and %rdx,%r11
- # qhasm: b2 += squarer11
- # asm 1: add <squarer11=int64#8,<b2=int64#9
- # asm 2: add <squarer11=%r10,<b2=%r11
- add %r10,%r11
- # qhasm: squarer31 = (squarer31.b3) << 13
- # asm 1: shld $13,<b3=int64#11,<squarer31=int64#12
- # asm 2: shld $13,<b3=%r13,<squarer31=%r14
- shld $13,%r13,%r14
- # qhasm: b3 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<b3=int64#11
- # asm 2: and <squareredmask=%rdx,<b3=%r13
- and %rdx,%r13
- # qhasm: b3 += squarer21
- # asm 1: add <squarer21=int64#10,<b3=int64#11
- # asm 2: add <squarer21=%r12,<b3=%r13
- add %r12,%r13
- # qhasm: squarer41 = (squarer41.b4) << 13
- # asm 1: shld $13,<b4=int64#13,<squarer41=int64#14
- # asm 2: shld $13,<b4=%r15,<squarer41=%rbx
- shld $13,%r15,%rbx
- # qhasm: b4 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<b4=int64#13
- # asm 2: and <squareredmask=%rdx,<b4=%r15
- and %rdx,%r15
- # qhasm: b4 += squarer31
- # asm 1: add <squarer31=int64#12,<b4=int64#13
- # asm 2: add <squarer31=%r14,<b4=%r15
- add %r14,%r15
- # qhasm: squarer41 = squarer41 * 19
- # asm 1: imulq $19,<squarer41=int64#14,>squarer41=int64#5
- # asm 2: imulq $19,<squarer41=%rbx,>squarer41=%r8
- imulq $19,%rbx,%r8
- # qhasm: b0 += squarer41
- # asm 1: add <squarer41=int64#5,<b0=int64#4
- # asm 2: add <squarer41=%r8,<b0=%rcx
- add %r8,%rcx
- # qhasm: squaret = b0
- # asm 1: mov <b0=int64#4,>squaret=int64#5
- # asm 2: mov <b0=%rcx,>squaret=%r8
- mov %rcx,%r8
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#5
- # asm 2: shr $51,<squaret=%r8
- shr $51,%r8
- # qhasm: squaret += b1
- # asm 1: add <b1=int64#6,<squaret=int64#5
- # asm 2: add <b1=%r9,<squaret=%r8
- add %r9,%r8
- # qhasm: b0 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<b0=int64#4
- # asm 2: and <squareredmask=%rdx,<b0=%rcx
- and %rdx,%rcx
- # qhasm: b1 = squaret
- # asm 1: mov <squaret=int64#5,>b1=int64#6
- # asm 2: mov <squaret=%r8,>b1=%r9
- mov %r8,%r9
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#5
- # asm 2: shr $51,<squaret=%r8
- shr $51,%r8
- # qhasm: squaret += b2
- # asm 1: add <b2=int64#9,<squaret=int64#5
- # asm 2: add <b2=%r11,<squaret=%r8
- add %r11,%r8
- # qhasm: b1 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<b1=int64#6
- # asm 2: and <squareredmask=%rdx,<b1=%r9
- and %rdx,%r9
- # qhasm: b2 = squaret
- # asm 1: mov <squaret=int64#5,>b2=int64#7
- # asm 2: mov <squaret=%r8,>b2=%rax
- mov %r8,%rax
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#5
- # asm 2: shr $51,<squaret=%r8
- shr $51,%r8
- # qhasm: squaret += b3
- # asm 1: add <b3=int64#11,<squaret=int64#5
- # asm 2: add <b3=%r13,<squaret=%r8
- add %r13,%r8
- # qhasm: b2 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<b2=int64#7
- # asm 2: and <squareredmask=%rdx,<b2=%rax
- and %rdx,%rax
- # qhasm: b3 = squaret
- # asm 1: mov <squaret=int64#5,>b3=int64#8
- # asm 2: mov <squaret=%r8,>b3=%r10
- mov %r8,%r10
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#5
- # asm 2: shr $51,<squaret=%r8
- shr $51,%r8
- # qhasm: squaret += b4
- # asm 1: add <b4=int64#13,<squaret=int64#5
- # asm 2: add <b4=%r15,<squaret=%r8
- add %r15,%r8
- # qhasm: b3 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<b3=int64#8
- # asm 2: and <squareredmask=%rdx,<b3=%r10
- and %rdx,%r10
- # qhasm: b4 = squaret
- # asm 1: mov <squaret=int64#5,>b4=int64#9
- # asm 2: mov <squaret=%r8,>b4=%r11
- mov %r8,%r11
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#5
- # asm 2: shr $51,<squaret=%r8
- shr $51,%r8
- # qhasm: squaret *= 19
- # asm 1: imulq $19,<squaret=int64#5,>squaret=int64#5
- # asm 2: imulq $19,<squaret=%r8,>squaret=%r8
- imulq $19,%r8,%r8
- # qhasm: b0 += squaret
- # asm 1: add <squaret=int64#5,<b0=int64#4
- # asm 2: add <squaret=%r8,<b0=%rcx
- add %r8,%rcx
- # qhasm: b4 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<b4=int64#9
- # asm 2: and <squareredmask=%rdx,<b4=%r11
- and %rdx,%r11
- # qhasm: b0_stack = b0
- # asm 1: movq <b0=int64#4,>b0_stack=stack64#13
- # asm 2: movq <b0=%rcx,>b0_stack=96(%rsp)
- movq %rcx,96(%rsp)
- # qhasm: b1_stack = b1
- # asm 1: movq <b1=int64#6,>b1_stack=stack64#14
- # asm 2: movq <b1=%r9,>b1_stack=104(%rsp)
- movq %r9,104(%rsp)
- # qhasm: b2_stack = b2
- # asm 1: movq <b2=int64#7,>b2_stack=stack64#15
- # asm 2: movq <b2=%rax,>b2_stack=112(%rsp)
- movq %rax,112(%rsp)
- # qhasm: b3_stack = b3
- # asm 1: movq <b3=int64#8,>b3_stack=stack64#16
- # asm 2: movq <b3=%r10,>b3_stack=120(%rsp)
- movq %r10,120(%rsp)
- # qhasm: b4_stack = b4
- # asm 1: movq <b4=int64#9,>b4_stack=stack64#17
- # asm 2: movq <b4=%r11,>b4_stack=128(%rsp)
- movq %r11,128(%rsp)
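- # Third squaring: the limbs at pp+80..pp+112 (presumably Z) go through the
- # same multiply-and-reduce sequence.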
- # qhasm: squarerax = *(uint64 *)(pp + 80)
- # asm 1: movq 80(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 80(<pp=%rsi),>squarerax=%rax
- movq 80(%rsi),%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 80)
- # asm 1: mulq 80(<pp=int64#2)
- # asm 2: mulq 80(<pp=%rsi)
- mulq 80(%rsi)
- # qhasm: c0 = squarerax
- # asm 1: mov <squarerax=int64#7,>c0=int64#4
- # asm 2: mov <squarerax=%rax,>c0=%rcx
- mov %rax,%rcx
- # qhasm: squarer01 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer01=int64#5
- # asm 2: mov <squarerdx=%rdx,>squarer01=%r8
- mov %rdx,%r8
- # qhasm: squarerax = *(uint64 *)(pp + 80)
- # asm 1: movq 80(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 80(<pp=%rsi),>squarerax=%rax
- movq 80(%rsi),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 88)
- # asm 1: mulq 88(<pp=int64#2)
- # asm 2: mulq 88(<pp=%rsi)
- mulq 88(%rsi)
- # qhasm: c1 = squarerax
- # asm 1: mov <squarerax=int64#7,>c1=int64#6
- # asm 2: mov <squarerax=%rax,>c1=%r9
- mov %rax,%r9
- # qhasm: squarer11 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer11=int64#8
- # asm 2: mov <squarerdx=%rdx,>squarer11=%r10
- mov %rdx,%r10
- # qhasm: squarerax = *(uint64 *)(pp + 80)
- # asm 1: movq 80(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 80(<pp=%rsi),>squarerax=%rax
- movq 80(%rsi),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 96)
- # asm 1: mulq 96(<pp=int64#2)
- # asm 2: mulq 96(<pp=%rsi)
- mulq 96(%rsi)
- # qhasm: c2 = squarerax
- # asm 1: mov <squarerax=int64#7,>c2=int64#9
- # asm 2: mov <squarerax=%rax,>c2=%r11
- mov %rax,%r11
- # qhasm: squarer21 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer21=int64#10
- # asm 2: mov <squarerdx=%rdx,>squarer21=%r12
- mov %rdx,%r12
- # qhasm: squarerax = *(uint64 *)(pp + 80)
- # asm 1: movq 80(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 80(<pp=%rsi),>squarerax=%rax
- movq 80(%rsi),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 104)
- # asm 1: mulq 104(<pp=int64#2)
- # asm 2: mulq 104(<pp=%rsi)
- mulq 104(%rsi)
- # qhasm: c3 = squarerax
- # asm 1: mov <squarerax=int64#7,>c3=int64#11
- # asm 2: mov <squarerax=%rax,>c3=%r13
- mov %rax,%r13
- # qhasm: squarer31 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer31=int64#12
- # asm 2: mov <squarerdx=%rdx,>squarer31=%r14
- mov %rdx,%r14
- # qhasm: squarerax = *(uint64 *)(pp + 80)
- # asm 1: movq 80(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 80(<pp=%rsi),>squarerax=%rax
- movq 80(%rsi),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 112)
- # asm 1: mulq 112(<pp=int64#2)
- # asm 2: mulq 112(<pp=%rsi)
- mulq 112(%rsi)
- # qhasm: c4 = squarerax
- # asm 1: mov <squarerax=int64#7,>c4=int64#13
- # asm 2: mov <squarerax=%rax,>c4=%r15
- mov %rax,%r15
- # qhasm: squarer41 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer41=int64#14
- # asm 2: mov <squarerdx=%rdx,>squarer41=%rbx
- mov %rdx,%rbx
- # qhasm: squarerax = *(uint64 *)(pp + 88)
- # asm 1: movq 88(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 88(<pp=%rsi),>squarerax=%rax
- movq 88(%rsi),%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 88)
- # asm 1: mulq 88(<pp=int64#2)
- # asm 2: mulq 88(<pp=%rsi)
- mulq 88(%rsi)
- # qhasm: carry? c2 += squarerax
- # asm 1: add <squarerax=int64#7,<c2=int64#9
- # asm 2: add <squarerax=%rax,<c2=%r11
- add %rax,%r11
- # qhasm: squarer21 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer21=int64#10
- # asm 2: adc <squarerdx=%rdx,<squarer21=%r12
- adc %rdx,%r12
- # qhasm: squarerax = *(uint64 *)(pp + 88)
- # asm 1: movq 88(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 88(<pp=%rsi),>squarerax=%rax
- movq 88(%rsi),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 96)
- # asm 1: mulq 96(<pp=int64#2)
- # asm 2: mulq 96(<pp=%rsi)
- mulq 96(%rsi)
- # qhasm: carry? c3 += squarerax
- # asm 1: add <squarerax=int64#7,<c3=int64#11
- # asm 2: add <squarerax=%rax,<c3=%r13
- add %rax,%r13
- # qhasm: squarer31 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer31=int64#12
- # asm 2: adc <squarerdx=%rdx,<squarer31=%r14
- adc %rdx,%r14
- # qhasm: squarerax = *(uint64 *)(pp + 88)
- # asm 1: movq 88(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 88(<pp=%rsi),>squarerax=%rax
- movq 88(%rsi),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 104)
- # asm 1: mulq 104(<pp=int64#2)
- # asm 2: mulq 104(<pp=%rsi)
- mulq 104(%rsi)
- # qhasm: carry? c4 += squarerax
- # asm 1: add <squarerax=int64#7,<c4=int64#13
- # asm 2: add <squarerax=%rax,<c4=%r15
- add %rax,%r15
- # qhasm: squarer41 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer41=int64#14
- # asm 2: adc <squarerdx=%rdx,<squarer41=%rbx
- adc %rdx,%rbx
- # qhasm: squarerax = *(uint64 *)(pp + 88)
- # asm 1: movq 88(<pp=int64#2),>squarerax=int64#3
- # asm 2: movq 88(<pp=%rsi),>squarerax=%rdx
- movq 88(%rsi),%rdx
- # qhasm: squarerax *= 38
- # asm 1: imulq $38,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $38,<squarerax=%rdx,>squarerax=%rax
- imulq $38,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 112)
- # asm 1: mulq 112(<pp=int64#2)
- # asm 2: mulq 112(<pp=%rsi)
- mulq 112(%rsi)
- # qhasm: carry? c0 += squarerax
- # asm 1: add <squarerax=int64#7,<c0=int64#4
- # asm 2: add <squarerax=%rax,<c0=%rcx
- add %rax,%rcx
- # qhasm: squarer01 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer01=int64#5
- # asm 2: adc <squarerdx=%rdx,<squarer01=%r8
- adc %rdx,%r8
- # qhasm: squarerax = *(uint64 *)(pp + 96)
- # asm 1: movq 96(<pp=int64#2),>squarerax=int64#7
- # asm 2: movq 96(<pp=%rsi),>squarerax=%rax
- movq 96(%rsi),%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 96)
- # asm 1: mulq 96(<pp=int64#2)
- # asm 2: mulq 96(<pp=%rsi)
- mulq 96(%rsi)
- # qhasm: carry? c4 += squarerax
- # asm 1: add <squarerax=int64#7,<c4=int64#13
- # asm 2: add <squarerax=%rax,<c4=%r15
- add %rax,%r15
- # qhasm: squarer41 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer41=int64#14
- # asm 2: adc <squarerdx=%rdx,<squarer41=%rbx
- adc %rdx,%rbx
- # qhasm: squarerax = *(uint64 *)(pp + 96)
- # asm 1: movq 96(<pp=int64#2),>squarerax=int64#3
- # asm 2: movq 96(<pp=%rsi),>squarerax=%rdx
- movq 96(%rsi),%rdx
- # qhasm: squarerax *= 38
- # asm 1: imulq $38,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $38,<squarerax=%rdx,>squarerax=%rax
- imulq $38,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 104)
- # asm 1: mulq 104(<pp=int64#2)
- # asm 2: mulq 104(<pp=%rsi)
- mulq 104(%rsi)
- # qhasm: carry? c0 += squarerax
- # asm 1: add <squarerax=int64#7,<c0=int64#4
- # asm 2: add <squarerax=%rax,<c0=%rcx
- add %rax,%rcx
- # qhasm: squarer01 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer01=int64#5
- # asm 2: adc <squarerdx=%rdx,<squarer01=%r8
- adc %rdx,%r8
- # qhasm: squarerax = *(uint64 *)(pp + 96)
- # asm 1: movq 96(<pp=int64#2),>squarerax=int64#3
- # asm 2: movq 96(<pp=%rsi),>squarerax=%rdx
- movq 96(%rsi),%rdx
- # qhasm: squarerax *= 38
- # asm 1: imulq $38,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $38,<squarerax=%rdx,>squarerax=%rax
- imulq $38,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 112)
- # asm 1: mulq 112(<pp=int64#2)
- # asm 2: mulq 112(<pp=%rsi)
- mulq 112(%rsi)
- # qhasm: carry? c1 += squarerax
- # asm 1: add <squarerax=int64#7,<c1=int64#6
- # asm 2: add <squarerax=%rax,<c1=%r9
- add %rax,%r9
- # qhasm: squarer11 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer11=int64#8
- # asm 2: adc <squarerdx=%rdx,<squarer11=%r10
- adc %rdx,%r10
- # qhasm: squarerax = *(uint64 *)(pp + 104)
- # asm 1: movq 104(<pp=int64#2),>squarerax=int64#3
- # asm 2: movq 104(<pp=%rsi),>squarerax=%rdx
- movq 104(%rsi),%rdx
- # qhasm: squarerax *= 19
- # asm 1: imulq $19,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $19,<squarerax=%rdx,>squarerax=%rax
- imulq $19,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 104)
- # asm 1: mulq 104(<pp=int64#2)
- # asm 2: mulq 104(<pp=%rsi)
- mulq 104(%rsi)
- # qhasm: carry? c1 += squarerax
- # asm 1: add <squarerax=int64#7,<c1=int64#6
- # asm 2: add <squarerax=%rax,<c1=%r9
- add %rax,%r9
- # qhasm: squarer11 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer11=int64#8
- # asm 2: adc <squarerdx=%rdx,<squarer11=%r10
- adc %rdx,%r10
- # qhasm: squarerax = *(uint64 *)(pp + 104)
- # asm 1: movq 104(<pp=int64#2),>squarerax=int64#3
- # asm 2: movq 104(<pp=%rsi),>squarerax=%rdx
- movq 104(%rsi),%rdx
- # qhasm: squarerax *= 38
- # asm 1: imulq $38,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $38,<squarerax=%rdx,>squarerax=%rax
- imulq $38,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 112)
- # asm 1: mulq 112(<pp=int64#2)
- # asm 2: mulq 112(<pp=%rsi)
- mulq 112(%rsi)
- # qhasm: carry? c2 += squarerax
- # asm 1: add <squarerax=int64#7,<c2=int64#9
- # asm 2: add <squarerax=%rax,<c2=%r11
- add %rax,%r11
- # qhasm: squarer21 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer21=int64#10
- # asm 2: adc <squarerdx=%rdx,<squarer21=%r12
- adc %rdx,%r12
- # qhasm: squarerax = *(uint64 *)(pp + 112)
- # asm 1: movq 112(<pp=int64#2),>squarerax=int64#3
- # asm 2: movq 112(<pp=%rsi),>squarerax=%rdx
- movq 112(%rsi),%rdx
- # qhasm: squarerax *= 19
- # asm 1: imulq $19,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $19,<squarerax=%rdx,>squarerax=%rax
- imulq $19,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * *(uint64 *)(pp + 112)
- # asm 1: mulq 112(<pp=int64#2)
- # asm 2: mulq 112(<pp=%rsi)
- mulq 112(%rsi)
- # qhasm: carry? c3 += squarerax
- # asm 1: add <squarerax=int64#7,<c3=int64#11
- # asm 2: add <squarerax=%rax,<c3=%r13
- add %rax,%r13
- # qhasm: squarer31 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer31=int64#12
- # asm 2: adc <squarerdx=%rdx,<squarer31=%r14
- adc %rdx,%r14
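- # note (editorial): the 128-bit column sums accumulated above (low words c0..c4,
- # high words squarer01..squarer41) are now folded into five 51-bit limbs: shld $13
- # extracts the bits of each column above bit 51, the low word is masked with
- # REDMASK51, each extracted carry is added into the next limb, and the topmost
- # carry is multiplied by 19 (the usual 2^255-19 wraparound).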
- # qhasm: squareredmask = *(uint64 *) &CRYPTO_NAMESPACE(batch_REDMASK51)
- # asm 1: movq CRYPTO_NAMESPACE(batch_REDMASK51),>squareredmask=int64#3
- # asm 2: movq CRYPTO_NAMESPACE(batch_REDMASK51),>squareredmask=%rdx
- movq CRYPTO_NAMESPACE(batch_REDMASK51)(%rip),%rdx
- # qhasm: squarer01 = (squarer01.c0) << 13
- # asm 1: shld $13,<c0=int64#4,<squarer01=int64#5
- # asm 2: shld $13,<c0=%rcx,<squarer01=%r8
- shld $13,%rcx,%r8
- # qhasm: c0 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<c0=int64#4
- # asm 2: and <squareredmask=%rdx,<c0=%rcx
- and %rdx,%rcx
- # qhasm: squarer11 = (squarer11.c1) << 13
- # asm 1: shld $13,<c1=int64#6,<squarer11=int64#8
- # asm 2: shld $13,<c1=%r9,<squarer11=%r10
- shld $13,%r9,%r10
- # qhasm: c1 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<c1=int64#6
- # asm 2: and <squareredmask=%rdx,<c1=%r9
- and %rdx,%r9
- # qhasm: c1 += squarer01
- # asm 1: add <squarer01=int64#5,<c1=int64#6
- # asm 2: add <squarer01=%r8,<c1=%r9
- add %r8,%r9
- # qhasm: squarer21 = (squarer21.c2) << 13
- # asm 1: shld $13,<c2=int64#9,<squarer21=int64#10
- # asm 2: shld $13,<c2=%r11,<squarer21=%r12
- shld $13,%r11,%r12
- # qhasm: c2 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<c2=int64#9
- # asm 2: and <squareredmask=%rdx,<c2=%r11
- and %rdx,%r11
- # qhasm: c2 += squarer11
- # asm 1: add <squarer11=int64#8,<c2=int64#9
- # asm 2: add <squarer11=%r10,<c2=%r11
- add %r10,%r11
- # qhasm: squarer31 = (squarer31.c3) << 13
- # asm 1: shld $13,<c3=int64#11,<squarer31=int64#12
- # asm 2: shld $13,<c3=%r13,<squarer31=%r14
- shld $13,%r13,%r14
- # qhasm: c3 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<c3=int64#11
- # asm 2: and <squareredmask=%rdx,<c3=%r13
- and %rdx,%r13
- # qhasm: c3 += squarer21
- # asm 1: add <squarer21=int64#10,<c3=int64#11
- # asm 2: add <squarer21=%r12,<c3=%r13
- add %r12,%r13
- # qhasm: squarer41 = (squarer41.c4) << 13
- # asm 1: shld $13,<c4=int64#13,<squarer41=int64#14
- # asm 2: shld $13,<c4=%r15,<squarer41=%rbx
- shld $13,%r15,%rbx
- # qhasm: c4 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<c4=int64#13
- # asm 2: and <squareredmask=%rdx,<c4=%r15
- and %rdx,%r15
- # qhasm: c4 += squarer31
- # asm 1: add <squarer31=int64#12,<c4=int64#13
- # asm 2: add <squarer31=%r14,<c4=%r15
- add %r14,%r15
- # qhasm: squarer41 = squarer41 * 19
- # asm 1: imulq $19,<squarer41=int64#14,>squarer41=int64#5
- # asm 2: imulq $19,<squarer41=%rbx,>squarer41=%r8
- imulq $19,%rbx,%r8
- # qhasm: c0 += squarer41
- # asm 1: add <squarer41=int64#5,<c0=int64#4
- # asm 2: add <squarer41=%r8,<c0=%rcx
- add %r8,%rcx
- # qhasm: squaret = c0
- # asm 1: mov <c0=int64#4,>squaret=int64#5
- # asm 2: mov <c0=%rcx,>squaret=%r8
- mov %rcx,%r8
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#5
- # asm 2: shr $51,<squaret=%r8
- shr $51,%r8
- # qhasm: squaret += c1
- # asm 1: add <c1=int64#6,<squaret=int64#5
- # asm 2: add <c1=%r9,<squaret=%r8
- add %r9,%r8
- # qhasm: c0 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<c0=int64#4
- # asm 2: and <squareredmask=%rdx,<c0=%rcx
- and %rdx,%rcx
- # qhasm: c1 = squaret
- # asm 1: mov <squaret=int64#5,>c1=int64#6
- # asm 2: mov <squaret=%r8,>c1=%r9
- mov %r8,%r9
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#5
- # asm 2: shr $51,<squaret=%r8
- shr $51,%r8
- # qhasm: squaret += c2
- # asm 1: add <c2=int64#9,<squaret=int64#5
- # asm 2: add <c2=%r11,<squaret=%r8
- add %r11,%r8
- # qhasm: c1 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<c1=int64#6
- # asm 2: and <squareredmask=%rdx,<c1=%r9
- and %rdx,%r9
- # qhasm: c2 = squaret
- # asm 1: mov <squaret=int64#5,>c2=int64#7
- # asm 2: mov <squaret=%r8,>c2=%rax
- mov %r8,%rax
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#5
- # asm 2: shr $51,<squaret=%r8
- shr $51,%r8
- # qhasm: squaret += c3
- # asm 1: add <c3=int64#11,<squaret=int64#5
- # asm 2: add <c3=%r13,<squaret=%r8
- add %r13,%r8
- # qhasm: c2 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<c2=int64#7
- # asm 2: and <squareredmask=%rdx,<c2=%rax
- and %rdx,%rax
- # qhasm: c3 = squaret
- # asm 1: mov <squaret=int64#5,>c3=int64#8
- # asm 2: mov <squaret=%r8,>c3=%r10
- mov %r8,%r10
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#5
- # asm 2: shr $51,<squaret=%r8
- shr $51,%r8
- # qhasm: squaret += c4
- # asm 1: add <c4=int64#13,<squaret=int64#5
- # asm 2: add <c4=%r15,<squaret=%r8
- add %r15,%r8
- # qhasm: c3 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<c3=int64#8
- # asm 2: and <squareredmask=%rdx,<c3=%r10
- and %rdx,%r10
- # qhasm: c4 = squaret
- # asm 1: mov <squaret=int64#5,>c4=int64#9
- # asm 2: mov <squaret=%r8,>c4=%r11
- mov %r8,%r11
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#5
- # asm 2: shr $51,<squaret=%r8
- shr $51,%r8
- # qhasm: squaret *= 19
- # asm 1: imulq $19,<squaret=int64#5,>squaret=int64#5
- # asm 2: imulq $19,<squaret=%r8,>squaret=%r8
- imulq $19,%r8,%r8
- # qhasm: c0 += squaret
- # asm 1: add <squaret=int64#5,<c0=int64#4
- # asm 2: add <squaret=%r8,<c0=%rcx
- add %r8,%rcx
- # qhasm: c4 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<c4=int64#9
- # asm 2: and <squareredmask=%rdx,<c4=%r11
- and %rdx,%r11
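- # note (editorial): the reduced square is doubled limb by limb and spilled to the
- # stack as c0_stack..c4_stack, i.e. c = 2 * square.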
- # qhasm: c0 += c0
- # asm 1: add <c0=int64#4,<c0=int64#4
- # asm 2: add <c0=%rcx,<c0=%rcx
- add %rcx,%rcx
- # qhasm: c1 += c1
- # asm 1: add <c1=int64#6,<c1=int64#6
- # asm 2: add <c1=%r9,<c1=%r9
- add %r9,%r9
- # qhasm: c2 += c2
- # asm 1: add <c2=int64#7,<c2=int64#7
- # asm 2: add <c2=%rax,<c2=%rax
- add %rax,%rax
- # qhasm: c3 += c3
- # asm 1: add <c3=int64#8,<c3=int64#8
- # asm 2: add <c3=%r10,<c3=%r10
- add %r10,%r10
- # qhasm: c4 += c4
- # asm 1: add <c4=int64#9,<c4=int64#9
- # asm 2: add <c4=%r11,<c4=%r11
- add %r11,%r11
- # qhasm: c0_stack = c0
- # asm 1: movq <c0=int64#4,>c0_stack=stack64#18
- # asm 2: movq <c0=%rcx,>c0_stack=136(%rsp)
- movq %rcx,136(%rsp)
- # qhasm: c1_stack = c1
- # asm 1: movq <c1=int64#6,>c1_stack=stack64#19
- # asm 2: movq <c1=%r9,>c1_stack=144(%rsp)
- movq %r9,144(%rsp)
- # qhasm: c2_stack = c2
- # asm 1: movq <c2=int64#7,>c2_stack=stack64#20
- # asm 2: movq <c2=%rax,>c2_stack=152(%rsp)
- movq %rax,152(%rsp)
- # qhasm: c3_stack = c3
- # asm 1: movq <c3=int64#8,>c3_stack=stack64#21
- # asm 2: movq <c3=%r10,>c3_stack=160(%rsp)
- movq %r10,160(%rsp)
- # qhasm: c4_stack = c4
- # asm 1: movq <c4=int64#9,>c4_stack=stack64#22
- # asm 2: movq <c4=%r11,>c4_stack=168(%rsp)
- movq %r11,168(%rsp)
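- # note (editorial): load the 2*p bias constants and form d = 2P - a_stack and
- # e = 2P - b_stack limb-wise (the bias keeps the limb-wise subtractions
- # non-negative); a_stack and b_stack presumably hold the two squarings computed
- # earlier in this routine. Both results are then spilled to the stack.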
- # qhasm: d0 = *(uint64 *)&CRYPTO_NAMESPACE(batch_2P0)
- # asm 1: movq CRYPTO_NAMESPACE(batch_2P0),>d0=int64#3
- # asm 2: movq CRYPTO_NAMESPACE(batch_2P0),>d0=%rdx
- movq CRYPTO_NAMESPACE(batch_2P0)(%rip),%rdx
- # qhasm: d1 = *(uint64 *)&CRYPTO_NAMESPACE(batch_2P1234)
- # asm 1: movq CRYPTO_NAMESPACE(batch_2P1234),>d1=int64#4
- # asm 2: movq CRYPTO_NAMESPACE(batch_2P1234),>d1=%rcx
- movq CRYPTO_NAMESPACE(batch_2P1234)(%rip),%rcx
- # qhasm: d2 = *(uint64 *)&CRYPTO_NAMESPACE(batch_2P1234)
- # asm 1: movq CRYPTO_NAMESPACE(batch_2P1234),>d2=int64#5
- # asm 2: movq CRYPTO_NAMESPACE(batch_2P1234),>d2=%r8
- movq CRYPTO_NAMESPACE(batch_2P1234)(%rip),%r8
- # qhasm: d3 = *(uint64 *)&CRYPTO_NAMESPACE(batch_2P1234)
- # asm 1: movq CRYPTO_NAMESPACE(batch_2P1234),>d3=int64#6
- # asm 2: movq CRYPTO_NAMESPACE(batch_2P1234),>d3=%r9
- movq CRYPTO_NAMESPACE(batch_2P1234)(%rip),%r9
- # qhasm: d4 = *(uint64 *)&CRYPTO_NAMESPACE(batch_2P1234)
- # asm 1: movq CRYPTO_NAMESPACE(batch_2P1234),>d4=int64#7
- # asm 2: movq CRYPTO_NAMESPACE(batch_2P1234),>d4=%rax
- movq CRYPTO_NAMESPACE(batch_2P1234)(%rip),%rax
- # qhasm: e0 = d0
- # asm 1: mov <d0=int64#3,>e0=int64#8
- # asm 2: mov <d0=%rdx,>e0=%r10
- mov %rdx,%r10
- # qhasm: e1 = d1
- # asm 1: mov <d1=int64#4,>e1=int64#9
- # asm 2: mov <d1=%rcx,>e1=%r11
- mov %rcx,%r11
- # qhasm: e2 = d2
- # asm 1: mov <d2=int64#5,>e2=int64#10
- # asm 2: mov <d2=%r8,>e2=%r12
- mov %r8,%r12
- # qhasm: e3 = d3
- # asm 1: mov <d3=int64#6,>e3=int64#11
- # asm 2: mov <d3=%r9,>e3=%r13
- mov %r9,%r13
- # qhasm: e4 = d4
- # asm 1: mov <d4=int64#7,>e4=int64#12
- # asm 2: mov <d4=%rax,>e4=%r14
- mov %rax,%r14
- # qhasm: d0 -= a0_stack
- # asm 1: subq <a0_stack=stack64#8,<d0=int64#3
- # asm 2: subq <a0_stack=56(%rsp),<d0=%rdx
- subq 56(%rsp),%rdx
- # qhasm: d1 -= a1_stack
- # asm 1: subq <a1_stack=stack64#9,<d1=int64#4
- # asm 2: subq <a1_stack=64(%rsp),<d1=%rcx
- subq 64(%rsp),%rcx
- # qhasm: d2 -= a2_stack
- # asm 1: subq <a2_stack=stack64#10,<d2=int64#5
- # asm 2: subq <a2_stack=72(%rsp),<d2=%r8
- subq 72(%rsp),%r8
- # qhasm: d3 -= a3_stack
- # asm 1: subq <a3_stack=stack64#11,<d3=int64#6
- # asm 2: subq <a3_stack=80(%rsp),<d3=%r9
- subq 80(%rsp),%r9
- # qhasm: d4 -= a4_stack
- # asm 1: subq <a4_stack=stack64#12,<d4=int64#7
- # asm 2: subq <a4_stack=88(%rsp),<d4=%rax
- subq 88(%rsp),%rax
- # qhasm: e0 -= b0_stack
- # asm 1: subq <b0_stack=stack64#13,<e0=int64#8
- # asm 2: subq <b0_stack=96(%rsp),<e0=%r10
- subq 96(%rsp),%r10
- # qhasm: e1 -= b1_stack
- # asm 1: subq <b1_stack=stack64#14,<e1=int64#9
- # asm 2: subq <b1_stack=104(%rsp),<e1=%r11
- subq 104(%rsp),%r11
- # qhasm: e2 -= b2_stack
- # asm 1: subq <b2_stack=stack64#15,<e2=int64#10
- # asm 2: subq <b2_stack=112(%rsp),<e2=%r12
- subq 112(%rsp),%r12
- # qhasm: e3 -= b3_stack
- # asm 1: subq <b3_stack=stack64#16,<e3=int64#11
- # asm 2: subq <b3_stack=120(%rsp),<e3=%r13
- subq 120(%rsp),%r13
- # qhasm: e4 -= b4_stack
- # asm 1: subq <b4_stack=stack64#17,<e4=int64#12
- # asm 2: subq <b4_stack=128(%rsp),<e4=%r14
- subq 128(%rsp),%r14
- # qhasm: d0_stack = d0
- # asm 1: movq <d0=int64#3,>d0_stack=stack64#8
- # asm 2: movq <d0=%rdx,>d0_stack=56(%rsp)
- movq %rdx,56(%rsp)
- # qhasm: d1_stack = d1
- # asm 1: movq <d1=int64#4,>d1_stack=stack64#9
- # asm 2: movq <d1=%rcx,>d1_stack=64(%rsp)
- movq %rcx,64(%rsp)
- # qhasm: d2_stack = d2
- # asm 1: movq <d2=int64#5,>d2_stack=stack64#10
- # asm 2: movq <d2=%r8,>d2_stack=72(%rsp)
- movq %r8,72(%rsp)
- # qhasm: d3_stack = d3
- # asm 1: movq <d3=int64#6,>d3_stack=stack64#11
- # asm 2: movq <d3=%r9,>d3_stack=80(%rsp)
- movq %r9,80(%rsp)
- # qhasm: d4_stack = d4
- # asm 1: movq <d4=int64#7,>d4_stack=stack64#12
- # asm 2: movq <d4=%rax,>d4_stack=88(%rsp)
- movq %rax,88(%rsp)
- # qhasm: e0_stack = e0
- # asm 1: movq <e0=int64#8,>e0_stack=stack64#23
- # asm 2: movq <e0=%r10,>e0_stack=176(%rsp)
- movq %r10,176(%rsp)
- # qhasm: e1_stack = e1
- # asm 1: movq <e1=int64#9,>e1_stack=stack64#24
- # asm 2: movq <e1=%r11,>e1_stack=184(%rsp)
- movq %r11,184(%rsp)
- # qhasm: e2_stack = e2
- # asm 1: movq <e2=int64#10,>e2_stack=stack64#25
- # asm 2: movq <e2=%r12,>e2_stack=192(%rsp)
- movq %r12,192(%rsp)
- # qhasm: e3_stack = e3
- # asm 1: movq <e3=int64#11,>e3_stack=stack64#26
- # asm 2: movq <e3=%r13,>e3_stack=200(%rsp)
- movq %r13,200(%rsp)
- # qhasm: e4_stack = e4
- # asm 1: movq <e4=int64#12,>e4_stack=stack64#27
- # asm 2: movq <e4=%r14,>e4_stack=208(%rsp)
- movq %r14,208(%rsp)
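- # note (editorial): rz = d + b_stack (b - a plus the 2*p bias) is formed next and
- # stored to the output at rp+40..72.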
- # qhasm: rz0 = d0
- # asm 1: mov <d0=int64#3,>rz0=int64#8
- # asm 2: mov <d0=%rdx,>rz0=%r10
- mov %rdx,%r10
- # qhasm: rz1 = d1
- # asm 1: mov <d1=int64#4,>rz1=int64#9
- # asm 2: mov <d1=%rcx,>rz1=%r11
- mov %rcx,%r11
- # qhasm: rz2 = d2
- # asm 1: mov <d2=int64#5,>rz2=int64#10
- # asm 2: mov <d2=%r8,>rz2=%r12
- mov %r8,%r12
- # qhasm: rz3 = d3
- # asm 1: mov <d3=int64#6,>rz3=int64#11
- # asm 2: mov <d3=%r9,>rz3=%r13
- mov %r9,%r13
- # qhasm: rz4 = d4
- # asm 1: mov <d4=int64#7,>rz4=int64#12
- # asm 2: mov <d4=%rax,>rz4=%r14
- mov %rax,%r14
- # qhasm: rz0 += b0_stack
- # asm 1: addq <b0_stack=stack64#13,<rz0=int64#8
- # asm 2: addq <b0_stack=96(%rsp),<rz0=%r10
- addq 96(%rsp),%r10
- # qhasm: rz1 += b1_stack
- # asm 1: addq <b1_stack=stack64#14,<rz1=int64#9
- # asm 2: addq <b1_stack=104(%rsp),<rz1=%r11
- addq 104(%rsp),%r11
- # qhasm: rz2 += b2_stack
- # asm 1: addq <b2_stack=stack64#15,<rz2=int64#10
- # asm 2: addq <b2_stack=112(%rsp),<rz2=%r12
- addq 112(%rsp),%r12
- # qhasm: rz3 += b3_stack
- # asm 1: addq <b3_stack=stack64#16,<rz3=int64#11
- # asm 2: addq <b3_stack=120(%rsp),<rz3=%r13
- addq 120(%rsp),%r13
- # qhasm: rz4 += b4_stack
- # asm 1: addq <b4_stack=stack64#17,<rz4=int64#12
- # asm 2: addq <b4_stack=128(%rsp),<rz4=%r14
- addq 128(%rsp),%r14
- # qhasm: *(uint64 *) (rp + 40) = rz0
- # asm 1: movq <rz0=int64#8,40(<rp=int64#1)
- # asm 2: movq <rz0=%r10,40(<rp=%rdi)
- movq %r10,40(%rdi)
- # qhasm: *(uint64 *) (rp + 48) = rz1
- # asm 1: movq <rz1=int64#9,48(<rp=int64#1)
- # asm 2: movq <rz1=%r11,48(<rp=%rdi)
- movq %r11,48(%rdi)
- # qhasm: *(uint64 *) (rp + 56) = rz2
- # asm 1: movq <rz2=int64#10,56(<rp=int64#1)
- # asm 2: movq <rz2=%r12,56(<rp=%rdi)
- movq %r12,56(%rdi)
- # qhasm: *(uint64 *) (rp + 64) = rz3
- # asm 1: movq <rz3=int64#11,64(<rp=int64#1)
- # asm 2: movq <rz3=%r13,64(<rp=%rdi)
- movq %r13,64(%rdi)
- # qhasm: *(uint64 *) (rp + 72) = rz4
- # asm 1: movq <rz4=int64#12,72(<rp=int64#1)
- # asm 2: movq <rz4=%r14,72(<rp=%rdi)
- movq %r14,72(%rdi)
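- # note (editorial): d is given another 2*p bias and b_stack is subtracted
- # (d - b plus bias); the result is stored to rp+80..112.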
- # qhasm: d0 += *(uint64 *)&CRYPTO_NAMESPACE(batch_2P0)
- # asm 1: add CRYPTO_NAMESPACE(batch_2P0),<d0=int64#3
- # asm 2: add CRYPTO_NAMESPACE(batch_2P0),<d0=%rdx
- add CRYPTO_NAMESPACE(batch_2P0)(%rip),%rdx
- # qhasm: d1 += *(uint64 *)&CRYPTO_NAMESPACE(batch_2P1234)
- # asm 1: add CRYPTO_NAMESPACE(batch_2P1234),<d1=int64#4
- # asm 2: add CRYPTO_NAMESPACE(batch_2P1234),<d1=%rcx
- add CRYPTO_NAMESPACE(batch_2P1234)(%rip),%rcx
- # qhasm: d2 += *(uint64 *)&CRYPTO_NAMESPACE(batch_2P1234)
- # asm 1: add CRYPTO_NAMESPACE(batch_2P1234),<d2=int64#5
- # asm 2: add CRYPTO_NAMESPACE(batch_2P1234),<d2=%r8
- add CRYPTO_NAMESPACE(batch_2P1234)(%rip),%r8
- # qhasm: d3 += *(uint64 *)&CRYPTO_NAMESPACE(batch_2P1234)
- # asm 1: add CRYPTO_NAMESPACE(batch_2P1234),<d3=int64#6
- # asm 2: add CRYPTO_NAMESPACE(batch_2P1234),<d3=%r9
- add CRYPTO_NAMESPACE(batch_2P1234)(%rip),%r9
- # qhasm: d4 += *(uint64 *)&CRYPTO_NAMESPACE(batch_2P1234)
- # asm 1: add CRYPTO_NAMESPACE(batch_2P1234),<d4=int64#7
- # asm 2: add CRYPTO_NAMESPACE(batch_2P1234),<d4=%rax
- add CRYPTO_NAMESPACE(batch_2P1234)(%rip),%rax
- # qhasm: d0 -= b0_stack
- # asm 1: subq <b0_stack=stack64#13,<d0=int64#3
- # asm 2: subq <b0_stack=96(%rsp),<d0=%rdx
- subq 96(%rsp),%rdx
- # qhasm: d1 -= b1_stack
- # asm 1: subq <b1_stack=stack64#14,<d1=int64#4
- # asm 2: subq <b1_stack=104(%rsp),<d1=%rcx
- subq 104(%rsp),%rcx
- # qhasm: d2 -= b2_stack
- # asm 1: subq <b2_stack=stack64#15,<d2=int64#5
- # asm 2: subq <b2_stack=112(%rsp),<d2=%r8
- subq 112(%rsp),%r8
- # qhasm: d3 -= b3_stack
- # asm 1: subq <b3_stack=stack64#16,<d3=int64#6
- # asm 2: subq <b3_stack=120(%rsp),<d3=%r9
- subq 120(%rsp),%r9
- # qhasm: d4 -= b4_stack
- # asm 1: subq <b4_stack=stack64#17,<d4=int64#7
- # asm 2: subq <b4_stack=128(%rsp),<d4=%rax
- subq 128(%rsp),%rax
- # qhasm: *(uint64 *)(rp + 80) = d0
- # asm 1: movq <d0=int64#3,80(<rp=int64#1)
- # asm 2: movq <d0=%rdx,80(<rp=%rdi)
- movq %rdx,80(%rdi)
- # qhasm: *(uint64 *)(rp + 88) = d1
- # asm 1: movq <d1=int64#4,88(<rp=int64#1)
- # asm 2: movq <d1=%rcx,88(<rp=%rdi)
- movq %rcx,88(%rdi)
- # qhasm: *(uint64 *)(rp + 96) = d2
- # asm 1: movq <d2=int64#5,96(<rp=int64#1)
- # asm 2: movq <d2=%r8,96(<rp=%rdi)
- movq %r8,96(%rdi)
- # qhasm: *(uint64 *)(rp + 104) = d3
- # asm 1: movq <d3=int64#6,104(<rp=int64#1)
- # asm 2: movq <d3=%r9,104(<rp=%rdi)
- movq %r9,104(%rdi)
- # qhasm: *(uint64 *)(rp + 112) = d4
- # asm 1: movq <d4=int64#7,112(<rp=int64#1)
- # asm 2: movq <d4=%rax,112(<rp=%rdi)
- movq %rax,112(%rdi)
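- # note (editorial): rz is given a 4*p bias and the doubled square c
- # (c0_stack..c4_stack) is subtracted; the result is stored to rp+120..152.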
- # qhasm: rz0 += *(uint64 *)&CRYPTO_NAMESPACE(batch_4P0)
- # asm 1: add CRYPTO_NAMESPACE(batch_4P0),<rz0=int64#8
- # asm 2: add CRYPTO_NAMESPACE(batch_4P0),<rz0=%r10
- add CRYPTO_NAMESPACE(batch_4P0)(%rip),%r10
- # qhasm: rz1 += *(uint64 *)&CRYPTO_NAMESPACE(batch_4P1234)
- # asm 1: add CRYPTO_NAMESPACE(batch_4P1234),<rz1=int64#9
- # asm 2: add CRYPTO_NAMESPACE(batch_4P1234),<rz1=%r11
- add CRYPTO_NAMESPACE(batch_4P1234)(%rip),%r11
- # qhasm: rz2 += *(uint64 *)&CRYPTO_NAMESPACE(batch_4P1234)
- # asm 1: add CRYPTO_NAMESPACE(batch_4P1234),<rz2=int64#10
- # asm 2: add CRYPTO_NAMESPACE(batch_4P1234),<rz2=%r12
- add CRYPTO_NAMESPACE(batch_4P1234)(%rip),%r12
- # qhasm: rz3 += *(uint64 *)&CRYPTO_NAMESPACE(batch_4P1234)
- # asm 1: add CRYPTO_NAMESPACE(batch_4P1234),<rz3=int64#11
- # asm 2: add CRYPTO_NAMESPACE(batch_4P1234),<rz3=%r13
- add CRYPTO_NAMESPACE(batch_4P1234)(%rip),%r13
- # qhasm: rz4 += *(uint64 *)&CRYPTO_NAMESPACE(batch_4P1234)
- # asm 1: add CRYPTO_NAMESPACE(batch_4P1234),<rz4=int64#12
- # asm 2: add CRYPTO_NAMESPACE(batch_4P1234),<rz4=%r14
- add CRYPTO_NAMESPACE(batch_4P1234)(%rip),%r14
- # qhasm: rz0 -= c0_stack
- # asm 1: subq <c0_stack=stack64#18,<rz0=int64#8
- # asm 2: subq <c0_stack=136(%rsp),<rz0=%r10
- subq 136(%rsp),%r10
- # qhasm: rz1 -= c1_stack
- # asm 1: subq <c1_stack=stack64#19,<rz1=int64#9
- # asm 2: subq <c1_stack=144(%rsp),<rz1=%r11
- subq 144(%rsp),%r11
- # qhasm: rz2 -= c2_stack
- # asm 1: subq <c2_stack=stack64#20,<rz2=int64#10
- # asm 2: subq <c2_stack=152(%rsp),<rz2=%r12
- subq 152(%rsp),%r12
- # qhasm: rz3 -= c3_stack
- # asm 1: subq <c3_stack=stack64#21,<rz3=int64#11
- # asm 2: subq <c3_stack=160(%rsp),<rz3=%r13
- subq 160(%rsp),%r13
- # qhasm: rz4 -= c4_stack
- # asm 1: subq <c4_stack=stack64#22,<rz4=int64#12
- # asm 2: subq <c4_stack=168(%rsp),<rz4=%r14
- subq 168(%rsp),%r14
- # qhasm: *(uint64 *) (rp + 120) = rz0
- # asm 1: movq <rz0=int64#8,120(<rp=int64#1)
- # asm 2: movq <rz0=%r10,120(<rp=%rdi)
- movq %r10,120(%rdi)
- # qhasm: *(uint64 *) (rp + 128) = rz1
- # asm 1: movq <rz1=int64#9,128(<rp=int64#1)
- # asm 2: movq <rz1=%r11,128(<rp=%rdi)
- movq %r11,128(%rdi)
- # qhasm: *(uint64 *) (rp + 136) = rz2
- # asm 1: movq <rz2=int64#10,136(<rp=int64#1)
- # asm 2: movq <rz2=%r12,136(<rp=%rdi)
- movq %r12,136(%rdi)
- # qhasm: *(uint64 *) (rp + 144) = rz3
- # asm 1: movq <rz3=int64#11,144(<rp=int64#1)
- # asm 2: movq <rz3=%r13,144(<rp=%rdi)
- movq %r13,144(%rdi)
- # qhasm: *(uint64 *) (rp + 152) = rz4
- # asm 1: movq <rz4=int64#12,152(<rp=int64#1)
- # asm 2: movq <rz4=%r14,152(<rp=%rdi)
- movq %r14,152(%rdi)
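- # note (editorial): load the field element at pp+0..32, add the one at pp+40..72
- # (presumably X and Y of the input point), and spill the limb-wise sum to the
- # stack in preparation for squaring it.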
- # qhasm: rx0 = *(uint64 *)(pp + 0)
- # asm 1: movq 0(<pp=int64#2),>rx0=int64#3
- # asm 2: movq 0(<pp=%rsi),>rx0=%rdx
- movq 0(%rsi),%rdx
- # qhasm: rx1 = *(uint64 *)(pp + 8)
- # asm 1: movq 8(<pp=int64#2),>rx1=int64#4
- # asm 2: movq 8(<pp=%rsi),>rx1=%rcx
- movq 8(%rsi),%rcx
- # qhasm: rx2 = *(uint64 *)(pp + 16)
- # asm 1: movq 16(<pp=int64#2),>rx2=int64#5
- # asm 2: movq 16(<pp=%rsi),>rx2=%r8
- movq 16(%rsi),%r8
- # qhasm: rx3 = *(uint64 *)(pp + 24)
- # asm 1: movq 24(<pp=int64#2),>rx3=int64#6
- # asm 2: movq 24(<pp=%rsi),>rx3=%r9
- movq 24(%rsi),%r9
- # qhasm: rx4 = *(uint64 *)(pp + 32)
- # asm 1: movq 32(<pp=int64#2),>rx4=int64#7
- # asm 2: movq 32(<pp=%rsi),>rx4=%rax
- movq 32(%rsi),%rax
- # qhasm: rx0 += *(uint64 *)(pp + 40)
- # asm 1: addq 40(<pp=int64#2),<rx0=int64#3
- # asm 2: addq 40(<pp=%rsi),<rx0=%rdx
- addq 40(%rsi),%rdx
- # qhasm: rx1 += *(uint64 *)(pp + 48)
- # asm 1: addq 48(<pp=int64#2),<rx1=int64#4
- # asm 2: addq 48(<pp=%rsi),<rx1=%rcx
- addq 48(%rsi),%rcx
- # qhasm: rx2 += *(uint64 *)(pp + 56)
- # asm 1: addq 56(<pp=int64#2),<rx2=int64#5
- # asm 2: addq 56(<pp=%rsi),<rx2=%r8
- addq 56(%rsi),%r8
- # qhasm: rx3 += *(uint64 *)(pp + 64)
- # asm 1: addq 64(<pp=int64#2),<rx3=int64#6
- # asm 2: addq 64(<pp=%rsi),<rx3=%r9
- addq 64(%rsi),%r9
- # qhasm: rx4 += *(uint64 *)(pp + 72)
- # asm 1: addq 72(<pp=int64#2),<rx4=int64#7
- # asm 2: addq 72(<pp=%rsi),<rx4=%rax
- addq 72(%rsi),%rax
- # qhasm: rx0_stack = rx0
- # asm 1: movq <rx0=int64#3,>rx0_stack=stack64#13
- # asm 2: movq <rx0=%rdx,>rx0_stack=96(%rsp)
- movq %rdx,96(%rsp)
- # qhasm: rx1_stack = rx1
- # asm 1: movq <rx1=int64#4,>rx1_stack=stack64#14
- # asm 2: movq <rx1=%rcx,>rx1_stack=104(%rsp)
- movq %rcx,104(%rsp)
- # qhasm: rx2_stack = rx2
- # asm 1: movq <rx2=int64#5,>rx2_stack=stack64#15
- # asm 2: movq <rx2=%r8,>rx2_stack=112(%rsp)
- movq %r8,112(%rsp)
- # qhasm: rx3_stack = rx3
- # asm 1: movq <rx3=int64#6,>rx3_stack=stack64#16
- # asm 2: movq <rx3=%r9,>rx3_stack=120(%rsp)
- movq %r9,120(%rsp)
- # qhasm: rx4_stack = rx4
- # asm 1: movq <rx4=int64#7,>rx4_stack=stack64#17
- # asm 2: movq <rx4=%rax,>rx4_stack=128(%rsp)
- movq %rax,128(%rsp)
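- # note (editorial): schoolbook squaring of the five-limb sum in radix 2^51:
- # cross products are doubled via shl $1, and products that wrap past limb 4 are
- # pre-scaled by 19 or 38 before being accumulated.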
- # qhasm: squarerax = rx0_stack
- # asm 1: movq <rx0_stack=stack64#13,>squarerax=int64#7
- # asm 2: movq <rx0_stack=96(%rsp),>squarerax=%rax
- movq 96(%rsp),%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * rx0_stack
- # asm 1: mulq <rx0_stack=stack64#13
- # asm 2: mulq <rx0_stack=96(%rsp)
- mulq 96(%rsp)
- # qhasm: rx0 = squarerax
- # asm 1: mov <squarerax=int64#7,>rx0=int64#2
- # asm 2: mov <squarerax=%rax,>rx0=%rsi
- mov %rax,%rsi
- # qhasm: squarer01 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer01=int64#4
- # asm 2: mov <squarerdx=%rdx,>squarer01=%rcx
- mov %rdx,%rcx
- # qhasm: squarerax = rx0_stack
- # asm 1: movq <rx0_stack=stack64#13,>squarerax=int64#7
- # asm 2: movq <rx0_stack=96(%rsp),>squarerax=%rax
- movq 96(%rsp),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * rx1_stack
- # asm 1: mulq <rx1_stack=stack64#14
- # asm 2: mulq <rx1_stack=104(%rsp)
- mulq 104(%rsp)
- # qhasm: rx1 = squarerax
- # asm 1: mov <squarerax=int64#7,>rx1=int64#5
- # asm 2: mov <squarerax=%rax,>rx1=%r8
- mov %rax,%r8
- # qhasm: squarer11 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer11=int64#6
- # asm 2: mov <squarerdx=%rdx,>squarer11=%r9
- mov %rdx,%r9
- # qhasm: squarerax = rx0_stack
- # asm 1: movq <rx0_stack=stack64#13,>squarerax=int64#7
- # asm 2: movq <rx0_stack=96(%rsp),>squarerax=%rax
- movq 96(%rsp),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * rx2_stack
- # asm 1: mulq <rx2_stack=stack64#15
- # asm 2: mulq <rx2_stack=112(%rsp)
- mulq 112(%rsp)
- # qhasm: rx2 = squarerax
- # asm 1: mov <squarerax=int64#7,>rx2=int64#8
- # asm 2: mov <squarerax=%rax,>rx2=%r10
- mov %rax,%r10
- # qhasm: squarer21 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer21=int64#9
- # asm 2: mov <squarerdx=%rdx,>squarer21=%r11
- mov %rdx,%r11
- # qhasm: squarerax = rx0_stack
- # asm 1: movq <rx0_stack=stack64#13,>squarerax=int64#7
- # asm 2: movq <rx0_stack=96(%rsp),>squarerax=%rax
- movq 96(%rsp),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * rx3_stack
- # asm 1: mulq <rx3_stack=stack64#16
- # asm 2: mulq <rx3_stack=120(%rsp)
- mulq 120(%rsp)
- # qhasm: rx3 = squarerax
- # asm 1: mov <squarerax=int64#7,>rx3=int64#10
- # asm 2: mov <squarerax=%rax,>rx3=%r12
- mov %rax,%r12
- # qhasm: squarer31 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer31=int64#11
- # asm 2: mov <squarerdx=%rdx,>squarer31=%r13
- mov %rdx,%r13
- # qhasm: squarerax = rx0_stack
- # asm 1: movq <rx0_stack=stack64#13,>squarerax=int64#7
- # asm 2: movq <rx0_stack=96(%rsp),>squarerax=%rax
- movq 96(%rsp),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * rx4_stack
- # asm 1: mulq <rx4_stack=stack64#17
- # asm 2: mulq <rx4_stack=128(%rsp)
- mulq 128(%rsp)
- # qhasm: rx4 = squarerax
- # asm 1: mov <squarerax=int64#7,>rx4=int64#12
- # asm 2: mov <squarerax=%rax,>rx4=%r14
- mov %rax,%r14
- # qhasm: squarer41 = squarerdx
- # asm 1: mov <squarerdx=int64#3,>squarer41=int64#13
- # asm 2: mov <squarerdx=%rdx,>squarer41=%r15
- mov %rdx,%r15
- # qhasm: squarerax = rx1_stack
- # asm 1: movq <rx1_stack=stack64#14,>squarerax=int64#7
- # asm 2: movq <rx1_stack=104(%rsp),>squarerax=%rax
- movq 104(%rsp),%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * rx1_stack
- # asm 1: mulq <rx1_stack=stack64#14
- # asm 2: mulq <rx1_stack=104(%rsp)
- mulq 104(%rsp)
- # qhasm: carry? rx2 += squarerax
- # asm 1: add <squarerax=int64#7,<rx2=int64#8
- # asm 2: add <squarerax=%rax,<rx2=%r10
- add %rax,%r10
- # qhasm: squarer21 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer21=int64#9
- # asm 2: adc <squarerdx=%rdx,<squarer21=%r11
- adc %rdx,%r11
- # qhasm: squarerax = rx1_stack
- # asm 1: movq <rx1_stack=stack64#14,>squarerax=int64#7
- # asm 2: movq <rx1_stack=104(%rsp),>squarerax=%rax
- movq 104(%rsp),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * rx2_stack
- # asm 1: mulq <rx2_stack=stack64#15
- # asm 2: mulq <rx2_stack=112(%rsp)
- mulq 112(%rsp)
- # qhasm: carry? rx3 += squarerax
- # asm 1: add <squarerax=int64#7,<rx3=int64#10
- # asm 2: add <squarerax=%rax,<rx3=%r12
- add %rax,%r12
- # qhasm: squarer31 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer31=int64#11
- # asm 2: adc <squarerdx=%rdx,<squarer31=%r13
- adc %rdx,%r13
- # qhasm: squarerax = rx1_stack
- # asm 1: movq <rx1_stack=stack64#14,>squarerax=int64#7
- # asm 2: movq <rx1_stack=104(%rsp),>squarerax=%rax
- movq 104(%rsp),%rax
- # qhasm: squarerax <<= 1
- # asm 1: shl $1,<squarerax=int64#7
- # asm 2: shl $1,<squarerax=%rax
- shl $1,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * rx3_stack
- # asm 1: mulq <rx3_stack=stack64#16
- # asm 2: mulq <rx3_stack=120(%rsp)
- mulq 120(%rsp)
- # qhasm: carry? rx4 += squarerax
- # asm 1: add <squarerax=int64#7,<rx4=int64#12
- # asm 2: add <squarerax=%rax,<rx4=%r14
- add %rax,%r14
- # qhasm: squarer41 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer41=int64#13
- # asm 2: adc <squarerdx=%rdx,<squarer41=%r15
- adc %rdx,%r15
- # qhasm: squarerax = rx1_stack
- # asm 1: movq <rx1_stack=stack64#14,>squarerax=int64#3
- # asm 2: movq <rx1_stack=104(%rsp),>squarerax=%rdx
- movq 104(%rsp),%rdx
- # qhasm: squarerax *= 38
- # asm 1: imulq $38,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $38,<squarerax=%rdx,>squarerax=%rax
- imulq $38,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * rx4_stack
- # asm 1: mulq <rx4_stack=stack64#17
- # asm 2: mulq <rx4_stack=128(%rsp)
- mulq 128(%rsp)
- # qhasm: carry? rx0 += squarerax
- # asm 1: add <squarerax=int64#7,<rx0=int64#2
- # asm 2: add <squarerax=%rax,<rx0=%rsi
- add %rax,%rsi
- # qhasm: squarer01 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer01=int64#4
- # asm 2: adc <squarerdx=%rdx,<squarer01=%rcx
- adc %rdx,%rcx
- # qhasm: squarerax = rx2_stack
- # asm 1: movq <rx2_stack=stack64#15,>squarerax=int64#7
- # asm 2: movq <rx2_stack=112(%rsp),>squarerax=%rax
- movq 112(%rsp),%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * rx2_stack
- # asm 1: mulq <rx2_stack=stack64#15
- # asm 2: mulq <rx2_stack=112(%rsp)
- mulq 112(%rsp)
- # qhasm: carry? rx4 += squarerax
- # asm 1: add <squarerax=int64#7,<rx4=int64#12
- # asm 2: add <squarerax=%rax,<rx4=%r14
- add %rax,%r14
- # qhasm: squarer41 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer41=int64#13
- # asm 2: adc <squarerdx=%rdx,<squarer41=%r15
- adc %rdx,%r15
- # qhasm: squarerax = rx2_stack
- # asm 1: movq <rx2_stack=stack64#15,>squarerax=int64#3
- # asm 2: movq <rx2_stack=112(%rsp),>squarerax=%rdx
- movq 112(%rsp),%rdx
- # qhasm: squarerax *= 38
- # asm 1: imulq $38,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $38,<squarerax=%rdx,>squarerax=%rax
- imulq $38,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * rx3_stack
- # asm 1: mulq <rx3_stack=stack64#16
- # asm 2: mulq <rx3_stack=120(%rsp)
- mulq 120(%rsp)
- # qhasm: carry? rx0 += squarerax
- # asm 1: add <squarerax=int64#7,<rx0=int64#2
- # asm 2: add <squarerax=%rax,<rx0=%rsi
- add %rax,%rsi
- # qhasm: squarer01 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer01=int64#4
- # asm 2: adc <squarerdx=%rdx,<squarer01=%rcx
- adc %rdx,%rcx
- # qhasm: squarerax = rx2_stack
- # asm 1: movq <rx2_stack=stack64#15,>squarerax=int64#3
- # asm 2: movq <rx2_stack=112(%rsp),>squarerax=%rdx
- movq 112(%rsp),%rdx
- # qhasm: squarerax *= 38
- # asm 1: imulq $38,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $38,<squarerax=%rdx,>squarerax=%rax
- imulq $38,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * rx4_stack
- # asm 1: mulq <rx4_stack=stack64#17
- # asm 2: mulq <rx4_stack=128(%rsp)
- mulq 128(%rsp)
- # qhasm: carry? rx1 += squarerax
- # asm 1: add <squarerax=int64#7,<rx1=int64#5
- # asm 2: add <squarerax=%rax,<rx1=%r8
- add %rax,%r8
- # qhasm: squarer11 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer11=int64#6
- # asm 2: adc <squarerdx=%rdx,<squarer11=%r9
- adc %rdx,%r9
- # qhasm: squarerax = rx3_stack
- # asm 1: movq <rx3_stack=stack64#16,>squarerax=int64#3
- # asm 2: movq <rx3_stack=120(%rsp),>squarerax=%rdx
- movq 120(%rsp),%rdx
- # qhasm: squarerax *= 19
- # asm 1: imulq $19,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $19,<squarerax=%rdx,>squarerax=%rax
- imulq $19,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * rx3_stack
- # asm 1: mulq <rx3_stack=stack64#16
- # asm 2: mulq <rx3_stack=120(%rsp)
- mulq 120(%rsp)
- # qhasm: carry? rx1 += squarerax
- # asm 1: add <squarerax=int64#7,<rx1=int64#5
- # asm 2: add <squarerax=%rax,<rx1=%r8
- add %rax,%r8
- # qhasm: squarer11 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer11=int64#6
- # asm 2: adc <squarerdx=%rdx,<squarer11=%r9
- adc %rdx,%r9
- # qhasm: squarerax = rx3_stack
- # asm 1: movq <rx3_stack=stack64#16,>squarerax=int64#3
- # asm 2: movq <rx3_stack=120(%rsp),>squarerax=%rdx
- movq 120(%rsp),%rdx
- # qhasm: squarerax *= 38
- # asm 1: imulq $38,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $38,<squarerax=%rdx,>squarerax=%rax
- imulq $38,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * rx4_stack
- # asm 1: mulq <rx4_stack=stack64#17
- # asm 2: mulq <rx4_stack=128(%rsp)
- mulq 128(%rsp)
- # qhasm: carry? rx2 += squarerax
- # asm 1: add <squarerax=int64#7,<rx2=int64#8
- # asm 2: add <squarerax=%rax,<rx2=%r10
- add %rax,%r10
- # qhasm: squarer21 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer21=int64#9
- # asm 2: adc <squarerdx=%rdx,<squarer21=%r11
- adc %rdx,%r11
- # qhasm: squarerax = rx4_stack
- # asm 1: movq <rx4_stack=stack64#17,>squarerax=int64#3
- # asm 2: movq <rx4_stack=128(%rsp),>squarerax=%rdx
- movq 128(%rsp),%rdx
- # qhasm: squarerax *= 19
- # asm 1: imulq $19,<squarerax=int64#3,>squarerax=int64#7
- # asm 2: imulq $19,<squarerax=%rdx,>squarerax=%rax
- imulq $19,%rdx,%rax
- # qhasm: (uint128) squarerdx squarerax = squarerax * rx4_stack
- # asm 1: mulq <rx4_stack=stack64#17
- # asm 2: mulq <rx4_stack=128(%rsp)
- mulq 128(%rsp)
- # qhasm: carry? rx3 += squarerax
- # asm 1: add <squarerax=int64#7,<rx3=int64#10
- # asm 2: add <squarerax=%rax,<rx3=%r12
- add %rax,%r12
- # qhasm: squarer31 += squarerdx + carry
- # asm 1: adc <squarerdx=int64#3,<squarer31=int64#11
- # asm 2: adc <squarerdx=%rdx,<squarer31=%r13
- adc %rdx,%r13
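- # note (editorial): the same REDMASK51 folding and carry pass as above. As an
- # editor's sketch (not part of the original source), the final carry chain
- # corresponds to, with mask presumably 2^51 - 1:
- #   t = r0 >> 51; r1 += t; r0 &= mask;
- #   t = r1 >> 51; r2 += t; r1 &= mask;
- #   t = r2 >> 51; r3 += t; r2 &= mask;
- #   t = r3 >> 51; r4 += t; r3 &= mask;
- #   t = r4 >> 51; r0 += 19*t; r4 &= mask;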
- # qhasm: squareredmask = *(uint64 *) &CRYPTO_NAMESPACE(batch_REDMASK51)
- # asm 1: movq CRYPTO_NAMESPACE(batch_REDMASK51),>squareredmask=int64#3
- # asm 2: movq CRYPTO_NAMESPACE(batch_REDMASK51),>squareredmask=%rdx
- movq CRYPTO_NAMESPACE(batch_REDMASK51)(%rip),%rdx
- # qhasm: squarer01 = (squarer01.rx0) << 13
- # asm 1: shld $13,<rx0=int64#2,<squarer01=int64#4
- # asm 2: shld $13,<rx0=%rsi,<squarer01=%rcx
- shld $13,%rsi,%rcx
- # qhasm: rx0 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<rx0=int64#2
- # asm 2: and <squareredmask=%rdx,<rx0=%rsi
- and %rdx,%rsi
- # qhasm: squarer11 = (squarer11.rx1) << 13
- # asm 1: shld $13,<rx1=int64#5,<squarer11=int64#6
- # asm 2: shld $13,<rx1=%r8,<squarer11=%r9
- shld $13,%r8,%r9
- # qhasm: rx1 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<rx1=int64#5
- # asm 2: and <squareredmask=%rdx,<rx1=%r8
- and %rdx,%r8
- # qhasm: rx1 += squarer01
- # asm 1: add <squarer01=int64#4,<rx1=int64#5
- # asm 2: add <squarer01=%rcx,<rx1=%r8
- add %rcx,%r8
- # qhasm: squarer21 = (squarer21.rx2) << 13
- # asm 1: shld $13,<rx2=int64#8,<squarer21=int64#9
- # asm 2: shld $13,<rx2=%r10,<squarer21=%r11
- shld $13,%r10,%r11
- # qhasm: rx2 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<rx2=int64#8
- # asm 2: and <squareredmask=%rdx,<rx2=%r10
- and %rdx,%r10
- # qhasm: rx2 += squarer11
- # asm 1: add <squarer11=int64#6,<rx2=int64#8
- # asm 2: add <squarer11=%r9,<rx2=%r10
- add %r9,%r10
- # qhasm: squarer31 = (squarer31.rx3) << 13
- # asm 1: shld $13,<rx3=int64#10,<squarer31=int64#11
- # asm 2: shld $13,<rx3=%r12,<squarer31=%r13
- shld $13,%r12,%r13
- # qhasm: rx3 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<rx3=int64#10
- # asm 2: and <squareredmask=%rdx,<rx3=%r12
- and %rdx,%r12
- # qhasm: rx3 += squarer21
- # asm 1: add <squarer21=int64#9,<rx3=int64#10
- # asm 2: add <squarer21=%r11,<rx3=%r12
- add %r11,%r12
- # qhasm: squarer41 = (squarer41.rx4) << 13
- # asm 1: shld $13,<rx4=int64#12,<squarer41=int64#13
- # asm 2: shld $13,<rx4=%r14,<squarer41=%r15
- shld $13,%r14,%r15
- # qhasm: rx4 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<rx4=int64#12
- # asm 2: and <squareredmask=%rdx,<rx4=%r14
- and %rdx,%r14
- # qhasm: rx4 += squarer31
- # asm 1: add <squarer31=int64#11,<rx4=int64#12
- # asm 2: add <squarer31=%r13,<rx4=%r14
- add %r13,%r14
- # qhasm: squarer41 = squarer41 * 19
- # asm 1: imulq $19,<squarer41=int64#13,>squarer41=int64#4
- # asm 2: imulq $19,<squarer41=%r15,>squarer41=%rcx
- imulq $19,%r15,%rcx
- # qhasm: rx0 += squarer41
- # asm 1: add <squarer41=int64#4,<rx0=int64#2
- # asm 2: add <squarer41=%rcx,<rx0=%rsi
- add %rcx,%rsi
- # qhasm: squaret = rx0
- # asm 1: mov <rx0=int64#2,>squaret=int64#4
- # asm 2: mov <rx0=%rsi,>squaret=%rcx
- mov %rsi,%rcx
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#4
- # asm 2: shr $51,<squaret=%rcx
- shr $51,%rcx
- # qhasm: squaret += rx1
- # asm 1: add <rx1=int64#5,<squaret=int64#4
- # asm 2: add <rx1=%r8,<squaret=%rcx
- add %r8,%rcx
- # qhasm: rx0 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<rx0=int64#2
- # asm 2: and <squareredmask=%rdx,<rx0=%rsi
- and %rdx,%rsi
- # qhasm: rx1 = squaret
- # asm 1: mov <squaret=int64#4,>rx1=int64#5
- # asm 2: mov <squaret=%rcx,>rx1=%r8
- mov %rcx,%r8
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#4
- # asm 2: shr $51,<squaret=%rcx
- shr $51,%rcx
- # qhasm: squaret += rx2
- # asm 1: add <rx2=int64#8,<squaret=int64#4
- # asm 2: add <rx2=%r10,<squaret=%rcx
- add %r10,%rcx
- # qhasm: rx1 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<rx1=int64#5
- # asm 2: and <squareredmask=%rdx,<rx1=%r8
- and %rdx,%r8
- # qhasm: rx2 = squaret
- # asm 1: mov <squaret=int64#4,>rx2=int64#6
- # asm 2: mov <squaret=%rcx,>rx2=%r9
- mov %rcx,%r9
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#4
- # asm 2: shr $51,<squaret=%rcx
- shr $51,%rcx
- # qhasm: squaret += rx3
- # asm 1: add <rx3=int64#10,<squaret=int64#4
- # asm 2: add <rx3=%r12,<squaret=%rcx
- add %r12,%rcx
- # qhasm: rx2 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<rx2=int64#6
- # asm 2: and <squareredmask=%rdx,<rx2=%r9
- and %rdx,%r9
- # qhasm: rx3 = squaret
- # asm 1: mov <squaret=int64#4,>rx3=int64#7
- # asm 2: mov <squaret=%rcx,>rx3=%rax
- mov %rcx,%rax
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#4
- # asm 2: shr $51,<squaret=%rcx
- shr $51,%rcx
- # qhasm: squaret += rx4
- # asm 1: add <rx4=int64#12,<squaret=int64#4
- # asm 2: add <rx4=%r14,<squaret=%rcx
- add %r14,%rcx
- # qhasm: rx3 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<rx3=int64#7
- # asm 2: and <squareredmask=%rdx,<rx3=%rax
- and %rdx,%rax
- # qhasm: rx4 = squaret
- # asm 1: mov <squaret=int64#4,>rx4=int64#8
- # asm 2: mov <squaret=%rcx,>rx4=%r10
- mov %rcx,%r10
- # qhasm: (uint64) squaret >>= 51
- # asm 1: shr $51,<squaret=int64#4
- # asm 2: shr $51,<squaret=%rcx
- shr $51,%rcx
- # qhasm: squaret *= 19
- # asm 1: imulq $19,<squaret=int64#4,>squaret=int64#4
- # asm 2: imulq $19,<squaret=%rcx,>squaret=%rcx
- imulq $19,%rcx,%rcx
- # qhasm: rx0 += squaret
- # asm 1: add <squaret=int64#4,<rx0=int64#2
- # asm 2: add <squaret=%rcx,<rx0=%rsi
- add %rcx,%rsi
- # qhasm: rx4 &= squareredmask
- # asm 1: and <squareredmask=int64#3,<rx4=int64#8
- # asm 2: and <squareredmask=%rdx,<rx4=%r10
- and %rdx,%r10
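- # note (editorial): d_stack (2P - a) and e_stack (2P - b) are added to the
- # reduced square, giving (X+Y)^2 - a - b up to the 2*p biases; the result is
- # stored to rp+0..32.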
- # qhasm: rx0 += d0_stack
- # asm 1: addq <d0_stack=stack64#8,<rx0=int64#2
- # asm 2: addq <d0_stack=56(%rsp),<rx0=%rsi
- addq 56(%rsp),%rsi
- # qhasm: rx1 += d1_stack
- # asm 1: addq <d1_stack=stack64#9,<rx1=int64#5
- # asm 2: addq <d1_stack=64(%rsp),<rx1=%r8
- addq 64(%rsp),%r8
- # qhasm: rx2 += d2_stack
- # asm 1: addq <d2_stack=stack64#10,<rx2=int64#6
- # asm 2: addq <d2_stack=72(%rsp),<rx2=%r9
- addq 72(%rsp),%r9
- # qhasm: rx3 += d3_stack
- # asm 1: addq <d3_stack=stack64#11,<rx3=int64#7
- # asm 2: addq <d3_stack=80(%rsp),<rx3=%rax
- addq 80(%rsp),%rax
- # qhasm: rx4 += d4_stack
- # asm 1: addq <d4_stack=stack64#12,<rx4=int64#8
- # asm 2: addq <d4_stack=88(%rsp),<rx4=%r10
- addq 88(%rsp),%r10
- # qhasm: rx0 += e0_stack
- # asm 1: addq <e0_stack=stack64#23,<rx0=int64#2
- # asm 2: addq <e0_stack=176(%rsp),<rx0=%rsi
- addq 176(%rsp),%rsi
- # qhasm: rx1 += e1_stack
- # asm 1: addq <e1_stack=stack64#24,<rx1=int64#5
- # asm 2: addq <e1_stack=184(%rsp),<rx1=%r8
- addq 184(%rsp),%r8
- # qhasm: rx2 += e2_stack
- # asm 1: addq <e2_stack=stack64#25,<rx2=int64#6
- # asm 2: addq <e2_stack=192(%rsp),<rx2=%r9
- addq 192(%rsp),%r9
- # qhasm: rx3 += e3_stack
- # asm 1: addq <e3_stack=stack64#26,<rx3=int64#7
- # asm 2: addq <e3_stack=200(%rsp),<rx3=%rax
- addq 200(%rsp),%rax
- # qhasm: rx4 += e4_stack
- # asm 1: addq <e4_stack=stack64#27,<rx4=int64#8
- # asm 2: addq <e4_stack=208(%rsp),<rx4=%r10
- addq 208(%rsp),%r10
- # qhasm: *(uint64 *)(rp + 0) = rx0
- # asm 1: movq <rx0=int64#2,0(<rp=int64#1)
- # asm 2: movq <rx0=%rsi,0(<rp=%rdi)
- movq %rsi,0(%rdi)
- # qhasm: *(uint64 *)(rp + 8) = rx1
- # asm 1: movq <rx1=int64#5,8(<rp=int64#1)
- # asm 2: movq <rx1=%r8,8(<rp=%rdi)
- movq %r8,8(%rdi)
- # qhasm: *(uint64 *)(rp + 16) = rx2
- # asm 1: movq <rx2=int64#6,16(<rp=int64#1)
- # asm 2: movq <rx2=%r9,16(<rp=%rdi)
- movq %r9,16(%rdi)
- # qhasm: *(uint64 *)(rp + 24) = rx3
- # asm 1: movq <rx3=int64#7,24(<rp=int64#1)
- # asm 2: movq <rx3=%rax,24(<rp=%rdi)
- movq %rax,24(%rdi)
- # qhasm: *(uint64 *)(rp + 32) = rx4
- # asm 1: movq <rx4=int64#8,32(<rp=int64#1)
- # asm 2: movq <rx4=%r10,32(<rp=%rdi)
- movq %r10,32(%rdi)
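- # note (editorial): qhasm epilogue: restore the seven saved callee-save
- # registers, add back the stack adjustment presumably stored at 0(%rsp) by the
- # prologue, and return.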
- # qhasm: caller1 = caller1_stack
- # asm 1: movq <caller1_stack=stack64#1,>caller1=int64#9
- # asm 2: movq <caller1_stack=0(%rsp),>caller1=%r11
- movq 0(%rsp),%r11
- # qhasm: caller2 = caller2_stack
- # asm 1: movq <caller2_stack=stack64#2,>caller2=int64#10
- # asm 2: movq <caller2_stack=8(%rsp),>caller2=%r12
- movq 8(%rsp),%r12
- # qhasm: caller3 = caller3_stack
- # asm 1: movq <caller3_stack=stack64#3,>caller3=int64#11
- # asm 2: movq <caller3_stack=16(%rsp),>caller3=%r13
- movq 16(%rsp),%r13
- # qhasm: caller4 = caller4_stack
- # asm 1: movq <caller4_stack=stack64#4,>caller4=int64#12
- # asm 2: movq <caller4_stack=24(%rsp),>caller4=%r14
- movq 24(%rsp),%r14
- # qhasm: caller5 = caller5_stack
- # asm 1: movq <caller5_stack=stack64#5,>caller5=int64#13
- # asm 2: movq <caller5_stack=32(%rsp),>caller5=%r15
- movq 32(%rsp),%r15
- # qhasm: caller6 = caller6_stack
- # asm 1: movq <caller6_stack=stack64#6,>caller6=int64#14
- # asm 2: movq <caller6_stack=40(%rsp),>caller6=%rbx
- movq 40(%rsp),%rbx
- # qhasm: caller7 = caller7_stack
- # asm 1: movq <caller7_stack=stack64#7,>caller7=int64#15
- # asm 2: movq <caller7_stack=48(%rsp),>caller7=%rbp
- movq 48(%rsp),%rbp
- # qhasm: leave
- add %r11,%rsp
- mov %rdi,%rax
- mov %rsi,%rdx
- ret