12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
72778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327
73278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377
73778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889389038913892389338943895389638973898389939003901390239033904390539063907390839093910391139123913391439153916391739183919392039213922392339243925392639273928392939303931393239333934393539363937393839393940394139423943394439453946394739483949395039513952395339543955395639573958395939603961396239633964396539663967396839693970397139723973397439753976397739783979398039813982398339843985398639873988398939903991399239933994399539963997399839994000400140024003400440054006400740084009401040114012401340144015401640174018401940204021402240234024402540264027402840294030403140324033403440354036403740384039404040414042404340444045404640474048404940504051405240534054405540564057405840594060406140624063406440654066406740684069407040714072407340744075407640774078407940804081408240834084408540864087408840894090409140924093409440954096409740984099410041014102410341044105410641074108410941104111411241134114411541164117411841194120412141224123412441254126412741284129413041314132413341344135413641374138413941404141414241434144414541464147414841494150415141524153415441554156415741584159416041614162416341644165416641674168416941704171417241734174417541764177417841794180418141824183418441854186418741884189419041914192419341944195419641974198419942004201420242034204420542064207420842094210421142124213421442154216421742184219422042214222422342244225422642274228422942304231423242334234423542364237423842394240424142424243424442454246424742484249425042514252425342544255425642574258425942604261426242634264426542664267426842694270427142724273427442754276427
74278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569457045714572457345744575457645774578457945804581458245834584458545864587458845894590459145924593459445954596459745984599460046014602460346044605460646074608460946104611461246134614461546164617461846194620462146224623462446254626462746284629463046314632463346344635463646374638463946404641464246434644464546464647464846494650465146524653465446554656465746584659466046614662466346644665466646674668466946704671467246734674467546764677467846794680468146824683468446854686468746884689469046914692469346944695469646974698469947004701470247034704470547064707470847094710471147124713471447154716471747184719472047214722472347244725472647274728472947304731473247334734473547364737473847394740474147424743474447454746474747484749475047514752475347544755475647574758475947604761476247634764476547664767476847694770477147724773477447754776477
74778477947804781478247834784478547864787478847894790479147924793479447954796479747984799480048014802480348044805480648074808480948104811481248134814481548164817481848194820482148224823482448254826482748284829483048314832483348344835483648374838483948404841484248434844484548464847484848494850485148524853485448554856485748584859486048614862486348644865486648674868486948704871487248734874487548764877487848794880488148824883488448854886488748884889489048914892489348944895489648974898489949004901490249034904490549064907490849094910491149124913491449154916491749184919492049214922492349244925492649274928492949304931493249334934493549364937493849394940494149424943494449454946494749484949495049514952495349544955495649574958495949604961496249634964496549664967496849694970497149724973497449754976497749784979498049814982498349844985498649874988498949904991499249934994499549964997499849995000500150025003500450055006500750085009501050115012501350145015501650175018501950205021502250235024502550265027502850295030503150325033503450355036503750385039504050415042504350445045504650475048504950505051505250535054505550565057505850595060506150625063506450655066506750685069507050715072507350745075507650775078507950805081508250835084508550865087508850895090509150925093509450955096509750985099510051015102510351045105510651075108510951105111511251135114511551165117511851195120512151225123512451255126512751285129513051315132513351345135513651375138513951405141514251435144514551465147514851495150515151525153515451555156515751585159516051615162516351645165516651675168516951705171517251735174517551765177517851795180518151825183518451855186518751885189519051915192519351945195519651975198519952005201520252035204520552065207520852095210521152125213521452155216521752185219522052215222522352245225522652275228522952305231523252335234523552365237523852395240524152425243524452455246524752485249525052515252525352545255525652575258525952605261526252635264526552665267526852695270527152725273527452755276527
75278527952805281528252835284528552865287528852895290529152925293529452955296529752985299530053015302530353045305530653075308530953105311531253135314531553165317531853195320532153225323532453255326532753285329533053315332533353345335533653375338533953405341534253435344534553465347534853495350535153525353535453555356535753585359536053615362536353645365536653675368536953705371537253735374537553765377537853795380538153825383538453855386538753885389539053915392539353945395539653975398539954005401540254035404540554065407540854095410541154125413541454155416541754185419542054215422542354245425542654275428542954305431543254335434543554365437543854395440544154425443544454455446544754485449545054515452545354545455545654575458545954605461546254635464546554665467546854695470547154725473547454755476547754785479548054815482548354845485548654875488548954905491549254935494549554965497549854995500550155025503550455055506550755085509551055115512551355145515551655175518551955205521552255235524552555265527552855295530553155325533553455355536553755385539554055415542554355445545554655475548554955505551555255535554555555565557555855595560556155625563556455655566556755685569557055715572557355745575557655775578557955805581558255835584558555865587558855895590559155925593559455955596559755985599560056015602560356045605560656075608560956105611561256135614561556165617561856195620562156225623562456255626562756285629563056315632563356345635563656375638563956405641564256435644564556465647564856495650565156525653565456555656565756585659566056615662566356645665566656675668566956705671567256735674567556765677567856795680568156825683568456855686568756885689569056915692569356945695569656975698569957005701570257035704570557065707570857095710571157125713571457155716571757185719572057215722572357245725572657275728572957305731573257335734573557365737573857395740574157425743574457455746574757485749575057515752575357545755575657575758575957605761576257635764576557665767576857695770577157725773577457755776577
75778577957805781578257835784578557865787578857895790579157925793579457955796579757985799580058015802580358045805580658075808580958105811581258135814581558165817581858195820582158225823582458255826582758285829583058315832583358345835583658375838583958405841584258435844584558465847584858495850585158525853585458555856585758585859586058615862586358645865586658675868586958705871587258735874587558765877587858795880588158825883588458855886588758885889589058915892589358945895589658975898589959005901590259035904590559065907590859095910591159125913591459155916591759185919592059215922592359245925592659275928592959305931593259335934593559365937593859395940594159425943594459455946594759485949595059515952595359545955595659575958595959605961596259635964596559665967596859695970597159725973597459755976597759785979598059815982598359845985598659875988598959905991599259935994599559965997599859996000600160026003600460056006600760086009601060116012601360146015601660176018601960206021602260236024602560266027602860296030603160326033603460356036603760386039604060416042604360446045604660476048604960506051605260536054605560566057605860596060606160626063606460656066606760686069607060716072607360746075607660776078607960806081608260836084608560866087608860896090609160926093609460956096609760986099610061016102610361046105610661076108610961106111611261136114611561166117611861196120612161226123612461256126612761286129613061316132613361346135613661376138613961406141614261436144614561466147614861496150615161526153615461556156615761586159616061616162616361646165616661676168616961706171617261736174617561766177617861796180618161826183618461856186618761886189619061916192619361946195619661976198619962006201620262036204620562066207620862096210621162126213621462156216621762186219622062216222622362246225622662276228622962306231623262336234623562366237623862396240624162426243624462456246624762486249625062516252625362546255625662576258625962606261626262636264626562666267626862696270627162726273627462756276627
76278627962806281628262836284628562866287628862896290629162926293629462956296629762986299630063016302630363046305630663076308630963106311631263136314631563166317631863196320632163226323632463256326632763286329633063316332633363346335633663376338633963406341634263436344634563466347634863496350635163526353635463556356635763586359636063616362636363646365636663676368636963706371637263736374637563766377637863796380638163826383638463856386638763886389639063916392639363946395639663976398639964006401640264036404640564066407640864096410641164126413641464156416641764186419642064216422642364246425642664276428642964306431643264336434643564366437643864396440644164426443644464456446644764486449645064516452645364546455645664576458645964606461646264636464646564666467646864696470647164726473647464756476647764786479648064816482648364846485648664876488648964906491649264936494649564966497649864996500650165026503650465056506650765086509651065116512651365146515651665176518651965206521652265236524652565266527652865296530653165326533653465356536653765386539654065416542654365446545654665476548654965506551655265536554655565566557655865596560656165626563656465656566656765686569657065716572657365746575657665776578657965806581658265836584658565866587658865896590659165926593659465956596659765986599660066016602660366046605660666076608660966106611661266136614661566166617661866196620662166226623662466256626662766286629663066316632663366346635663666376638663966406641664266436644664566466647664866496650665166526653665466556656665766586659666066616662666366646665666666676668666966706671667266736674667566766677667866796680668166826683668466856686668766886689669066916692669366946695669666976698669967006701670267036704670567066707670867096710671167126713671467156716671767186719672067216722672367246725672667276728672967306731673267336734673567366737673867396740674167426743674467456746674767486749675067516752675367546755675667576758675967606761676267636764676567666767676867696770677167726773677467756776677
76778677967806781678267836784678567866787678867896790679167926793679467956796679767986799680068016802680368046805680668076808680968106811681268136814681568166817681868196820682168226823682468256826682768286829683068316832683368346835683668376838683968406841684268436844684568466847684868496850685168526853685468556856685768586859686068616862686368646865686668676868686968706871687268736874687568766877687868796880688168826883688468856886688768886889689068916892689368946895689668976898689969006901690269036904690569066907690869096910691169126913691469156916691769186919692069216922692369246925692669276928692969306931693269336934693569366937693869396940694169426943694469456946694769486949695069516952695369546955695669576958695969606961696269636964696569666967696869696970697169726973697469756976697769786979698069816982698369846985698669876988698969906991699269936994699569966997699869997000700170027003700470057006700770087009701070117012701370147015701670177018701970207021702270237024702570267027702870297030703170327033703470357036703770387039704070417042704370447045704670477048704970507051705270537054705570567057705870597060706170627063706470657066706770687069707070717072707370747075707670777078707970807081708270837084708570867087708870897090709170927093709470957096709770987099710071017102710371047105710671077108710971107111711271137114711571167117711871197120712171227123712471257126712771287129713071317132713371347135713671377138713971407141714271437144714571467147714871497150715171527153715471557156715771587159716071617162716371647165716671677168716971707171717271737174717571767177717871797180718171827183718471857186718771887189719071917192719371947195719671977198719972007201720272037204720572067207720872097210721172127213721472157216721772187219722072217222722372247225722672277228722972307231723272337234723572367237723872397240724172427243724472457246724772487249725072517252725372547255725672577258725972607261726272637264726572667267726872697270727172727273727472757276727
77278727972807281728272837284728572867287728872897290729172927293729472957296729772987299730073017302730373047305730673077308730973107311731273137314731573167317731873197320732173227323732473257326732773287329733073317332733373347335733673377338733973407341734273437344734573467347734873497350735173527353735473557356735773587359736073617362736373647365736673677368736973707371737273737374737573767377737873797380738173827383738473857386738773887389739073917392739373947395739673977398739974007401740274037404740574067407740874097410741174127413741474157416741774187419742074217422742374247425742674277428742974307431743274337434743574367437743874397440744174427443744474457446744774487449745074517452745374547455745674577458745974607461746274637464746574667467746874697470747174727473747474757476747774787479748074817482748374847485748674877488748974907491749274937494749574967497749874997500750175027503750475057506750775087509751075117512751375147515751675177518751975207521752275237524752575267527752875297530753175327533753475357536753775387539754075417542754375447545754675477548754975507551755275537554755575567557755875597560756175627563756475657566756775687569757075717572757375747575757675777578757975807581758275837584758575867587758875897590759175927593759475957596759775987599760076017602760376047605760676077608760976107611761276137614761576167617761876197620762176227623762476257626762776287629763076317632763376347635763676377638763976407641764276437644764576467647764876497650765176527653765476557656765776587659766076617662766376647665766676677668766976707671767276737674767576767677767876797680768176827683768476857686768776887689769076917692769376947695769676977698769977007701770277037704770577067707770877097710771177127713771477157716771777187719772077217722772377247725772677277728772977307731773277337734773577367737773877397740774177427743774477457746774777487749775077517752775377547755775677577758775977607761776277637764776577667767776877697770777177727773777477757776777
77778777977807781778277837784778577867787778877897790779177927793779477957796779777987799780078017802780378047805780678077808780978107811781278137814781578167817781878197820782178227823782478257826782778287829783078317832783378347835783678377838783978407841784278437844784578467847784878497850785178527853785478557856785778587859786078617862786378647865786678677868786978707871787278737874787578767877787878797880788178827883788478857886788778887889789078917892789378947895789678977898789979007901790279037904790579067907790879097910791179127913791479157916791779187919792079217922792379247925792679277928792979307931793279337934793579367937793879397940794179427943794479457946794779487949795079517952795379547955795679577958795979607961796279637964796579667967796879697970797179727973797479757976797779787979798079817982798379847985798679877988798979907991799279937994799579967997799879998000800180028003800480058006800780088009801080118012801380148015801680178018801980208021802280238024802580268027802880298030803180328033803480358036803780388039804080418042804380448045804680478048804980508051805280538054805580568057805880598060806180628063806480658066806780688069807080718072807380748075807680778078807980808081808280838084808580868087808880898090809180928093809480958096809780988099810081018102810381048105810681078108810981108111811281138114811581168117811881198120812181228123812481258126812781288129813081318132813381348135813681378138813981408141814281438144814581468147814881498150815181528153815481558156815781588159816081618162816381648165816681678168816981708171817281738174817581768177817881798180818181828183818481858186818781888189819081918192819381948195819681978198819982008201820282038204820582068207820882098210821182128213821482158216821782188219822082218222822382248225822682278228822982308231823282338234823582368237823882398240824182428243824482458246824782488249825082518252825382548255825682578258825982608261826282638264826582668267826882698270827182728273827482758276827
7827882798280828182828283828482858286828782888289829082918292829382948295829682978298829983008301830283038304830583068307830883098310831183128313831483158316831783188319832083218322832383248325832683278328832983308331833283338334833583368337833883398340834183428343834483458346834783488349835083518352835383548355835683578358835983608361836283638364836583668367836883698370837183728373837483758376837783788379838083818382838383848385838683878388838983908391839283938394839583968397839883998400840184028403840484058406840784088409841084118412841384148415841684178418841984208421842284238424842584268427842884298430843184328433843484358436843784388439844084418442844384448445844684478448844984508451845284538454845584568457845884598460846184628463846484658466846784688469847084718472847384748475847684778478847984808481848284838484848584868487848884898490849184928493849484958496849784988499850085018502850385048505850685078508850985108511851285138514851585168517851885198520852185228523852485258526852785288529853085318532853385348535853685378538853985408541854285438544854585468547854885498550855185528553855485558556855785588559856085618562856385648565856685678568856985708571 |
- /* c5625880f4bf417c1463deee4eb92d86ff413f802048621c57e25fe483eb59e4 (2.6.4+)
- __ __ _
- ___\ \/ /_ __ __ _| |_
- / _ \\ /| '_ \ / _` | __|
- | __// \| |_) | (_| | |_
- \___/_/\_\ .__/ \__,_|\__|
- |_| XML parser
- Copyright (c) 1997-2000 Thai Open Source Software Center Ltd
- Copyright (c) 2000 Clark Cooper <coopercc@users.sourceforge.net>
- Copyright (c) 2000-2006 Fred L. Drake, Jr. <fdrake@users.sourceforge.net>
- Copyright (c) 2001-2002 Greg Stein <gstein@users.sourceforge.net>
- Copyright (c) 2002-2016 Karl Waclawek <karl@waclawek.net>
- Copyright (c) 2005-2009 Steven Solie <steven@solie.ca>
- Copyright (c) 2016 Eric Rahm <erahm@mozilla.com>
- Copyright (c) 2016-2024 Sebastian Pipping <sebastian@pipping.org>
- Copyright (c) 2016 Gaurav <g.gupta@samsung.com>
- Copyright (c) 2016 Thomas Beutlich <tc@tbeu.de>
- Copyright (c) 2016 Gustavo Grieco <gustavo.grieco@imag.fr>
- Copyright (c) 2016 Pascal Cuoq <cuoq@trust-in-soft.com>
- Copyright (c) 2016 Ed Schouten <ed@nuxi.nl>
- Copyright (c) 2017-2022 Rhodri James <rhodri@wildebeest.org.uk>
- Copyright (c) 2017 Václav Slavík <vaclav@slavik.io>
- Copyright (c) 2017 Viktor Szakats <commit@vsz.me>
- Copyright (c) 2017 Chanho Park <chanho61.park@samsung.com>
- Copyright (c) 2017 Rolf Eike Beer <eike@sf-mail.de>
- Copyright (c) 2017 Hans Wennborg <hans@chromium.org>
- Copyright (c) 2018 Anton Maklakov <antmak.pub@gmail.com>
- Copyright (c) 2018 Benjamin Peterson <benjamin@python.org>
- Copyright (c) 2018 Marco Maggi <marco.maggi-ipsu@poste.it>
- Copyright (c) 2018 Mariusz Zaborski <oshogbo@vexillium.org>
- Copyright (c) 2019 David Loffredo <loffredo@steptools.com>
- Copyright (c) 2019-2020 Ben Wagner <bungeman@chromium.org>
- Copyright (c) 2019 Vadim Zeitlin <vadim@zeitlins.org>
- Copyright (c) 2021 Donghee Na <donghee.na@python.org>
- Copyright (c) 2022 Samanta Navarro <ferivoz@riseup.net>
- Copyright (c) 2022 Jeffrey Walton <noloader@gmail.com>
- Copyright (c) 2022 Jann Horn <jannh@google.com>
- Copyright (c) 2022 Sean McBride <sean@rogue-research.com>
- Copyright (c) 2023 Owain Davies <owaind@bath.edu>
- Copyright (c) 2023-2024 Sony Corporation / Snild Dolkow <snild@sony.com>
- Copyright (c) 2024 Berkay Eren Ürün <berkay.ueruen@siemens.com>
- Copyright (c) 2024 Hanno Böck <hanno@gentoo.org>
- Licensed under the MIT license:
- Permission is hereby granted, free of charge, to any person obtaining
- a copy of this software and associated documentation files (the
- "Software"), to deal in the Software without restriction, including
- without limitation the rights to use, copy, modify, merge, publish,
- distribute, sublicense, and/or sell copies of the Software, and to permit
- persons to whom the Software is furnished to do so, subject to the
- following conditions:
- The above copyright notice and this permission notice shall be included
- in all copies or substantial portions of the Software.
- THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
- EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
- MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN
- NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,
- DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
- OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
- USE OR OTHER DEALINGS IN THE SOFTWARE.
- */
- #define XML_BUILDING_EXPAT 1
- #include "expat_config.h"
- #if ! defined(XML_GE) || (1 - XML_GE - 1 == 2) || (XML_GE < 0) || (XML_GE > 1)
- # error XML_GE (for general entities) must be defined, non-empty, either 1 or 0 (0 to disable, 1 to enable; 1 is a common default)
- #endif
- #if defined(XML_DTD) && XML_GE == 0
- # error Either undefine XML_DTD or define XML_GE to 1.
- #endif
- #if ! defined(XML_CONTEXT_BYTES) || (1 - XML_CONTEXT_BYTES - 1 == 2) \
- || (XML_CONTEXT_BYTES + 0 < 0)
- # error XML_CONTEXT_BYTES must be defined, non-empty and >=0 (0 to disable, >=1 to enable; 1024 is a common default)
- #endif
- #if defined(HAVE_SYSCALL_GETRANDOM)
- # if ! defined(_GNU_SOURCE)
- # define _GNU_SOURCE 1 /* syscall prototype */
- # endif
- #endif
- #ifdef _WIN32
- /* force stdlib to define rand_s() */
- # if ! defined(_CRT_RAND_S)
- # define _CRT_RAND_S
- # endif
- #endif
- #include <stdbool.h>
- #include <stddef.h>
- #include <string.h> /* memset(), memcpy() */
- #include <assert.h>
- #include <limits.h> /* UINT_MAX */
- #include <stdio.h> /* fprintf */
- #include <stdlib.h> /* getenv, rand_s */
- #include <stdint.h> /* uintptr_t */
- #include <math.h> /* isnan */
- #ifdef _WIN32
- # define getpid GetCurrentProcessId
- #else
- # include <sys/time.h> /* gettimeofday() */
- # include <sys/types.h> /* getpid() */
- # include <unistd.h> /* getpid() */
- # include <fcntl.h> /* O_RDONLY */
- # include <errno.h>
- #endif
- #ifdef _WIN32
- # include "winconfig.h"
- #endif
- #include "ascii.h"
- #include "expat.h"
- #include "siphash.h"
- #if defined(HAVE_GETRANDOM) || defined(HAVE_SYSCALL_GETRANDOM)
- # if defined(HAVE_GETRANDOM)
- # include <sys/random.h> /* getrandom */
- # else
- # include <unistd.h> /* syscall */
- # include <sys/syscall.h> /* SYS_getrandom */
- # endif
- # if ! defined(GRND_NONBLOCK)
- # define GRND_NONBLOCK 0x0001
- # endif /* defined(GRND_NONBLOCK) */
- #endif /* defined(HAVE_GETRANDOM) || defined(HAVE_SYSCALL_GETRANDOM) */
- #if defined(HAVE_LIBBSD) \
- && (defined(HAVE_ARC4RANDOM_BUF) || defined(HAVE_ARC4RANDOM))
- # error #include <bsd/stdlib.h>
- #endif
- #if defined(_WIN32) && ! defined(LOAD_LIBRARY_SEARCH_SYSTEM32)
- # define LOAD_LIBRARY_SEARCH_SYSTEM32 0x00000800
- #endif
- #if ! defined(HAVE_GETRANDOM) && ! defined(HAVE_SYSCALL_GETRANDOM) \
- && ! defined(HAVE_ARC4RANDOM_BUF) && ! defined(HAVE_ARC4RANDOM) \
- && ! defined(XML_DEV_URANDOM) && ! defined(_WIN32) \
- && ! defined(XML_POOR_ENTROPY)
- # error You do not have support for any sources of high quality entropy \
- enabled. For end user security, that is probably not what you want. \
- \
- Your options include: \
- * Linux >=3.17 + glibc >=2.25 (getrandom): HAVE_GETRANDOM, \
- * Linux >=3.17 + glibc (including <2.25) (syscall SYS_getrandom): HAVE_SYSCALL_GETRANDOM, \
- * BSD / macOS >=10.7 / glibc >=2.36 (arc4random_buf): HAVE_ARC4RANDOM_BUF, \
- * BSD / macOS (including <10.7) / glibc >=2.36 (arc4random): HAVE_ARC4RANDOM, \
- * libbsd (arc4random_buf): HAVE_ARC4RANDOM_BUF + HAVE_LIBBSD, \
- * libbsd (arc4random): HAVE_ARC4RANDOM + HAVE_LIBBSD, \
- * Linux (including <3.17) / BSD / macOS (including <10.7) / Solaris >=8 (/dev/urandom): XML_DEV_URANDOM, \
- * Windows >=Vista (rand_s): _WIN32. \
- \
- If insist on not using any of these, bypass this error by defining \
- XML_POOR_ENTROPY; you have been warned. \
- \
- If you have reasons to patch this detection code away or need changes \
- to the build system, please open a bug. Thank you!
- #endif
- #ifdef XML_UNICODE
- # define XML_ENCODE_MAX XML_UTF16_ENCODE_MAX
- # define XmlConvert XmlUtf16Convert
- # define XmlGetInternalEncoding XmlGetUtf16InternalEncoding
- # define XmlGetInternalEncodingNS XmlGetUtf16InternalEncodingNS
- # define XmlEncode XmlUtf16Encode
- # define MUST_CONVERT(enc, s) (! (enc)->isUtf16 || (((uintptr_t)(s)) & 1))
- typedef unsigned short ICHAR;
- #else
- # define XML_ENCODE_MAX XML_UTF8_ENCODE_MAX
- # define XmlConvert XmlUtf8Convert
- # define XmlGetInternalEncoding XmlGetUtf8InternalEncoding
- # define XmlGetInternalEncodingNS XmlGetUtf8InternalEncodingNS
- # define XmlEncode XmlUtf8Encode
- # define MUST_CONVERT(enc, s) (! (enc)->isUtf8)
- typedef char ICHAR;
- #endif
- #ifndef XML_NS
- # define XmlInitEncodingNS XmlInitEncoding
- # define XmlInitUnknownEncodingNS XmlInitUnknownEncoding
- # undef XmlGetInternalEncodingNS
- # define XmlGetInternalEncodingNS XmlGetInternalEncoding
- # define XmlParseXmlDeclNS XmlParseXmlDecl
- #endif
- #ifdef XML_UNICODE
- # ifdef XML_UNICODE_WCHAR_T
- # define XML_T(x) (const wchar_t) x
- # define XML_L(x) L##x
- # else
- # define XML_T(x) (const unsigned short)x
- # define XML_L(x) x
- # endif
- #else
- # define XML_T(x) x
- # define XML_L(x) x
- #endif
/* Round up n to be a multiple of sz, where sz is a power of 2.
   Both arguments are evaluated more than once. */
#define ROUND_UP(n, sz) (((n) + ((sz) - 1)) & ~((sz) - 1))

/* Do safe (NULL-aware) pointer arithmetic: yields 0 when either
   pointer is NULL, otherwise the difference p - q. */
#define EXPAT_SAFE_PTR_DIFF(p, q) (((p) && (q)) ? ((p) - (q)) : 0)

/* Smaller of a and b; the selected argument is evaluated twice. */
#define EXPAT_MIN(a, b) (((a) < (b)) ? (a) : (b))
- #include "internal.h"
- #include "xmltok.h"
- #include "xmlrole.h"
- typedef const XML_Char *KEY;
- typedef struct {
- KEY name;
- } NAMED;
- typedef struct {
- NAMED **v;
- unsigned char power;
- size_t size;
- size_t used;
- const XML_Memory_Handling_Suite *mem;
- } HASH_TABLE;
- static size_t keylen(KEY s);
- static void copy_salt_to_sipkey(XML_Parser parser, struct sipkey *key);
/* For probing (after a collision) we need a step size relatively prime
   to the hash table size, which is a power of 2.  We use double-hashing,
   since we can calculate a second hash value cheaply by taking those bits
   of the first hash value that were discarded (masked out) when the table
   index was calculated: index = hash & mask, where mask = table->size - 1.
   We limit the maximum step size to table->size / 4 (mask >> 2) and make
   it odd, since odd numbers are always relatively prime to a power of 2.
*/
#define SECOND_HASH(hash, mask, power)                                         \
  ((((hash) & ~(mask)) >> ((power) - 1)) & ((mask) >> 2))
#define PROBE_STEP(hash, mask, power)                                          \
  ((unsigned char)((SECOND_HASH(hash, mask, power)) | 1))
- typedef struct {
- NAMED **p;
- NAMED **end;
- } HASH_TABLE_ITER;
- #define INIT_TAG_BUF_SIZE 32 /* must be a multiple of sizeof(XML_Char) */
- #define INIT_DATA_BUF_SIZE 1024
- #define INIT_ATTS_SIZE 16
- #define INIT_ATTS_VERSION 0xFFFFFFFF
- #define INIT_BLOCK_SIZE 1024
- #define INIT_BUFFER_SIZE 1024
- #define EXPAND_SPARE 24
- typedef struct binding {
- struct prefix *prefix;
- struct binding *nextTagBinding;
- struct binding *prevPrefixBinding;
- const struct attribute_id *attId;
- XML_Char *uri;
- int uriLen;
- int uriAlloc;
- } BINDING;
- typedef struct prefix {
- const XML_Char *name;
- BINDING *binding;
- } PREFIX;
- typedef struct {
- const XML_Char *str;
- const XML_Char *localPart;
- const XML_Char *prefix;
- int strLen;
- int uriLen;
- int prefixLen;
- } TAG_NAME;
- /* TAG represents an open element.
- The name of the element is stored in both the document and API
- encodings. The memory buffer 'buf' is a separately-allocated
- memory area which stores the name. During the XML_Parse()/
- XML_ParseBuffer() when the element is open, the memory for the 'raw'
- version of the name (in the document encoding) is shared with the
- document buffer. If the element is open across calls to
- XML_Parse()/XML_ParseBuffer(), the buffer is re-allocated to
- contain the 'raw' name as well.
- A parser reuses these structures, maintaining a list of allocated
- TAG objects in a free list.
- */
- typedef struct tag {
- struct tag *parent; /* parent of this element */
- const char *rawName; /* tagName in the original encoding */
- int rawNameLength;
- TAG_NAME name; /* tagName in the API encoding */
- char *buf; /* buffer for name components */
- char *bufEnd; /* end of the buffer */
- BINDING *bindings;
- } TAG;
- typedef struct {
- const XML_Char *name;
- const XML_Char *textPtr;
- int textLen; /* length in XML_Chars */
- int processed; /* # of processed bytes - when suspended */
- const XML_Char *systemId;
- const XML_Char *base;
- const XML_Char *publicId;
- const XML_Char *notation;
- XML_Bool open;
- XML_Bool is_param;
- XML_Bool is_internal; /* true if declared in internal subset outside PE */
- } ENTITY;
- typedef struct {
- enum XML_Content_Type type;
- enum XML_Content_Quant quant;
- const XML_Char *name;
- int firstchild;
- int lastchild;
- int childcnt;
- int nextsib;
- } CONTENT_SCAFFOLD;
- #define INIT_SCAFFOLD_ELEMENTS 32
- typedef struct block {
- struct block *next;
- int size;
- XML_Char s[1];
- } BLOCK;
- typedef struct {
- BLOCK *blocks;
- BLOCK *freeBlocks;
- const XML_Char *end;
- XML_Char *ptr;
- XML_Char *start;
- const XML_Memory_Handling_Suite *mem;
- } STRING_POOL;
- /* The XML_Char before the name is used to determine whether
- an attribute has been specified. */
- typedef struct attribute_id {
- XML_Char *name;
- PREFIX *prefix;
- XML_Bool maybeTokenized;
- XML_Bool xmlns;
- } ATTRIBUTE_ID;
- typedef struct {
- const ATTRIBUTE_ID *id;
- XML_Bool isCdata;
- const XML_Char *value;
- } DEFAULT_ATTRIBUTE;
- typedef struct {
- unsigned long version;
- unsigned long hash;
- const XML_Char *uriName;
- } NS_ATT;
- typedef struct {
- const XML_Char *name;
- PREFIX *prefix;
- const ATTRIBUTE_ID *idAtt;
- int nDefaultAtts;
- int allocDefaultAtts;
- DEFAULT_ATTRIBUTE *defaultAtts;
- } ELEMENT_TYPE;
- typedef struct {
- HASH_TABLE generalEntities;
- HASH_TABLE elementTypes;
- HASH_TABLE attributeIds;
- HASH_TABLE prefixes;
- STRING_POOL pool;
- STRING_POOL entityValuePool;
- /* false once a parameter entity reference has been skipped */
- XML_Bool keepProcessing;
- /* true once an internal or external PE reference has been encountered;
- this includes the reference to an external subset */
- XML_Bool hasParamEntityRefs;
- XML_Bool standalone;
- #ifdef XML_DTD
- /* indicates if external PE has been read */
- XML_Bool paramEntityRead;
- HASH_TABLE paramEntities;
- #endif /* XML_DTD */
- PREFIX defaultPrefix;
- /* === scaffolding for building content model === */
- XML_Bool in_eldecl;
- CONTENT_SCAFFOLD *scaffold;
- unsigned contentStringLen;
- unsigned scaffSize;
- unsigned scaffCount;
- int scaffLevel;
- int *scaffIndex;
- } DTD;
- typedef struct open_internal_entity {
- const char *internalEventPtr;
- const char *internalEventEndPtr;
- struct open_internal_entity *next;
- ENTITY *entity;
- int startTagLevel;
- XML_Bool betweenDecl; /* WFC: PE Between Declarations */
- } OPEN_INTERNAL_ENTITY;
/* Tells the accounting code how a span of bytes should be counted. */
enum XML_Account {
  /* bytes directly passed to the Expat parser */
  XML_ACCOUNT_DIRECT,
  /* intermediate bytes produced during entity expansion */
  XML_ACCOUNT_ENTITY_EXPANSION,
  /* i.e. do not account, was accounted already */
  XML_ACCOUNT_NONE
};
- #if XML_GE == 1
/* Counter type wide enough for the byte totals below. */
typedef unsigned long long XmlBigCount;

/* Byte counters (direct and indirect) and the limits they are checked
   against, plus a debug level. */
typedef struct accounting {
  XmlBigCount countBytesDirect;
  XmlBigCount countBytesIndirect;
  unsigned long debugLevel;
  float maximumAmplificationFactor; /* >=1.0 */
  unsigned long long activationThresholdBytes;
} ACCOUNTING;
/* Counters describing entity opening activity (total ever opened,
   current depth, deepest depth seen) and a debug level. */
typedef struct entity_stats {
  unsigned int countEverOpened;
  unsigned int currentDepth;
  unsigned int maximumDepthSeen;
  unsigned long debugLevel;
} ENTITY_STATS;
- #endif /* XML_GE == 1 */
- typedef enum XML_Error PTRCALL Processor(XML_Parser parser, const char *start,
- const char *end, const char **endPtr);
- static Processor prologProcessor;
- static Processor prologInitProcessor;
- static Processor contentProcessor;
- static Processor cdataSectionProcessor;
- #ifdef XML_DTD
- static Processor ignoreSectionProcessor;
- static Processor externalParEntProcessor;
- static Processor externalParEntInitProcessor;
- static Processor entityValueProcessor;
- static Processor entityValueInitProcessor;
- #endif /* XML_DTD */
- static Processor epilogProcessor;
- static Processor errorProcessor;
- static Processor externalEntityInitProcessor;
- static Processor externalEntityInitProcessor2;
- static Processor externalEntityInitProcessor3;
- static Processor externalEntityContentProcessor;
- static Processor internalEntityProcessor;
- static enum XML_Error handleUnknownEncoding(XML_Parser parser,
- const XML_Char *encodingName);
- static enum XML_Error processXmlDecl(XML_Parser parser, int isGeneralTextEntity,
- const char *s, const char *next);
- static enum XML_Error initializeEncoding(XML_Parser parser);
- static enum XML_Error doProlog(XML_Parser parser, const ENCODING *enc,
- const char *s, const char *end, int tok,
- const char *next, const char **nextPtr,
- XML_Bool haveMore, XML_Bool allowClosingDoctype,
- enum XML_Account account);
- static enum XML_Error processInternalEntity(XML_Parser parser, ENTITY *entity,
- XML_Bool betweenDecl);
- static enum XML_Error doContent(XML_Parser parser, int startTagLevel,
- const ENCODING *enc, const char *start,
- const char *end, const char **endPtr,
- XML_Bool haveMore, enum XML_Account account);
- static enum XML_Error doCdataSection(XML_Parser parser, const ENCODING *enc,
- const char **startPtr, const char *end,
- const char **nextPtr, XML_Bool haveMore,
- enum XML_Account account);
- #ifdef XML_DTD
- static enum XML_Error doIgnoreSection(XML_Parser parser, const ENCODING *enc,
- const char **startPtr, const char *end,
- const char **nextPtr, XML_Bool haveMore);
- #endif /* XML_DTD */
- static void freeBindings(XML_Parser parser, BINDING *bindings);
- static enum XML_Error storeAtts(XML_Parser parser, const ENCODING *enc,
- const char *attStr, TAG_NAME *tagNamePtr,
- BINDING **bindingsPtr,
- enum XML_Account account);
- static enum XML_Error addBinding(XML_Parser parser, PREFIX *prefix,
- const ATTRIBUTE_ID *attId, const XML_Char *uri,
- BINDING **bindingsPtr);
- static int defineAttribute(ELEMENT_TYPE *type, ATTRIBUTE_ID *attId,
- XML_Bool isCdata, XML_Bool isId,
- const XML_Char *value, XML_Parser parser);
- static enum XML_Error storeAttributeValue(XML_Parser parser,
- const ENCODING *enc, XML_Bool isCdata,
- const char *ptr, const char *end,
- STRING_POOL *pool,
- enum XML_Account account);
- static enum XML_Error appendAttributeValue(XML_Parser parser,
- const ENCODING *enc,
- XML_Bool isCdata, const char *ptr,
- const char *end, STRING_POOL *pool,
- enum XML_Account account);
- static ATTRIBUTE_ID *getAttributeId(XML_Parser parser, const ENCODING *enc,
- const char *start, const char *end);
- static int setElementTypePrefix(XML_Parser parser, ELEMENT_TYPE *elementType);
- #if XML_GE == 1
- static enum XML_Error storeEntityValue(XML_Parser parser, const ENCODING *enc,
- const char *start, const char *end,
- enum XML_Account account);
- #else
- static enum XML_Error storeSelfEntityValue(XML_Parser parser, ENTITY *entity);
- #endif
- static int reportProcessingInstruction(XML_Parser parser, const ENCODING *enc,
- const char *start, const char *end);
- static int reportComment(XML_Parser parser, const ENCODING *enc,
- const char *start, const char *end);
- static void reportDefault(XML_Parser parser, const ENCODING *enc,
- const char *start, const char *end);
- static const XML_Char *getContext(XML_Parser parser);
- static XML_Bool setContext(XML_Parser parser, const XML_Char *context);
- static void FASTCALL normalizePublicId(XML_Char *s);
- static DTD *dtdCreate(const XML_Memory_Handling_Suite *ms);
- /* do not call if m_parentParser != NULL */
- static void dtdReset(DTD *p, const XML_Memory_Handling_Suite *ms);
- static void dtdDestroy(DTD *p, XML_Bool isDocEntity,
- const XML_Memory_Handling_Suite *ms);
- static int dtdCopy(XML_Parser oldParser, DTD *newDtd, const DTD *oldDtd,
- const XML_Memory_Handling_Suite *ms);
- static int copyEntityTable(XML_Parser oldParser, HASH_TABLE *newTable,
- STRING_POOL *newPool, const HASH_TABLE *oldTable);
- static NAMED *lookup(XML_Parser parser, HASH_TABLE *table, KEY name,
- size_t createSize);
- static void FASTCALL hashTableInit(HASH_TABLE *table,
- const XML_Memory_Handling_Suite *ms);
- static void FASTCALL hashTableClear(HASH_TABLE *table);
- static void FASTCALL hashTableDestroy(HASH_TABLE *table);
- static void FASTCALL hashTableIterInit(HASH_TABLE_ITER *iter,
- const HASH_TABLE *table);
- static NAMED *FASTCALL hashTableIterNext(HASH_TABLE_ITER *iter);
- static void FASTCALL poolInit(STRING_POOL *pool,
- const XML_Memory_Handling_Suite *ms);
- static void FASTCALL poolClear(STRING_POOL *pool);
- static void FASTCALL poolDestroy(STRING_POOL *pool);
- static XML_Char *poolAppend(STRING_POOL *pool, const ENCODING *enc,
- const char *ptr, const char *end);
- static XML_Char *poolStoreString(STRING_POOL *pool, const ENCODING *enc,
- const char *ptr, const char *end);
- static XML_Bool FASTCALL poolGrow(STRING_POOL *pool);
- static const XML_Char *FASTCALL poolCopyString(STRING_POOL *pool,
- const XML_Char *s);
- static const XML_Char *poolCopyStringN(STRING_POOL *pool, const XML_Char *s,
- int n);
- static const XML_Char *FASTCALL poolAppendString(STRING_POOL *pool,
- const XML_Char *s);
- static int FASTCALL nextScaffoldPart(XML_Parser parser);
- static XML_Content *build_model(XML_Parser parser);
- static ELEMENT_TYPE *getElementType(XML_Parser parser, const ENCODING *enc,
- const char *ptr, const char *end);
- static XML_Char *copyString(const XML_Char *s,
- const XML_Memory_Handling_Suite *memsuite);
- static unsigned long generate_hash_secret_salt(XML_Parser parser);
- static XML_Bool startParsing(XML_Parser parser);
- static XML_Parser parserCreate(const XML_Char *encodingName,
- const XML_Memory_Handling_Suite *memsuite,
- const XML_Char *nameSep, DTD *dtd);
- static void parserInit(XML_Parser parser, const XML_Char *encodingName);
- #if XML_GE == 1
- static float accountingGetCurrentAmplification(XML_Parser rootParser);
- static void accountingReportStats(XML_Parser originParser, const char *epilog);
- static void accountingOnAbort(XML_Parser originParser);
- static void accountingReportDiff(XML_Parser rootParser,
- unsigned int levelsAwayFromRootParser,
- const char *before, const char *after,
- ptrdiff_t bytesMore, int source_line,
- enum XML_Account account);
- static XML_Bool accountingDiffTolerated(XML_Parser originParser, int tok,
- const char *before, const char *after,
- int source_line,
- enum XML_Account account);
- static void entityTrackingReportStats(XML_Parser parser, ENTITY *entity,
- const char *action, int sourceLine);
- static void entityTrackingOnOpen(XML_Parser parser, ENTITY *entity,
- int sourceLine);
- static void entityTrackingOnClose(XML_Parser parser, ENTITY *entity,
- int sourceLine);
- static XML_Parser getRootParserOf(XML_Parser parser,
- unsigned int *outLevelDiff);
- #endif /* XML_GE == 1 */
- static unsigned long getDebugLevel(const char *variableName,
- unsigned long defaultDebugLevel);
/* Accessors for a STRING_POOL; "pool" is a pointer expression and may be
   evaluated more than once. */

/* Start of the string currently being built. */
#define poolStart(pool) ((pool)->start)
/* Number of XML_Chars in the string currently being built. */
#define poolLength(pool) ((pool)->ptr - (pool)->start)
/* Drop the last character of the current string. */
#define poolChop(pool) ((void)--((pool)->ptr))
/* Last character of the current string. */
#define poolLastChar(pool) (((pool)->ptr)[-1])
/* Throw away the current string. */
#define poolDiscard(pool) ((pool)->ptr = (pool)->start)
/* Close the current string; the next one starts right after it. */
#define poolFinish(pool) ((pool)->start = (pool)->ptr)
/* Append c, growing the pool first when it is full.  Evaluates to 0 if
   poolGrow() fails and to 1 otherwise. */
#define poolAppendChar(pool, c)                                                \
  (((pool)->ptr == (pool)->end && ! poolGrow(pool))                            \
       ? 0                                                                     \
       : ((*((pool)->ptr)++ = (c)), 1))
- #if ! defined(XML_TESTING)
- const
- #endif
- XML_Bool g_reparseDeferralEnabledDefault
- = XML_TRUE; // write ONLY in runtests.c
- #if defined(XML_TESTING)
- unsigned int g_bytesScanned = 0; // used for testing only
- #endif
- struct XML_ParserStruct {
- /* The first member must be m_userData so that the XML_GetUserData
- macro works. */
- void *m_userData;
- void *m_handlerArg;
- // How the four parse buffer pointers below relate in time and space:
- //
- // m_buffer <= m_bufferPtr <= m_bufferEnd <= m_bufferLim
- // | | | |
- // <--parsed-->| | |
- // <---parsing--->| |
- // <--unoccupied-->|
- // <---------total-malloced/realloced-------->|
- char *m_buffer; // malloc/realloc base pointer of parse buffer
- const XML_Memory_Handling_Suite m_mem;
- const char *m_bufferPtr; // first character to be parsed
- char *m_bufferEnd; // past last character to be parsed
- const char *m_bufferLim; // allocated end of m_buffer
- XML_Index m_parseEndByteIndex;
- const char *m_parseEndPtr;
- size_t m_partialTokenBytesBefore; /* used in heuristic to avoid O(n^2) */
- XML_Bool m_reparseDeferralEnabled;
- int m_lastBufferRequestSize;
- XML_Char *m_dataBuf;
- XML_Char *m_dataBufEnd;
- XML_StartElementHandler m_startElementHandler;
- XML_EndElementHandler m_endElementHandler;
- XML_CharacterDataHandler m_characterDataHandler;
- XML_ProcessingInstructionHandler m_processingInstructionHandler;
- XML_CommentHandler m_commentHandler;
- XML_StartCdataSectionHandler m_startCdataSectionHandler;
- XML_EndCdataSectionHandler m_endCdataSectionHandler;
- XML_DefaultHandler m_defaultHandler;
- XML_StartDoctypeDeclHandler m_startDoctypeDeclHandler;
- XML_EndDoctypeDeclHandler m_endDoctypeDeclHandler;
- XML_UnparsedEntityDeclHandler m_unparsedEntityDeclHandler;
- XML_NotationDeclHandler m_notationDeclHandler;
- XML_StartNamespaceDeclHandler m_startNamespaceDeclHandler;
- XML_EndNamespaceDeclHandler m_endNamespaceDeclHandler;
- XML_NotStandaloneHandler m_notStandaloneHandler;
- XML_ExternalEntityRefHandler m_externalEntityRefHandler;
- XML_Parser m_externalEntityRefHandlerArg;
- XML_SkippedEntityHandler m_skippedEntityHandler;
- XML_UnknownEncodingHandler m_unknownEncodingHandler;
- XML_ElementDeclHandler m_elementDeclHandler;
- XML_AttlistDeclHandler m_attlistDeclHandler;
- XML_EntityDeclHandler m_entityDeclHandler;
- XML_XmlDeclHandler m_xmlDeclHandler;
- const ENCODING *m_encoding;
- INIT_ENCODING m_initEncoding;
- const ENCODING *m_internalEncoding;
- const XML_Char *m_protocolEncodingName;
- XML_Bool m_ns;
- XML_Bool m_ns_triplets;
- void *m_unknownEncodingMem;
- void *m_unknownEncodingData;
- void *m_unknownEncodingHandlerData;
- void(XMLCALL *m_unknownEncodingRelease)(void *);
- PROLOG_STATE m_prologState;
- Processor *m_processor;
- enum XML_Error m_errorCode;
- const char *m_eventPtr;
- const char *m_eventEndPtr;
- const char *m_positionPtr;
- OPEN_INTERNAL_ENTITY *m_openInternalEntities;
- OPEN_INTERNAL_ENTITY *m_freeInternalEntities;
- XML_Bool m_defaultExpandInternalEntities;
- int m_tagLevel;
- ENTITY *m_declEntity;
- const XML_Char *m_doctypeName;
- const XML_Char *m_doctypeSysid;
- const XML_Char *m_doctypePubid;
- const XML_Char *m_declAttributeType;
- const XML_Char *m_declNotationName;
- const XML_Char *m_declNotationPublicId;
- ELEMENT_TYPE *m_declElementType;
- ATTRIBUTE_ID *m_declAttributeId;
- XML_Bool m_declAttributeIsCdata;
- XML_Bool m_declAttributeIsId;
- DTD *m_dtd;
- const XML_Char *m_curBase;
- TAG *m_tagStack;
- TAG *m_freeTagList;
- BINDING *m_inheritedBindings;
- BINDING *m_freeBindingList;
- int m_attsSize;
- int m_nSpecifiedAtts;
- int m_idAttIndex;
- ATTRIBUTE *m_atts;
- NS_ATT *m_nsAtts;
- unsigned long m_nsAttsVersion;
- unsigned char m_nsAttsPower;
- #ifdef XML_ATTR_INFO
- XML_AttrInfo *m_attInfo;
- #endif
- POSITION m_position;
- STRING_POOL m_tempPool;
- STRING_POOL m_temp2Pool;
- char *m_groupConnector;
- unsigned int m_groupSize;
- XML_Char m_namespaceSeparator;
- XML_Parser m_parentParser;
- XML_ParsingStatus m_parsingStatus;
- #ifdef XML_DTD
- XML_Bool m_isParamEntity;
- XML_Bool m_useForeignDTD;
- enum XML_ParamEntityParsing m_paramEntityParsing;
- #endif
- unsigned long m_hash_secret_salt;
- #if XML_GE == 1
- ACCOUNTING m_accounting;
- ENTITY_STATS m_entity_stats;
- #endif
- };
/* Allocation helpers that route through the parser's own memory suite
   (parser->m_mem).  "parser" is parenthesized so that any pointer
   expression may be passed. */
#define MALLOC(parser, s) ((parser)->m_mem.malloc_fcn((s)))
#define REALLOC(parser, p, s) ((parser)->m_mem.realloc_fcn((p), (s)))
#define FREE(parser, p) ((parser)->m_mem.free_fcn((p)))
- XML_Parser XMLCALL
- XML_ParserCreate(const XML_Char *encodingName) {
- return XML_ParserCreate_MM(encodingName, NULL, NULL);
- }
- XML_Parser XMLCALL
- XML_ParserCreateNS(const XML_Char *encodingName, XML_Char nsSep) {
- XML_Char tmp[2] = {nsSep, 0};
- return XML_ParserCreate_MM(encodingName, NULL, tmp);
- }
- // "xml=http://www.w3.org/XML/1998/namespace"
- static const XML_Char implicitContext[]
- = {ASCII_x, ASCII_m, ASCII_l, ASCII_EQUALS, ASCII_h,
- ASCII_t, ASCII_t, ASCII_p, ASCII_COLON, ASCII_SLASH,
- ASCII_SLASH, ASCII_w, ASCII_w, ASCII_w, ASCII_PERIOD,
- ASCII_w, ASCII_3, ASCII_PERIOD, ASCII_o, ASCII_r,
- ASCII_g, ASCII_SLASH, ASCII_X, ASCII_M, ASCII_L,
- ASCII_SLASH, ASCII_1, ASCII_9, ASCII_9, ASCII_8,
- ASCII_SLASH, ASCII_n, ASCII_a, ASCII_m, ASCII_e,
- ASCII_s, ASCII_p, ASCII_a, ASCII_c, ASCII_e,
- '\0'};
- /* To avoid warnings about unused functions: */
- #if ! defined(HAVE_ARC4RANDOM_BUF) && ! defined(HAVE_ARC4RANDOM)
- # if defined(HAVE_GETRANDOM) || defined(HAVE_SYSCALL_GETRANDOM)
/* Obtain entropy on Linux 3.17+
 *
 * Fills target with count random bytes using getrandom (or the raw
 * SYS_getrandom syscall) in non-blocking mode.
 *
 * Short reads are continued and calls interrupted by a signal (EINTR)
 * are retried; any other error stops the attempt.  The decision is based
 * on the return value first and on errno only for a failed call, so a
 * stale errno left over from earlier code cannot influence the loop.
 *
 * Returns 1 if all count bytes were written (trivially so for count == 0),
 * 0 otherwise.
 */
static int
writeRandomBytes_getrandom_nonblock(void *target, size_t count) {
  size_t bytesWrittenTotal = 0;
  const unsigned int getrandomFlags = GRND_NONBLOCK;

  while (bytesWrittenTotal < count) {
    void *const currentTarget = (void *)((char *)target + bytesWrittenTotal);
    const size_t bytesToWrite = count - bytesWrittenTotal;
    long bytesWrittenMore;

    errno = 0;
    bytesWrittenMore =
#  if defined(HAVE_GETRANDOM)
        (long)getrandom(currentTarget, bytesToWrite, getrandomFlags);
#  else
        syscall(SYS_getrandom, currentTarget, bytesToWrite, getrandomFlags);
#  endif

    if (bytesWrittenMore > 0) {
      bytesWrittenTotal += (size_t)bytesWrittenMore;
    } else if (errno != EINTR) {
      return 0; /* hard failure, or no progress without an error */
    }
  }

  return 1;
}
- # endif /* defined(HAVE_GETRANDOM) || defined(HAVE_SYSCALL_GETRANDOM) */
- # if ! defined(_WIN32) && defined(XML_DEV_URANDOM)
/* Extract entropy from /dev/urandom
 *
 * Fills target with count bytes read from /dev/urandom.  Short reads are
 * continued and reads interrupted by a signal (EINTR) are retried; end of
 * file or any other error stops the attempt.  errno is consulted only
 * after read() has reported failure, never after a successful short read.
 *
 * Returns 1 if all count bytes were written (trivially so for count == 0
 * once the device could be opened), 0 otherwise.
 */
static int
writeRandomBytes_dev_urandom(void *target, size_t count) {
  size_t bytesWrittenTotal = 0;
  const int fd = open("/dev/urandom", O_RDONLY);

  if (fd < 0) {
    return 0;
  }

  while (bytesWrittenTotal < count) {
    void *const currentTarget = (void *)((char *)target + bytesWrittenTotal);
    const size_t bytesToWrite = count - bytesWrittenTotal;
    const ssize_t bytesWrittenMore = read(fd, currentTarget, bytesToWrite);

    if (bytesWrittenMore > 0) {
      bytesWrittenTotal += (size_t)bytesWrittenMore;
    } else if (bytesWrittenMore == 0 || errno != EINTR) {
      break; /* unexpected end of file or hard error */
    }
  }

  close(fd);
  return bytesWrittenTotal >= count;
}
- # endif /* ! defined(_WIN32) && defined(XML_DEV_URANDOM) */
- #endif /* ! defined(HAVE_ARC4RANDOM_BUF) && ! defined(HAVE_ARC4RANDOM) */
- #if defined(HAVE_ARC4RANDOM) && ! defined(HAVE_ARC4RANDOM_BUF)
/* Fill target with count bytes taken from successive arc4random()
   results.  Each 32-bit result is consumed lowest byte first; leftover
   bytes of the last result are discarded. */
static void
writeRandomBytes_arc4random(void *target, size_t count) {
  uint8_t *const out = (uint8_t *)target;
  size_t written = 0;

  while (written < count) {
    const uint32_t word = arc4random();
    size_t byteIdx;

    for (byteIdx = 0; byteIdx < sizeof(word) && written < count; byteIdx++) {
      out[written] = (uint8_t)(word >> (byteIdx * 8));
      written++;
    }
  }
}
- #endif /* defined(HAVE_ARC4RANDOM) && ! defined(HAVE_ARC4RANDOM_BUF) */
- #ifdef _WIN32
- /* Provide declaration of rand_s() for MinGW-32 (not 64, which has it),
- as it didn't declare it in its header prior to version 5.3.0 of its
- runtime package (mingwrt, containing stdlib.h). The upstream fix
- was introduced at https://osdn.net/projects/mingw/ticket/39658 . */
- # if defined(__MINGW32__) && defined(__MINGW32_VERSION) \
- && __MINGW32_VERSION < 5003000L && ! defined(__MINGW64_VERSION_MAJOR)
- __declspec(dllimport) int rand_s(unsigned int *);
- # endif
/* Obtain entropy on Windows using the rand_s() function which
 * generates cryptographically secure random numbers.  Internally it
 * uses RtlGenRandom API which is present in Windows XP and later.
 *
 * Each rand_s() result is consumed lowest byte first.  Returns 1 once
 * count bytes have been written, or 0 as soon as rand_s() reports an
 * error.
 */
static int
writeRandomBytes_rand_s(void *target, size_t count) {
  uint8_t *const out = (uint8_t *)target;
  size_t written = 0;

  while (written < count) {
    unsigned int word = 0;
    size_t byteIdx;

    if (rand_s(&word) != 0) {
      return 0; /* failure */
    }

    for (byteIdx = 0; byteIdx < sizeof(word) && written < count; byteIdx++) {
      out[written] = (uint8_t)(word >> (byteIdx * 8));
      written++;
    }
  }

  return 1; /* success */
}
- #endif /* _WIN32 */
- #if ! defined(HAVE_ARC4RANDOM_BUF) && ! defined(HAVE_ARC4RANDOM)
/* Derives a low-quality entropy value from the current time.
 *
 * Windows: XOR of the two halves of the current system FILETIME.
 * Elsewhere: the microseconds field reported by gettimeofday().
 */
static unsigned long
gather_time_entropy(void) {
#  ifdef _WIN32
  FILETIME now;
  GetSystemTimeAsFileTime(&now); /* never fails */
  return now.dwHighDateTime ^ now.dwLowDateTime;
#  else
  struct timeval now;
  const int rc = gettimeofday(&now, NULL);

  /* Checked in debug builds only; the cast keeps NDEBUG builds free of
     "unused variable" warnings. */
  assert(rc == 0);
  (void)rc;

  /* Microseconds time is <20 bits entropy */
  return now.tv_usec;
#  endif
}
- #endif /* ! defined(HAVE_ARC4RANDOM_BUF) && ! defined(HAVE_ARC4RANDOM) */
/* Passes `entropy` through unchanged.  When the debug level obtained for
   "EXPAT_ENTROPY_DEBUG" is at least 1, the value and the name of its source
   (`label`) are additionally reported on stderr. */
static unsigned long
ENTROPY_DEBUG(const char *label, unsigned long entropy) {
  const int hexDigits = (int)sizeof(entropy) * 2;
  const unsigned long byteCount = (unsigned long)sizeof(entropy);

  if (getDebugLevel("EXPAT_ENTROPY_DEBUG", 0) < 1u) {
    return entropy;
  }

  fprintf(stderr, "expat: Entropy: %s --> 0x%0*lx (%lu bytes)\n", label,
          hexDigits, entropy, byteCount);
  return entropy;
}
- static unsigned long
- generate_hash_secret_salt(XML_Parser parser) {
- unsigned long entropy;
- (void)parser;
- /* "Failproof" high quality providers: */
- #if defined(HAVE_ARC4RANDOM_BUF)
- arc4random_buf(&entropy, sizeof(entropy));
- return ENTROPY_DEBUG("arc4random_buf", entropy);
- #elif defined(HAVE_ARC4RANDOM)
- writeRandomBytes_arc4random((void *)&entropy, sizeof(entropy));
- return ENTROPY_DEBUG("arc4random", entropy);
- #else
- /* Try high quality providers first .. */
- # ifdef _WIN32
- if (writeRandomBytes_rand_s((void *)&entropy, sizeof(entropy))) {
- return ENTROPY_DEBUG("rand_s", entropy);
- }
- # elif defined(HAVE_GETRANDOM) || defined(HAVE_SYSCALL_GETRANDOM)
- if (writeRandomBytes_getrandom_nonblock((void *)&entropy, sizeof(entropy))) {
- return ENTROPY_DEBUG("getrandom", entropy);
- }
- # endif
- # if ! defined(_WIN32) && defined(XML_DEV_URANDOM)
- if (writeRandomBytes_dev_urandom((void *)&entropy, sizeof(entropy))) {
- return ENTROPY_DEBUG("/dev/urandom", entropy);
- }
- # endif /* ! defined(_WIN32) && defined(XML_DEV_URANDOM) */
- /* .. and self-made low quality for backup: */
- /* Process ID is 0 bits entropy if attacker has local access */
- entropy = gather_time_entropy() ^ getpid();
- /* Factors are 2^31-1 and 2^61-1 (Mersenne primes M31 and M61) */
- if (sizeof(unsigned long) == 4) {
- return ENTROPY_DEBUG("fallback(4)", entropy * 2147483647);
- } else {
- return ENTROPY_DEBUG("fallback(8)",
- entropy * (unsigned long)2305843009213693951ULL);
- }
- #endif
- }
- static unsigned long
- get_hash_secret_salt(XML_Parser parser) {
- if (parser->m_parentParser != NULL)
- return get_hash_secret_salt(parser->m_parentParser);
- return parser->m_hash_secret_salt;
- }
- static enum XML_Error
- callProcessor(XML_Parser parser, const char *start, const char *end,
- const char **endPtr) {
- const size_t have_now = EXPAT_SAFE_PTR_DIFF(end, start);
- if (parser->m_reparseDeferralEnabled
- && ! parser->m_parsingStatus.finalBuffer) {
- // Heuristic: don't try to parse a partial token again until the amount of
- // available data has increased significantly.
- const size_t had_before = parser->m_partialTokenBytesBefore;
- // ...but *do* try anyway if we're close to causing a reallocation.
- size_t available_buffer
- = EXPAT_SAFE_PTR_DIFF(parser->m_bufferPtr, parser->m_buffer);
- #if XML_CONTEXT_BYTES > 0
- available_buffer -= EXPAT_MIN(available_buffer, XML_CONTEXT_BYTES);
- #endif
- available_buffer
- += EXPAT_SAFE_PTR_DIFF(parser->m_bufferLim, parser->m_bufferEnd);
- // m_lastBufferRequestSize is never assigned a value < 0, so the cast is ok
- const bool enough
- = (have_now >= 2 * had_before)
- || ((size_t)parser->m_lastBufferRequestSize > available_buffer);
- if (! enough) {
- *endPtr = start; // callers may expect this to be set
- return XML_ERROR_NONE;
- }
- }
- #if defined(XML_TESTING)
- g_bytesScanned += (unsigned)have_now;
- #endif
- const enum XML_Error ret = parser->m_processor(parser, start, end, endPtr);
- if (ret == XML_ERROR_NONE) {
- // if we consumed nothing, remember what we had on this parse attempt.
- if (*endPtr == start) {
- parser->m_partialTokenBytesBefore = have_now;
- } else {
- parser->m_partialTokenBytesBefore = 0;
- }
- }
- return ret;
- }
- static XML_Bool /* only valid for root parser */
- startParsing(XML_Parser parser) {
- /* hash functions must be initialized before setContext() is called */
- if (parser->m_hash_secret_salt == 0)
- parser->m_hash_secret_salt = generate_hash_secret_salt(parser);
- if (parser->m_ns) {
- /* implicit context only set for root parser, since child
- parsers (i.e. external entity parsers) will inherit it
- */
- return setContext(parser, implicitContext);
- }
- return XML_TRUE;
- }
- XML_Parser XMLCALL
- XML_ParserCreate_MM(const XML_Char *encodingName,
- const XML_Memory_Handling_Suite *memsuite,
- const XML_Char *nameSep) {
- return parserCreate(encodingName, memsuite, nameSep, NULL);
- }
- static XML_Parser
- parserCreate(const XML_Char *encodingName,
- const XML_Memory_Handling_Suite *memsuite, const XML_Char *nameSep,
- DTD *dtd) {
- XML_Parser parser;
- if (memsuite) {
- XML_Memory_Handling_Suite *mtemp;
- parser = memsuite->malloc_fcn(sizeof(struct XML_ParserStruct));
- if (parser != NULL) {
- mtemp = (XML_Memory_Handling_Suite *)&(parser->m_mem);
- mtemp->malloc_fcn = memsuite->malloc_fcn;
- mtemp->realloc_fcn = memsuite->realloc_fcn;
- mtemp->free_fcn = memsuite->free_fcn;
- }
- } else {
- XML_Memory_Handling_Suite *mtemp;
- parser = (XML_Parser)malloc(sizeof(struct XML_ParserStruct));
- if (parser != NULL) {
- mtemp = (XML_Memory_Handling_Suite *)&(parser->m_mem);
- mtemp->malloc_fcn = malloc;
- mtemp->realloc_fcn = realloc;
- mtemp->free_fcn = free;
- }
- }
- if (! parser)
- return parser;
- parser->m_buffer = NULL;
- parser->m_bufferLim = NULL;
- parser->m_attsSize = INIT_ATTS_SIZE;
- parser->m_atts
- = (ATTRIBUTE *)MALLOC(parser, parser->m_attsSize * sizeof(ATTRIBUTE));
- if (parser->m_atts == NULL) {
- FREE(parser, parser);
- return NULL;
- }
- #ifdef XML_ATTR_INFO
- parser->m_attInfo = (XML_AttrInfo *)MALLOC(
- parser, parser->m_attsSize * sizeof(XML_AttrInfo));
- if (parser->m_attInfo == NULL) {
- FREE(parser, parser->m_atts);
- FREE(parser, parser);
- return NULL;
- }
- #endif
- parser->m_dataBuf
- = (XML_Char *)MALLOC(parser, INIT_DATA_BUF_SIZE * sizeof(XML_Char));
- if (parser->m_dataBuf == NULL) {
- FREE(parser, parser->m_atts);
- #ifdef XML_ATTR_INFO
- FREE(parser, parser->m_attInfo);
- #endif
- FREE(parser, parser);
- return NULL;
- }
- parser->m_dataBufEnd = parser->m_dataBuf + INIT_DATA_BUF_SIZE;
- if (dtd)
- parser->m_dtd = dtd;
- else {
- parser->m_dtd = dtdCreate(&parser->m_mem);
- if (parser->m_dtd == NULL) {
- FREE(parser, parser->m_dataBuf);
- FREE(parser, parser->m_atts);
- #ifdef XML_ATTR_INFO
- FREE(parser, parser->m_attInfo);
- #endif
- FREE(parser, parser);
- return NULL;
- }
- }
- parser->m_freeBindingList = NULL;
- parser->m_freeTagList = NULL;
- parser->m_freeInternalEntities = NULL;
- parser->m_groupSize = 0;
- parser->m_groupConnector = NULL;
- parser->m_unknownEncodingHandler = NULL;
- parser->m_unknownEncodingHandlerData = NULL;
- parser->m_namespaceSeparator = ASCII_EXCL;
- parser->m_ns = XML_FALSE;
- parser->m_ns_triplets = XML_FALSE;
- parser->m_nsAtts = NULL;
- parser->m_nsAttsVersion = 0;
- parser->m_nsAttsPower = 0;
- parser->m_protocolEncodingName = NULL;
- poolInit(&parser->m_tempPool, &(parser->m_mem));
- poolInit(&parser->m_temp2Pool, &(parser->m_mem));
- parserInit(parser, encodingName);
- if (encodingName && ! parser->m_protocolEncodingName) {
- if (dtd) {
- // We need to stop the upcoming call to XML_ParserFree from happily
- // destroying parser->m_dtd because the DTD is shared with the parent
- // parser and the only guard that keeps XML_ParserFree from destroying
- // parser->m_dtd is parser->m_isParamEntity but it will be set to
- // XML_TRUE only later in XML_ExternalEntityParserCreate (or not at all).
- parser->m_dtd = NULL;
- }
- XML_ParserFree(parser);
- return NULL;
- }
- if (nameSep) {
- parser->m_ns = XML_TRUE;
- parser->m_internalEncoding = XmlGetInternalEncodingNS();
- parser->m_namespaceSeparator = *nameSep;
- } else {
- parser->m_internalEncoding = XmlGetInternalEncoding();
- }
- return parser;
- }
- static void
- parserInit(XML_Parser parser, const XML_Char *encodingName) {
- parser->m_processor = prologInitProcessor;
- XmlPrologStateInit(&parser->m_prologState);
- if (encodingName != NULL) {
- parser->m_protocolEncodingName = copyString(encodingName, &(parser->m_mem));
- }
- parser->m_curBase = NULL;
- XmlInitEncoding(&parser->m_initEncoding, &parser->m_encoding, 0);
- parser->m_userData = NULL;
- parser->m_handlerArg = NULL;
- parser->m_startElementHandler = NULL;
- parser->m_endElementHandler = NULL;
- parser->m_characterDataHandler = NULL;
- parser->m_processingInstructionHandler = NULL;
- parser->m_commentHandler = NULL;
- parser->m_startCdataSectionHandler = NULL;
- parser->m_endCdataSectionHandler = NULL;
- parser->m_defaultHandler = NULL;
- parser->m_startDoctypeDeclHandler = NULL;
- parser->m_endDoctypeDeclHandler = NULL;
- parser->m_unparsedEntityDeclHandler = NULL;
- parser->m_notationDeclHandler = NULL;
- parser->m_startNamespaceDeclHandler = NULL;
- parser->m_endNamespaceDeclHandler = NULL;
- parser->m_notStandaloneHandler = NULL;
- parser->m_externalEntityRefHandler = NULL;
- parser->m_externalEntityRefHandlerArg = parser;
- parser->m_skippedEntityHandler = NULL;
- parser->m_elementDeclHandler = NULL;
- parser->m_attlistDeclHandler = NULL;
- parser->m_entityDeclHandler = NULL;
- parser->m_xmlDeclHandler = NULL;
- parser->m_bufferPtr = parser->m_buffer;
- parser->m_bufferEnd = parser->m_buffer;
- parser->m_parseEndByteIndex = 0;
- parser->m_parseEndPtr = NULL;
- parser->m_partialTokenBytesBefore = 0;
- parser->m_reparseDeferralEnabled = g_reparseDeferralEnabledDefault;
- parser->m_lastBufferRequestSize = 0;
- parser->m_declElementType = NULL;
- parser->m_declAttributeId = NULL;
- parser->m_declEntity = NULL;
- parser->m_doctypeName = NULL;
- parser->m_doctypeSysid = NULL;
- parser->m_doctypePubid = NULL;
- parser->m_declAttributeType = NULL;
- parser->m_declNotationName = NULL;
- parser->m_declNotationPublicId = NULL;
- parser->m_declAttributeIsCdata = XML_FALSE;
- parser->m_declAttributeIsId = XML_FALSE;
- memset(&parser->m_position, 0, sizeof(POSITION));
- parser->m_errorCode = XML_ERROR_NONE;
- parser->m_eventPtr = NULL;
- parser->m_eventEndPtr = NULL;
- parser->m_positionPtr = NULL;
- parser->m_openInternalEntities = NULL;
- parser->m_defaultExpandInternalEntities = XML_TRUE;
- parser->m_tagLevel = 0;
- parser->m_tagStack = NULL;
- parser->m_inheritedBindings = NULL;
- parser->m_nSpecifiedAtts = 0;
- parser->m_unknownEncodingMem = NULL;
- parser->m_unknownEncodingRelease = NULL;
- parser->m_unknownEncodingData = NULL;
- parser->m_parentParser = NULL;
- parser->m_parsingStatus.parsing = XML_INITIALIZED;
- #ifdef XML_DTD
- parser->m_isParamEntity = XML_FALSE;
- parser->m_useForeignDTD = XML_FALSE;
- parser->m_paramEntityParsing = XML_PARAM_ENTITY_PARSING_NEVER;
- #endif
- parser->m_hash_secret_salt = 0;
- #if XML_GE == 1
- memset(&parser->m_accounting, 0, sizeof(ACCOUNTING));
- parser->m_accounting.debugLevel = getDebugLevel("EXPAT_ACCOUNTING_DEBUG", 0u);
- parser->m_accounting.maximumAmplificationFactor
- = EXPAT_BILLION_LAUGHS_ATTACK_PROTECTION_MAXIMUM_AMPLIFICATION_DEFAULT;
- parser->m_accounting.activationThresholdBytes
- = EXPAT_BILLION_LAUGHS_ATTACK_PROTECTION_ACTIVATION_THRESHOLD_DEFAULT;
- memset(&parser->m_entity_stats, 0, sizeof(ENTITY_STATS));
- parser->m_entity_stats.debugLevel = getDebugLevel("EXPAT_ENTITY_DEBUG", 0u);
- #endif
- }
- /* moves list of bindings to m_freeBindingList */
- static void FASTCALL
- moveToFreeBindingList(XML_Parser parser, BINDING *bindings) {
- while (bindings) {
- BINDING *b = bindings;
- bindings = bindings->nextTagBinding;
- b->nextTagBinding = parser->m_freeBindingList;
- parser->m_freeBindingList = b;
- }
- }
- XML_Bool XMLCALL
- XML_ParserReset(XML_Parser parser, const XML_Char *encodingName) {
- TAG *tStk;
- OPEN_INTERNAL_ENTITY *openEntityList;
- if (parser == NULL)
- return XML_FALSE;
- if (parser->m_parentParser)
- return XML_FALSE;
- /* move m_tagStack to m_freeTagList */
- tStk = parser->m_tagStack;
- while (tStk) {
- TAG *tag = tStk;
- tStk = tStk->parent;
- tag->parent = parser->m_freeTagList;
- moveToFreeBindingList(parser, tag->bindings);
- tag->bindings = NULL;
- parser->m_freeTagList = tag;
- }
- /* move m_openInternalEntities to m_freeInternalEntities */
- openEntityList = parser->m_openInternalEntities;
- while (openEntityList) {
- OPEN_INTERNAL_ENTITY *openEntity = openEntityList;
- openEntityList = openEntity->next;
- openEntity->next = parser->m_freeInternalEntities;
- parser->m_freeInternalEntities = openEntity;
- }
- moveToFreeBindingList(parser, parser->m_inheritedBindings);
- FREE(parser, parser->m_unknownEncodingMem);
- if (parser->m_unknownEncodingRelease)
- parser->m_unknownEncodingRelease(parser->m_unknownEncodingData);
- poolClear(&parser->m_tempPool);
- poolClear(&parser->m_temp2Pool);
- FREE(parser, (void *)parser->m_protocolEncodingName);
- parser->m_protocolEncodingName = NULL;
- parserInit(parser, encodingName);
- dtdReset(parser->m_dtd, &parser->m_mem);
- return XML_TRUE;
- }
- enum XML_Status XMLCALL
- XML_SetEncoding(XML_Parser parser, const XML_Char *encodingName) {
- if (parser == NULL)
- return XML_STATUS_ERROR;
- /* Block after XML_Parse()/XML_ParseBuffer() has been called.
- XXX There's no way for the caller to determine which of the
- XXX possible error cases caused the XML_STATUS_ERROR return.
- */
- if (parser->m_parsingStatus.parsing == XML_PARSING
- || parser->m_parsingStatus.parsing == XML_SUSPENDED)
- return XML_STATUS_ERROR;
- /* Get rid of any previous encoding name */
- FREE(parser, (void *)parser->m_protocolEncodingName);
- if (encodingName == NULL)
- /* No new encoding name */
- parser->m_protocolEncodingName = NULL;
- else {
- /* Copy the new encoding name into allocated memory */
- parser->m_protocolEncodingName = copyString(encodingName, &(parser->m_mem));
- if (! parser->m_protocolEncodingName)
- return XML_STATUS_ERROR;
- }
- return XML_STATUS_OK;
- }
- XML_Parser XMLCALL
- XML_ExternalEntityParserCreate(XML_Parser oldParser, const XML_Char *context,
- const XML_Char *encodingName) {
- XML_Parser parser = oldParser;
- DTD *newDtd = NULL;
- DTD *oldDtd;
- XML_StartElementHandler oldStartElementHandler;
- XML_EndElementHandler oldEndElementHandler;
- XML_CharacterDataHandler oldCharacterDataHandler;
- XML_ProcessingInstructionHandler oldProcessingInstructionHandler;
- XML_CommentHandler oldCommentHandler;
- XML_StartCdataSectionHandler oldStartCdataSectionHandler;
- XML_EndCdataSectionHandler oldEndCdataSectionHandler;
- XML_DefaultHandler oldDefaultHandler;
- XML_UnparsedEntityDeclHandler oldUnparsedEntityDeclHandler;
- XML_NotationDeclHandler oldNotationDeclHandler;
- XML_StartNamespaceDeclHandler oldStartNamespaceDeclHandler;
- XML_EndNamespaceDeclHandler oldEndNamespaceDeclHandler;
- XML_NotStandaloneHandler oldNotStandaloneHandler;
- XML_ExternalEntityRefHandler oldExternalEntityRefHandler;
- XML_SkippedEntityHandler oldSkippedEntityHandler;
- XML_UnknownEncodingHandler oldUnknownEncodingHandler;
- XML_ElementDeclHandler oldElementDeclHandler;
- XML_AttlistDeclHandler oldAttlistDeclHandler;
- XML_EntityDeclHandler oldEntityDeclHandler;
- XML_XmlDeclHandler oldXmlDeclHandler;
- ELEMENT_TYPE *oldDeclElementType;
- void *oldUserData;
- void *oldHandlerArg;
- XML_Bool oldDefaultExpandInternalEntities;
- XML_Parser oldExternalEntityRefHandlerArg;
- #ifdef XML_DTD
- enum XML_ParamEntityParsing oldParamEntityParsing;
- int oldInEntityValue;
- #endif
- XML_Bool oldns_triplets;
- /* Note that the new parser shares the same hash secret as the old
- parser, so that dtdCopy and copyEntityTable can lookup values
- from hash tables associated with either parser without us having
- to worry which hash secrets each table has.
- */
- unsigned long oldhash_secret_salt;
- XML_Bool oldReparseDeferralEnabled;
- /* Validate the oldParser parameter before we pull everything out of it */
- if (oldParser == NULL)
- return NULL;
- /* Stash the original parser contents on the stack */
- oldDtd = parser->m_dtd;
- oldStartElementHandler = parser->m_startElementHandler;
- oldEndElementHandler = parser->m_endElementHandler;
- oldCharacterDataHandler = parser->m_characterDataHandler;
- oldProcessingInstructionHandler = parser->m_processingInstructionHandler;
- oldCommentHandler = parser->m_commentHandler;
- oldStartCdataSectionHandler = parser->m_startCdataSectionHandler;
- oldEndCdataSectionHandler = parser->m_endCdataSectionHandler;
- oldDefaultHandler = parser->m_defaultHandler;
- oldUnparsedEntityDeclHandler = parser->m_unparsedEntityDeclHandler;
- oldNotationDeclHandler = parser->m_notationDeclHandler;
- oldStartNamespaceDeclHandler = parser->m_startNamespaceDeclHandler;
- oldEndNamespaceDeclHandler = parser->m_endNamespaceDeclHandler;
- oldNotStandaloneHandler = parser->m_notStandaloneHandler;
- oldExternalEntityRefHandler = parser->m_externalEntityRefHandler;
- oldSkippedEntityHandler = parser->m_skippedEntityHandler;
- oldUnknownEncodingHandler = parser->m_unknownEncodingHandler;
- oldElementDeclHandler = parser->m_elementDeclHandler;
- oldAttlistDeclHandler = parser->m_attlistDeclHandler;
- oldEntityDeclHandler = parser->m_entityDeclHandler;
- oldXmlDeclHandler = parser->m_xmlDeclHandler;
- oldDeclElementType = parser->m_declElementType;
- oldUserData = parser->m_userData;
- oldHandlerArg = parser->m_handlerArg;
- oldDefaultExpandInternalEntities = parser->m_defaultExpandInternalEntities;
- oldExternalEntityRefHandlerArg = parser->m_externalEntityRefHandlerArg;
- #ifdef XML_DTD
- oldParamEntityParsing = parser->m_paramEntityParsing;
- oldInEntityValue = parser->m_prologState.inEntityValue;
- #endif
- oldns_triplets = parser->m_ns_triplets;
- /* Note that the new parser shares the same hash secret as the old
- parser, so that dtdCopy and copyEntityTable can lookup values
- from hash tables associated with either parser without us having
- to worry which hash secrets each table has.
- */
- oldhash_secret_salt = parser->m_hash_secret_salt;
- oldReparseDeferralEnabled = parser->m_reparseDeferralEnabled;
- #ifdef XML_DTD
- if (! context)
- newDtd = oldDtd;
- #endif /* XML_DTD */
- /* Note that the magical uses of the pre-processor to make field
- access look more like C++ require that `parser' be overwritten
- here. This makes this function more painful to follow than it
- would be otherwise.
- */
- if (parser->m_ns) {
- XML_Char tmp[2] = {parser->m_namespaceSeparator, 0};
- parser = parserCreate(encodingName, &parser->m_mem, tmp, newDtd);
- } else {
- parser = parserCreate(encodingName, &parser->m_mem, NULL, newDtd);
- }
- if (! parser)
- return NULL;
- parser->m_startElementHandler = oldStartElementHandler;
- parser->m_endElementHandler = oldEndElementHandler;
- parser->m_characterDataHandler = oldCharacterDataHandler;
- parser->m_processingInstructionHandler = oldProcessingInstructionHandler;
- parser->m_commentHandler = oldCommentHandler;
- parser->m_startCdataSectionHandler = oldStartCdataSectionHandler;
- parser->m_endCdataSectionHandler = oldEndCdataSectionHandler;
- parser->m_defaultHandler = oldDefaultHandler;
- parser->m_unparsedEntityDeclHandler = oldUnparsedEntityDeclHandler;
- parser->m_notationDeclHandler = oldNotationDeclHandler;
- parser->m_startNamespaceDeclHandler = oldStartNamespaceDeclHandler;
- parser->m_endNamespaceDeclHandler = oldEndNamespaceDeclHandler;
- parser->m_notStandaloneHandler = oldNotStandaloneHandler;
- parser->m_externalEntityRefHandler = oldExternalEntityRefHandler;
- parser->m_skippedEntityHandler = oldSkippedEntityHandler;
- parser->m_unknownEncodingHandler = oldUnknownEncodingHandler;
- parser->m_elementDeclHandler = oldElementDeclHandler;
- parser->m_attlistDeclHandler = oldAttlistDeclHandler;
- parser->m_entityDeclHandler = oldEntityDeclHandler;
- parser->m_xmlDeclHandler = oldXmlDeclHandler;
- parser->m_declElementType = oldDeclElementType;
- parser->m_userData = oldUserData;
- if (oldUserData == oldHandlerArg)
- parser->m_handlerArg = parser->m_userData;
- else
- parser->m_handlerArg = parser;
- if (oldExternalEntityRefHandlerArg != oldParser)
- parser->m_externalEntityRefHandlerArg = oldExternalEntityRefHandlerArg;
- parser->m_defaultExpandInternalEntities = oldDefaultExpandInternalEntities;
- parser->m_ns_triplets = oldns_triplets;
- parser->m_hash_secret_salt = oldhash_secret_salt;
- parser->m_reparseDeferralEnabled = oldReparseDeferralEnabled;
- parser->m_parentParser = oldParser;
- #ifdef XML_DTD
- parser->m_paramEntityParsing = oldParamEntityParsing;
- parser->m_prologState.inEntityValue = oldInEntityValue;
- if (context) {
- #endif /* XML_DTD */
- if (! dtdCopy(oldParser, parser->m_dtd, oldDtd, &parser->m_mem)
- || ! setContext(parser, context)) {
- XML_ParserFree(parser);
- return NULL;
- }
- parser->m_processor = externalEntityInitProcessor;
- #ifdef XML_DTD
- } else {
- /* The DTD instance referenced by parser->m_dtd is shared between the
- document's root parser and external PE parsers, therefore one does not
- need to call setContext. In addition, one also *must* not call
- setContext, because this would overwrite existing prefix->binding
- pointers in parser->m_dtd with ones that get destroyed with the external
- PE parser. This would leave those prefixes with dangling pointers.
- */
- parser->m_isParamEntity = XML_TRUE;
- XmlPrologStateInitExternalEntity(&parser->m_prologState);
- parser->m_processor = externalParEntInitProcessor;
- }
- #endif /* XML_DTD */
- return parser;
- }
- static void FASTCALL
- destroyBindings(BINDING *bindings, XML_Parser parser) {
- for (;;) {
- BINDING *b = bindings;
- if (! b)
- break;
- bindings = b->nextTagBinding;
- FREE(parser, b->uri);
- FREE(parser, b);
- }
- }
- void XMLCALL
- XML_ParserFree(XML_Parser parser) {
- TAG *tagList;
- OPEN_INTERNAL_ENTITY *entityList;
- if (parser == NULL)
- return;
- /* free m_tagStack and m_freeTagList */
- tagList = parser->m_tagStack;
- for (;;) {
- TAG *p;
- if (tagList == NULL) {
- if (parser->m_freeTagList == NULL)
- break;
- tagList = parser->m_freeTagList;
- parser->m_freeTagList = NULL;
- }
- p = tagList;
- tagList = tagList->parent;
- FREE(parser, p->buf);
- destroyBindings(p->bindings, parser);
- FREE(parser, p);
- }
- /* free m_openInternalEntities and m_freeInternalEntities */
- entityList = parser->m_openInternalEntities;
- for (;;) {
- OPEN_INTERNAL_ENTITY *openEntity;
- if (entityList == NULL) {
- if (parser->m_freeInternalEntities == NULL)
- break;
- entityList = parser->m_freeInternalEntities;
- parser->m_freeInternalEntities = NULL;
- }
- openEntity = entityList;
- entityList = entityList->next;
- FREE(parser, openEntity);
- }
- destroyBindings(parser->m_freeBindingList, parser);
- destroyBindings(parser->m_inheritedBindings, parser);
- poolDestroy(&parser->m_tempPool);
- poolDestroy(&parser->m_temp2Pool);
- FREE(parser, (void *)parser->m_protocolEncodingName);
- #ifdef XML_DTD
- /* external parameter entity parsers share the DTD structure
- parser->m_dtd with the root parser, so we must not destroy it
- */
- if (! parser->m_isParamEntity && parser->m_dtd)
- #else
- if (parser->m_dtd)
- #endif /* XML_DTD */
- dtdDestroy(parser->m_dtd, (XML_Bool)! parser->m_parentParser,
- &parser->m_mem);
- FREE(parser, (void *)parser->m_atts);
- #ifdef XML_ATTR_INFO
- FREE(parser, (void *)parser->m_attInfo);
- #endif
- FREE(parser, parser->m_groupConnector);
- FREE(parser, parser->m_buffer);
- FREE(parser, parser->m_dataBuf);
- FREE(parser, parser->m_nsAtts);
- FREE(parser, parser->m_unknownEncodingMem);
- if (parser->m_unknownEncodingRelease)
- parser->m_unknownEncodingRelease(parser->m_unknownEncodingData);
- FREE(parser, parser);
- }
- void XMLCALL
- XML_UseParserAsHandlerArg(XML_Parser parser) {
- if (parser != NULL)
- parser->m_handlerArg = parser;
- }
- enum XML_Error XMLCALL
- XML_UseForeignDTD(XML_Parser parser, XML_Bool useDTD) {
- if (parser == NULL)
- return XML_ERROR_INVALID_ARGUMENT;
- #ifdef XML_DTD
- /* block after XML_Parse()/XML_ParseBuffer() has been called */
- if (parser->m_parsingStatus.parsing == XML_PARSING
- || parser->m_parsingStatus.parsing == XML_SUSPENDED)
- return XML_ERROR_CANT_CHANGE_FEATURE_ONCE_PARSING;
- parser->m_useForeignDTD = useDTD;
- return XML_ERROR_NONE;
- #else
- UNUSED_P(useDTD);
- return XML_ERROR_FEATURE_REQUIRES_XML_DTD;
- #endif
- }
- void XMLCALL
- XML_SetReturnNSTriplet(XML_Parser parser, int do_nst) {
- if (parser == NULL)
- return;
- /* block after XML_Parse()/XML_ParseBuffer() has been called */
- if (parser->m_parsingStatus.parsing == XML_PARSING
- || parser->m_parsingStatus.parsing == XML_SUSPENDED)
- return;
- parser->m_ns_triplets = do_nst ? XML_TRUE : XML_FALSE;
- }
- void XMLCALL
- XML_SetUserData(XML_Parser parser, void *p) {
- if (parser == NULL)
- return;
- if (parser->m_handlerArg == parser->m_userData)
- parser->m_handlerArg = parser->m_userData = p;
- else
- parser->m_userData = p;
- }
- enum XML_Status XMLCALL
- XML_SetBase(XML_Parser parser, const XML_Char *p) {
- if (parser == NULL)
- return XML_STATUS_ERROR;
- if (p) {
- p = poolCopyString(&parser->m_dtd->pool, p);
- if (! p)
- return XML_STATUS_ERROR;
- parser->m_curBase = p;
- } else
- parser->m_curBase = NULL;
- return XML_STATUS_OK;
- }
- const XML_Char *XMLCALL
- XML_GetBase(XML_Parser parser) {
- if (parser == NULL)
- return NULL;
- return parser->m_curBase;
- }
- int XMLCALL
- XML_GetSpecifiedAttributeCount(XML_Parser parser) {
- if (parser == NULL)
- return -1;
- return parser->m_nSpecifiedAtts;
- }
- int XMLCALL
- XML_GetIdAttributeIndex(XML_Parser parser) {
- if (parser == NULL)
- return -1;
- return parser->m_idAttIndex;
- }
- #ifdef XML_ATTR_INFO
- const XML_AttrInfo *XMLCALL
- XML_GetAttributeInfo(XML_Parser parser) {
- if (parser == NULL)
- return NULL;
- return parser->m_attInfo;
- }
- #endif
- void XMLCALL
- XML_SetElementHandler(XML_Parser parser, XML_StartElementHandler start,
- XML_EndElementHandler end) {
- if (parser == NULL)
- return;
- parser->m_startElementHandler = start;
- parser->m_endElementHandler = end;
- }
- void XMLCALL
- XML_SetStartElementHandler(XML_Parser parser, XML_StartElementHandler start) {
- if (parser != NULL)
- parser->m_startElementHandler = start;
- }
- void XMLCALL
- XML_SetEndElementHandler(XML_Parser parser, XML_EndElementHandler end) {
- if (parser != NULL)
- parser->m_endElementHandler = end;
- }
- void XMLCALL
- XML_SetCharacterDataHandler(XML_Parser parser,
- XML_CharacterDataHandler handler) {
- if (parser != NULL)
- parser->m_characterDataHandler = handler;
- }
- void XMLCALL
- XML_SetProcessingInstructionHandler(XML_Parser parser,
- XML_ProcessingInstructionHandler handler) {
- if (parser != NULL)
- parser->m_processingInstructionHandler = handler;
- }
- void XMLCALL
- XML_SetCommentHandler(XML_Parser parser, XML_CommentHandler handler) {
- if (parser != NULL)
- parser->m_commentHandler = handler;
- }
- void XMLCALL
- XML_SetCdataSectionHandler(XML_Parser parser,
- XML_StartCdataSectionHandler start,
- XML_EndCdataSectionHandler end) {
- if (parser == NULL)
- return;
- parser->m_startCdataSectionHandler = start;
- parser->m_endCdataSectionHandler = end;
- }
- void XMLCALL
- XML_SetStartCdataSectionHandler(XML_Parser parser,
- XML_StartCdataSectionHandler start) {
- if (parser != NULL)
- parser->m_startCdataSectionHandler = start;
- }
- void XMLCALL
- XML_SetEndCdataSectionHandler(XML_Parser parser,
- XML_EndCdataSectionHandler end) {
- if (parser != NULL)
- parser->m_endCdataSectionHandler = end;
- }
- void XMLCALL
- XML_SetDefaultHandler(XML_Parser parser, XML_DefaultHandler handler) {
- if (parser == NULL)
- return;
- parser->m_defaultHandler = handler;
- parser->m_defaultExpandInternalEntities = XML_FALSE;
- }
- void XMLCALL
- XML_SetDefaultHandlerExpand(XML_Parser parser, XML_DefaultHandler handler) {
- if (parser == NULL)
- return;
- parser->m_defaultHandler = handler;
- parser->m_defaultExpandInternalEntities = XML_TRUE;
- }
- void XMLCALL
- XML_SetDoctypeDeclHandler(XML_Parser parser, XML_StartDoctypeDeclHandler start,
- XML_EndDoctypeDeclHandler end) {
- if (parser == NULL)
- return;
- parser->m_startDoctypeDeclHandler = start;
- parser->m_endDoctypeDeclHandler = end;
- }
- void XMLCALL
- XML_SetStartDoctypeDeclHandler(XML_Parser parser,
- XML_StartDoctypeDeclHandler start) {
- if (parser != NULL)
- parser->m_startDoctypeDeclHandler = start;
- }
- void XMLCALL
- XML_SetEndDoctypeDeclHandler(XML_Parser parser, XML_EndDoctypeDeclHandler end) {
- if (parser != NULL)
- parser->m_endDoctypeDeclHandler = end;
- }
- void XMLCALL
- XML_SetUnparsedEntityDeclHandler(XML_Parser parser,
- XML_UnparsedEntityDeclHandler handler) {
- if (parser != NULL)
- parser->m_unparsedEntityDeclHandler = handler;
- }
- void XMLCALL
- XML_SetNotationDeclHandler(XML_Parser parser, XML_NotationDeclHandler handler) {
- if (parser != NULL)
- parser->m_notationDeclHandler = handler;
- }
- void XMLCALL
- XML_SetNamespaceDeclHandler(XML_Parser parser,
- XML_StartNamespaceDeclHandler start,
- XML_EndNamespaceDeclHandler end) {
- if (parser == NULL)
- return;
- parser->m_startNamespaceDeclHandler = start;
- parser->m_endNamespaceDeclHandler = end;
- }
- void XMLCALL
- XML_SetStartNamespaceDeclHandler(XML_Parser parser,
- XML_StartNamespaceDeclHandler start) {
- if (parser != NULL)
- parser->m_startNamespaceDeclHandler = start;
- }
- void XMLCALL
- XML_SetEndNamespaceDeclHandler(XML_Parser parser,
- XML_EndNamespaceDeclHandler end) {
- if (parser != NULL)
- parser->m_endNamespaceDeclHandler = end;
- }
- void XMLCALL
- XML_SetNotStandaloneHandler(XML_Parser parser,
- XML_NotStandaloneHandler handler) {
- if (parser != NULL)
- parser->m_notStandaloneHandler = handler;
- }
- void XMLCALL
- XML_SetExternalEntityRefHandler(XML_Parser parser,
- XML_ExternalEntityRefHandler handler) {
- if (parser != NULL)
- parser->m_externalEntityRefHandler = handler;
- }
- void XMLCALL
- XML_SetExternalEntityRefHandlerArg(XML_Parser parser, void *arg) {
- if (parser == NULL)
- return;
- if (arg)
- parser->m_externalEntityRefHandlerArg = (XML_Parser)arg;
- else
- parser->m_externalEntityRefHandlerArg = parser;
- }
- void XMLCALL
- XML_SetSkippedEntityHandler(XML_Parser parser,
- XML_SkippedEntityHandler handler) {
- if (parser != NULL)
- parser->m_skippedEntityHandler = handler;
- }
- void XMLCALL
- XML_SetUnknownEncodingHandler(XML_Parser parser,
- XML_UnknownEncodingHandler handler, void *data) {
- if (parser == NULL)
- return;
- parser->m_unknownEncodingHandler = handler;
- parser->m_unknownEncodingHandlerData = data;
- }
- void XMLCALL
- XML_SetElementDeclHandler(XML_Parser parser, XML_ElementDeclHandler eldecl) {
- if (parser != NULL)
- parser->m_elementDeclHandler = eldecl;
- }
- void XMLCALL
- XML_SetAttlistDeclHandler(XML_Parser parser, XML_AttlistDeclHandler attdecl) {
- if (parser != NULL)
- parser->m_attlistDeclHandler = attdecl;
- }
- void XMLCALL
- XML_SetEntityDeclHandler(XML_Parser parser, XML_EntityDeclHandler handler) {
- if (parser != NULL)
- parser->m_entityDeclHandler = handler;
- }
- void XMLCALL
- XML_SetXmlDeclHandler(XML_Parser parser, XML_XmlDeclHandler handler) {
- if (parser != NULL)
- parser->m_xmlDeclHandler = handler;
- }
- int XMLCALL
- XML_SetParamEntityParsing(XML_Parser parser,
- enum XML_ParamEntityParsing peParsing) {
- if (parser == NULL)
- return 0;
- /* block after XML_Parse()/XML_ParseBuffer() has been called */
- if (parser->m_parsingStatus.parsing == XML_PARSING
- || parser->m_parsingStatus.parsing == XML_SUSPENDED)
- return 0;
- #ifdef XML_DTD
- parser->m_paramEntityParsing = peParsing;
- return 1;
- #else
- return peParsing == XML_PARAM_ENTITY_PARSING_NEVER;
- #endif
- }
- int XMLCALL
- XML_SetHashSalt(XML_Parser parser, unsigned long hash_salt) {
- if (parser == NULL)
- return 0;
- if (parser->m_parentParser)
- return XML_SetHashSalt(parser->m_parentParser, hash_salt);
- /* block after XML_Parse()/XML_ParseBuffer() has been called */
- if (parser->m_parsingStatus.parsing == XML_PARSING
- || parser->m_parsingStatus.parsing == XML_SUSPENDED)
- return 0;
- parser->m_hash_secret_salt = hash_salt;
- return 1;
- }
- enum XML_Status XMLCALL
- XML_Parse(XML_Parser parser, const char *s, int len, int isFinal) {
- if ((parser == NULL) || (len < 0) || ((s == NULL) && (len != 0))) {
- if (parser != NULL)
- parser->m_errorCode = XML_ERROR_INVALID_ARGUMENT;
- return XML_STATUS_ERROR;
- }
- switch (parser->m_parsingStatus.parsing) {
- case XML_SUSPENDED:
- parser->m_errorCode = XML_ERROR_SUSPENDED;
- return XML_STATUS_ERROR;
- case XML_FINISHED:
- parser->m_errorCode = XML_ERROR_FINISHED;
- return XML_STATUS_ERROR;
- case XML_INITIALIZED:
- if (parser->m_parentParser == NULL && ! startParsing(parser)) {
- parser->m_errorCode = XML_ERROR_NO_MEMORY;
- return XML_STATUS_ERROR;
- }
- /* fall through */
- default:
- parser->m_parsingStatus.parsing = XML_PARSING;
- }
- #if XML_CONTEXT_BYTES == 0
- if (parser->m_bufferPtr == parser->m_bufferEnd) {
- const char *end;
- int nLeftOver;
- enum XML_Status result;
- /* Detect overflow (a+b > MAX <==> b > MAX-a) */
- if ((XML_Size)len > ((XML_Size)-1) / 2 - parser->m_parseEndByteIndex) {
- parser->m_errorCode = XML_ERROR_NO_MEMORY;
- parser->m_eventPtr = parser->m_eventEndPtr = NULL;
- parser->m_processor = errorProcessor;
- return XML_STATUS_ERROR;
- }
- // though this isn't a buffer request, we assume that `len` is the app's
- // preferred buffer fill size, and therefore save it here.
- parser->m_lastBufferRequestSize = len;
- parser->m_parseEndByteIndex += len;
- parser->m_positionPtr = s;
- parser->m_parsingStatus.finalBuffer = (XML_Bool)isFinal;
- parser->m_errorCode
- = callProcessor(parser, s, parser->m_parseEndPtr = s + len, &end);
- if (parser->m_errorCode != XML_ERROR_NONE) {
- parser->m_eventEndPtr = parser->m_eventPtr;
- parser->m_processor = errorProcessor;
- return XML_STATUS_ERROR;
- } else {
- switch (parser->m_parsingStatus.parsing) {
- case XML_SUSPENDED:
- result = XML_STATUS_SUSPENDED;
- break;
- case XML_INITIALIZED:
- case XML_PARSING:
- if (isFinal) {
- parser->m_parsingStatus.parsing = XML_FINISHED;
- return XML_STATUS_OK;
- }
- /* fall through */
- default:
- result = XML_STATUS_OK;
- }
- }
- XmlUpdatePosition(parser->m_encoding, parser->m_positionPtr, end,
- &parser->m_position);
- nLeftOver = s + len - end;
- if (nLeftOver) {
- // Back up and restore the parsing status to avoid XML_ERROR_SUSPENDED
- // (and XML_ERROR_FINISHED) from XML_GetBuffer.
- const enum XML_Parsing originalStatus = parser->m_parsingStatus.parsing;
- parser->m_parsingStatus.parsing = XML_PARSING;
- void *const temp = XML_GetBuffer(parser, nLeftOver);
- parser->m_parsingStatus.parsing = originalStatus;
- // GetBuffer may have overwritten this, but we want to remember what the
- // app requested, not how many bytes were left over after parsing.
- parser->m_lastBufferRequestSize = len;
- if (temp == NULL) {
- // NOTE: parser->m_errorCode has already been set by XML_GetBuffer().
- parser->m_eventPtr = parser->m_eventEndPtr = NULL;
- parser->m_processor = errorProcessor;
- return XML_STATUS_ERROR;
- }
- // Since we know that the buffer was empty and XML_CONTEXT_BYTES is 0, we
- // don't have any data to preserve, and can copy straight into the start
- // of the buffer rather than the GetBuffer return pointer (which may be
- // pointing further into the allocated buffer).
- memcpy(parser->m_buffer, end, nLeftOver);
- }
- parser->m_bufferPtr = parser->m_buffer;
- parser->m_bufferEnd = parser->m_buffer + nLeftOver;
- parser->m_positionPtr = parser->m_bufferPtr;
- parser->m_parseEndPtr = parser->m_bufferEnd;
- parser->m_eventPtr = parser->m_bufferPtr;
- parser->m_eventEndPtr = parser->m_bufferPtr;
- return result;
- }
- #endif /* XML_CONTEXT_BYTES == 0 */
- void *buff = XML_GetBuffer(parser, len);
- if (buff == NULL)
- return XML_STATUS_ERROR;
- if (len > 0) {
- assert(s != NULL); // make sure s==NULL && len!=0 was rejected above
- memcpy(buff, s, len);
- }
- return XML_ParseBuffer(parser, len, isFinal);
- }
- enum XML_Status XMLCALL
- XML_ParseBuffer(XML_Parser parser, int len, int isFinal) {
- const char *start;
- enum XML_Status result = XML_STATUS_OK;
- if (parser == NULL)
- return XML_STATUS_ERROR;
- if (len < 0) {
- parser->m_errorCode = XML_ERROR_INVALID_ARGUMENT;
- return XML_STATUS_ERROR;
- }
- switch (parser->m_parsingStatus.parsing) {
- case XML_SUSPENDED:
- parser->m_errorCode = XML_ERROR_SUSPENDED;
- return XML_STATUS_ERROR;
- case XML_FINISHED:
- parser->m_errorCode = XML_ERROR_FINISHED;
- return XML_STATUS_ERROR;
- case XML_INITIALIZED:
- /* Has someone called XML_GetBuffer successfully before? */
- if (! parser->m_bufferPtr) {
- parser->m_errorCode = XML_ERROR_NO_BUFFER;
- return XML_STATUS_ERROR;
- }
- if (parser->m_parentParser == NULL && ! startParsing(parser)) {
- parser->m_errorCode = XML_ERROR_NO_MEMORY;
- return XML_STATUS_ERROR;
- }
- /* fall through */
- default:
- parser->m_parsingStatus.parsing = XML_PARSING;
- }
- start = parser->m_bufferPtr;
- parser->m_positionPtr = start;
- parser->m_bufferEnd += len;
- parser->m_parseEndPtr = parser->m_bufferEnd;
- parser->m_parseEndByteIndex += len;
- parser->m_parsingStatus.finalBuffer = (XML_Bool)isFinal;
- parser->m_errorCode = callProcessor(parser, start, parser->m_parseEndPtr,
- &parser->m_bufferPtr);
- if (parser->m_errorCode != XML_ERROR_NONE) {
- parser->m_eventEndPtr = parser->m_eventPtr;
- parser->m_processor = errorProcessor;
- return XML_STATUS_ERROR;
- } else {
- switch (parser->m_parsingStatus.parsing) {
- case XML_SUSPENDED:
- result = XML_STATUS_SUSPENDED;
- break;
- case XML_INITIALIZED:
- case XML_PARSING:
- if (isFinal) {
- parser->m_parsingStatus.parsing = XML_FINISHED;
- return result;
- }
- default:; /* should not happen */
- }
- }
- XmlUpdatePosition(parser->m_encoding, parser->m_positionPtr,
- parser->m_bufferPtr, &parser->m_position);
- parser->m_positionPtr = parser->m_bufferPtr;
- return result;
- }
- void *XMLCALL
- XML_GetBuffer(XML_Parser parser, int len) {
- if (parser == NULL)
- return NULL;
- if (len < 0) {
- parser->m_errorCode = XML_ERROR_NO_MEMORY;
- return NULL;
- }
- switch (parser->m_parsingStatus.parsing) {
- case XML_SUSPENDED:
- parser->m_errorCode = XML_ERROR_SUSPENDED;
- return NULL;
- case XML_FINISHED:
- parser->m_errorCode = XML_ERROR_FINISHED;
- return NULL;
- default:;
- }
- // whether or not the request succeeds, `len` seems to be the app's preferred
- // buffer fill size; remember it.
- parser->m_lastBufferRequestSize = len;
- if (len > EXPAT_SAFE_PTR_DIFF(parser->m_bufferLim, parser->m_bufferEnd)
- || parser->m_buffer == NULL) {
- #if XML_CONTEXT_BYTES > 0
- int keep;
- #endif /* XML_CONTEXT_BYTES > 0 */
- /* Do not invoke signed arithmetic overflow: */
- int neededSize = (int)((unsigned)len
- + (unsigned)EXPAT_SAFE_PTR_DIFF(
- parser->m_bufferEnd, parser->m_bufferPtr));
- if (neededSize < 0) {
- parser->m_errorCode = XML_ERROR_NO_MEMORY;
- return NULL;
- }
- #if XML_CONTEXT_BYTES > 0
- keep = (int)EXPAT_SAFE_PTR_DIFF(parser->m_bufferPtr, parser->m_buffer);
- if (keep > XML_CONTEXT_BYTES)
- keep = XML_CONTEXT_BYTES;
- /* Detect and prevent integer overflow */
- if (keep > INT_MAX - neededSize) {
- parser->m_errorCode = XML_ERROR_NO_MEMORY;
- return NULL;
- }
- neededSize += keep;
- #endif /* XML_CONTEXT_BYTES > 0 */
- if (parser->m_buffer && parser->m_bufferPtr
- && neededSize
- <= EXPAT_SAFE_PTR_DIFF(parser->m_bufferLim, parser->m_buffer)) {
- #if XML_CONTEXT_BYTES > 0
- if (keep < EXPAT_SAFE_PTR_DIFF(parser->m_bufferPtr, parser->m_buffer)) {
- int offset
- = (int)EXPAT_SAFE_PTR_DIFF(parser->m_bufferPtr, parser->m_buffer)
- - keep;
- /* The buffer pointers cannot be NULL here; we have at least some bytes
- * in the buffer */
- memmove(parser->m_buffer, &parser->m_buffer[offset],
- parser->m_bufferEnd - parser->m_bufferPtr + keep);
- parser->m_bufferEnd -= offset;
- parser->m_bufferPtr -= offset;
- }
- #else
- memmove(parser->m_buffer, parser->m_bufferPtr,
- EXPAT_SAFE_PTR_DIFF(parser->m_bufferEnd, parser->m_bufferPtr));
- parser->m_bufferEnd
- = parser->m_buffer
- + EXPAT_SAFE_PTR_DIFF(parser->m_bufferEnd, parser->m_bufferPtr);
- parser->m_bufferPtr = parser->m_buffer;
- #endif /* XML_CONTEXT_BYTES > 0 */
- } else {
- char *newBuf;
- int bufferSize
- = (int)EXPAT_SAFE_PTR_DIFF(parser->m_bufferLim, parser->m_buffer);
- if (bufferSize == 0)
- bufferSize = INIT_BUFFER_SIZE;
- do {
- /* Do not invoke signed arithmetic overflow: */
- bufferSize = (int)(2U * (unsigned)bufferSize);
- } while (bufferSize < neededSize && bufferSize > 0);
- if (bufferSize <= 0) {
- parser->m_errorCode = XML_ERROR_NO_MEMORY;
- return NULL;
- }
- newBuf = (char *)MALLOC(parser, bufferSize);
- if (newBuf == 0) {
- parser->m_errorCode = XML_ERROR_NO_MEMORY;
- return NULL;
- }
- parser->m_bufferLim = newBuf + bufferSize;
- #if XML_CONTEXT_BYTES > 0
- if (parser->m_bufferPtr) {
- memcpy(newBuf, &parser->m_bufferPtr[-keep],
- EXPAT_SAFE_PTR_DIFF(parser->m_bufferEnd, parser->m_bufferPtr)
- + keep);
- FREE(parser, parser->m_buffer);
- parser->m_buffer = newBuf;
- parser->m_bufferEnd
- = parser->m_buffer
- + EXPAT_SAFE_PTR_DIFF(parser->m_bufferEnd, parser->m_bufferPtr)
- + keep;
- parser->m_bufferPtr = parser->m_buffer + keep;
- } else {
- /* This must be a brand new buffer with no data in it yet */
- parser->m_bufferEnd = newBuf;
- parser->m_bufferPtr = parser->m_buffer = newBuf;
- }
- #else
- if (parser->m_bufferPtr) {
- memcpy(newBuf, parser->m_bufferPtr,
- EXPAT_SAFE_PTR_DIFF(parser->m_bufferEnd, parser->m_bufferPtr));
- FREE(parser, parser->m_buffer);
- parser->m_bufferEnd
- = newBuf
- + EXPAT_SAFE_PTR_DIFF(parser->m_bufferEnd, parser->m_bufferPtr);
- } else {
- /* This must be a brand new buffer with no data in it yet */
- parser->m_bufferEnd = newBuf;
- }
- parser->m_bufferPtr = parser->m_buffer = newBuf;
- #endif /* XML_CONTEXT_BYTES > 0 */
- }
- parser->m_eventPtr = parser->m_eventEndPtr = NULL;
- parser->m_positionPtr = NULL;
- }
- return parser->m_bufferEnd;
- }
- enum XML_Status XMLCALL
- XML_StopParser(XML_Parser parser, XML_Bool resumable) {
- if (parser == NULL)
- return XML_STATUS_ERROR;
- switch (parser->m_parsingStatus.parsing) {
- case XML_INITIALIZED:
- parser->m_errorCode = XML_ERROR_NOT_STARTED;
- return XML_STATUS_ERROR;
- case XML_SUSPENDED:
- if (resumable) {
- parser->m_errorCode = XML_ERROR_SUSPENDED;
- return XML_STATUS_ERROR;
- }
- parser->m_parsingStatus.parsing = XML_FINISHED;
- break;
- case XML_FINISHED:
- parser->m_errorCode = XML_ERROR_FINISHED;
- return XML_STATUS_ERROR;
- case XML_PARSING:
- if (resumable) {
- #ifdef XML_DTD
- if (parser->m_isParamEntity) {
- parser->m_errorCode = XML_ERROR_SUSPEND_PE;
- return XML_STATUS_ERROR;
- }
- #endif
- parser->m_parsingStatus.parsing = XML_SUSPENDED;
- } else
- parser->m_parsingStatus.parsing = XML_FINISHED;
- break;
- default:
- assert(0);
- }
- return XML_STATUS_OK;
- }
- enum XML_Status XMLCALL
- XML_ResumeParser(XML_Parser parser) {
- enum XML_Status result = XML_STATUS_OK;
- if (parser == NULL)
- return XML_STATUS_ERROR;
- if (parser->m_parsingStatus.parsing != XML_SUSPENDED) {
- parser->m_errorCode = XML_ERROR_NOT_SUSPENDED;
- return XML_STATUS_ERROR;
- }
- parser->m_parsingStatus.parsing = XML_PARSING;
- parser->m_errorCode = callProcessor(
- parser, parser->m_bufferPtr, parser->m_parseEndPtr, &parser->m_bufferPtr);
- if (parser->m_errorCode != XML_ERROR_NONE) {
- parser->m_eventEndPtr = parser->m_eventPtr;
- parser->m_processor = errorProcessor;
- return XML_STATUS_ERROR;
- } else {
- switch (parser->m_parsingStatus.parsing) {
- case XML_SUSPENDED:
- result = XML_STATUS_SUSPENDED;
- break;
- case XML_INITIALIZED:
- case XML_PARSING:
- if (parser->m_parsingStatus.finalBuffer) {
- parser->m_parsingStatus.parsing = XML_FINISHED;
- return result;
- }
- default:;
- }
- }
- XmlUpdatePosition(parser->m_encoding, parser->m_positionPtr,
- parser->m_bufferPtr, &parser->m_position);
- parser->m_positionPtr = parser->m_bufferPtr;
- return result;
- }
- void XMLCALL
- XML_GetParsingStatus(XML_Parser parser, XML_ParsingStatus *status) {
- if (parser == NULL)
- return;
- assert(status != NULL);
- *status = parser->m_parsingStatus;
- }
- enum XML_Error XMLCALL
- XML_GetErrorCode(XML_Parser parser) {
- if (parser == NULL)
- return XML_ERROR_INVALID_ARGUMENT;
- return parser->m_errorCode;
- }
- XML_Index XMLCALL
- XML_GetCurrentByteIndex(XML_Parser parser) {
- if (parser == NULL)
- return -1;
- if (parser->m_eventPtr)
- return (XML_Index)(parser->m_parseEndByteIndex
- - (parser->m_parseEndPtr - parser->m_eventPtr));
- return -1;
- }
- int XMLCALL
- XML_GetCurrentByteCount(XML_Parser parser) {
- if (parser == NULL)
- return 0;
- if (parser->m_eventEndPtr && parser->m_eventPtr)
- return (int)(parser->m_eventEndPtr - parser->m_eventPtr);
- return 0;
- }
- const char *XMLCALL
- XML_GetInputContext(XML_Parser parser, int *offset, int *size) {
- #if XML_CONTEXT_BYTES > 0
- if (parser == NULL)
- return NULL;
- if (parser->m_eventPtr && parser->m_buffer) {
- if (offset != NULL)
- *offset = (int)(parser->m_eventPtr - parser->m_buffer);
- if (size != NULL)
- *size = (int)(parser->m_bufferEnd - parser->m_buffer);
- return parser->m_buffer;
- }
- #else
- (void)parser;
- (void)offset;
- (void)size;
- #endif /* XML_CONTEXT_BYTES > 0 */
- return (const char *)0;
- }
- XML_Size XMLCALL
- XML_GetCurrentLineNumber(XML_Parser parser) {
- if (parser == NULL)
- return 0;
- if (parser->m_eventPtr && parser->m_eventPtr >= parser->m_positionPtr) {
- XmlUpdatePosition(parser->m_encoding, parser->m_positionPtr,
- parser->m_eventPtr, &parser->m_position);
- parser->m_positionPtr = parser->m_eventPtr;
- }
- return parser->m_position.lineNumber + 1;
- }
- XML_Size XMLCALL
- XML_GetCurrentColumnNumber(XML_Parser parser) {
- if (parser == NULL)
- return 0;
- if (parser->m_eventPtr && parser->m_eventPtr >= parser->m_positionPtr) {
- XmlUpdatePosition(parser->m_encoding, parser->m_positionPtr,
- parser->m_eventPtr, &parser->m_position);
- parser->m_positionPtr = parser->m_eventPtr;
- }
- return parser->m_position.columnNumber;
- }
- void XMLCALL
- XML_FreeContentModel(XML_Parser parser, XML_Content *model) {
- if (parser != NULL)
- FREE(parser, model);
- }
- void *XMLCALL
- XML_MemMalloc(XML_Parser parser, size_t size) {
- if (parser == NULL)
- return NULL;
- return MALLOC(parser, size);
- }
- void *XMLCALL
- XML_MemRealloc(XML_Parser parser, void *ptr, size_t size) {
- if (parser == NULL)
- return NULL;
- return REALLOC(parser, ptr, size);
- }
- void XMLCALL
- XML_MemFree(XML_Parser parser, void *ptr) {
- if (parser != NULL)
- FREE(parser, ptr);
- }
- void XMLCALL
- XML_DefaultCurrent(XML_Parser parser) {
- if (parser == NULL)
- return;
- if (parser->m_defaultHandler) {
- if (parser->m_openInternalEntities)
- reportDefault(parser, parser->m_internalEncoding,
- parser->m_openInternalEntities->internalEventPtr,
- parser->m_openInternalEntities->internalEventEndPtr);
- else
- reportDefault(parser, parser->m_encoding, parser->m_eventPtr,
- parser->m_eventEndPtr);
- }
- }
- const XML_LChar *XMLCALL
- XML_ErrorString(enum XML_Error code) {
- switch (code) {
- case XML_ERROR_NONE:
- return NULL;
- case XML_ERROR_NO_MEMORY:
- return XML_L("out of memory");
- case XML_ERROR_SYNTAX:
- return XML_L("syntax error");
- case XML_ERROR_NO_ELEMENTS:
- return XML_L("no element found");
- case XML_ERROR_INVALID_TOKEN:
- return XML_L("not well-formed (invalid token)");
- case XML_ERROR_UNCLOSED_TOKEN:
- return XML_L("unclosed token");
- case XML_ERROR_PARTIAL_CHAR:
- return XML_L("partial character");
- case XML_ERROR_TAG_MISMATCH:
- return XML_L("mismatched tag");
- case XML_ERROR_DUPLICATE_ATTRIBUTE:
- return XML_L("duplicate attribute");
- case XML_ERROR_JUNK_AFTER_DOC_ELEMENT:
- return XML_L("junk after document element");
- case XML_ERROR_PARAM_ENTITY_REF:
- return XML_L("illegal parameter entity reference");
- case XML_ERROR_UNDEFINED_ENTITY:
- return XML_L("undefined entity");
- case XML_ERROR_RECURSIVE_ENTITY_REF:
- return XML_L("recursive entity reference");
- case XML_ERROR_ASYNC_ENTITY:
- return XML_L("asynchronous entity");
- case XML_ERROR_BAD_CHAR_REF:
- return XML_L("reference to invalid character number");
- case XML_ERROR_BINARY_ENTITY_REF:
- return XML_L("reference to binary entity");
- case XML_ERROR_ATTRIBUTE_EXTERNAL_ENTITY_REF:
- return XML_L("reference to external entity in attribute");
- case XML_ERROR_MISPLACED_XML_PI:
- return XML_L("XML or text declaration not at start of entity");
- case XML_ERROR_UNKNOWN_ENCODING:
- return XML_L("unknown encoding");
- case XML_ERROR_INCORRECT_ENCODING:
- return XML_L("encoding specified in XML declaration is incorrect");
- case XML_ERROR_UNCLOSED_CDATA_SECTION:
- return XML_L("unclosed CDATA section");
- case XML_ERROR_EXTERNAL_ENTITY_HANDLING:
- return XML_L("error in processing external entity reference");
- case XML_ERROR_NOT_STANDALONE:
- return XML_L("document is not standalone");
- case XML_ERROR_UNEXPECTED_STATE:
- return XML_L("unexpected parser state - please send a bug report");
- case XML_ERROR_ENTITY_DECLARED_IN_PE:
- return XML_L("entity declared in parameter entity");
- case XML_ERROR_FEATURE_REQUIRES_XML_DTD:
- return XML_L("requested feature requires XML_DTD support in Expat");
- case XML_ERROR_CANT_CHANGE_FEATURE_ONCE_PARSING:
- return XML_L("cannot change setting once parsing has begun");
- /* Added in 1.95.7. */
- case XML_ERROR_UNBOUND_PREFIX:
- return XML_L("unbound prefix");
- /* Added in 1.95.8. */
- case XML_ERROR_UNDECLARING_PREFIX:
- return XML_L("must not undeclare prefix");
- case XML_ERROR_INCOMPLETE_PE:
- return XML_L("incomplete markup in parameter entity");
- case XML_ERROR_XML_DECL:
- return XML_L("XML declaration not well-formed");
- case XML_ERROR_TEXT_DECL:
- return XML_L("text declaration not well-formed");
- case XML_ERROR_PUBLICID:
- return XML_L("illegal character(s) in public id");
- case XML_ERROR_SUSPENDED:
- return XML_L("parser suspended");
- case XML_ERROR_NOT_SUSPENDED:
- return XML_L("parser not suspended");
- case XML_ERROR_ABORTED:
- return XML_L("parsing aborted");
- case XML_ERROR_FINISHED:
- return XML_L("parsing finished");
- case XML_ERROR_SUSPEND_PE:
- return XML_L("cannot suspend in external parameter entity");
- /* Added in 2.0.0. */
- case XML_ERROR_RESERVED_PREFIX_XML:
- return XML_L(
- "reserved prefix (xml) must not be undeclared or bound to another namespace name");
- case XML_ERROR_RESERVED_PREFIX_XMLNS:
- return XML_L("reserved prefix (xmlns) must not be declared or undeclared");
- case XML_ERROR_RESERVED_NAMESPACE_URI:
- return XML_L(
- "prefix must not be bound to one of the reserved namespace names");
- /* Added in 2.2.5. */
- case XML_ERROR_INVALID_ARGUMENT: /* Constant added in 2.2.1, already */
- return XML_L("invalid argument");
- /* Added in 2.3.0. */
- case XML_ERROR_NO_BUFFER:
- return XML_L(
- "a successful prior call to function XML_GetBuffer is required");
- /* Added in 2.4.0. */
- case XML_ERROR_AMPLIFICATION_LIMIT_BREACH:
- return XML_L(
- "limit on input amplification factor (from DTD and entities) breached");
- /* Added in 2.6.4. */
- case XML_ERROR_NOT_STARTED:
- return XML_L("parser not started");
- }
- return NULL;
- }
- const XML_LChar *XMLCALL
- XML_ExpatVersion(void) {
- /* V1 is used to string-ize the version number. However, it would
- string-ize the actual version macro *names* unless we get them
- substituted before being passed to V1. CPP is defined to expand
- a macro, then rescan for more expansions. Thus, we use V2 to expand
- the version macros, then CPP will expand the resulting V1() macro
- with the correct numerals. */
- /* ### I'm assuming cpp is portable in this respect... */
- #define V1(a, b, c) XML_L(#a) XML_L(".") XML_L(#b) XML_L(".") XML_L(#c)
- #define V2(a, b, c) XML_L("expat_") V1(a, b, c)
- return V2(XML_MAJOR_VERSION, XML_MINOR_VERSION, XML_MICRO_VERSION);
- #undef V1
- #undef V2
- }
- XML_Expat_Version XMLCALL
- XML_ExpatVersionInfo(void) {
- XML_Expat_Version version;
- version.major = XML_MAJOR_VERSION;
- version.minor = XML_MINOR_VERSION;
- version.micro = XML_MICRO_VERSION;
- return version;
- }
- const XML_Feature *XMLCALL
- XML_GetFeatureList(void) {
- static const XML_Feature features[] = {
- {XML_FEATURE_SIZEOF_XML_CHAR, XML_L("sizeof(XML_Char)"),
- sizeof(XML_Char)},
- {XML_FEATURE_SIZEOF_XML_LCHAR, XML_L("sizeof(XML_LChar)"),
- sizeof(XML_LChar)},
- #ifdef XML_UNICODE
- {XML_FEATURE_UNICODE, XML_L("XML_UNICODE"), 0},
- #endif
- #ifdef XML_UNICODE_WCHAR_T
- {XML_FEATURE_UNICODE_WCHAR_T, XML_L("XML_UNICODE_WCHAR_T"), 0},
- #endif
- #ifdef XML_DTD
- {XML_FEATURE_DTD, XML_L("XML_DTD"), 0},
- #endif
- #if XML_CONTEXT_BYTES > 0
- {XML_FEATURE_CONTEXT_BYTES, XML_L("XML_CONTEXT_BYTES"),
- XML_CONTEXT_BYTES},
- #endif
- #ifdef XML_MIN_SIZE
- {XML_FEATURE_MIN_SIZE, XML_L("XML_MIN_SIZE"), 0},
- #endif
- #ifdef XML_NS
- {XML_FEATURE_NS, XML_L("XML_NS"), 0},
- #endif
- #ifdef XML_LARGE_SIZE
- {XML_FEATURE_LARGE_SIZE, XML_L("XML_LARGE_SIZE"), 0},
- #endif
- #ifdef XML_ATTR_INFO
- {XML_FEATURE_ATTR_INFO, XML_L("XML_ATTR_INFO"), 0},
- #endif
- #if XML_GE == 1
- /* Added in Expat 2.4.0 for XML_DTD defined and
- * added in Expat 2.6.0 for XML_GE == 1. */
- {XML_FEATURE_BILLION_LAUGHS_ATTACK_PROTECTION_MAXIMUM_AMPLIFICATION_DEFAULT,
- XML_L("XML_BLAP_MAX_AMP"),
- (long int)
- EXPAT_BILLION_LAUGHS_ATTACK_PROTECTION_MAXIMUM_AMPLIFICATION_DEFAULT},
- {XML_FEATURE_BILLION_LAUGHS_ATTACK_PROTECTION_ACTIVATION_THRESHOLD_DEFAULT,
- XML_L("XML_BLAP_ACT_THRES"),
- EXPAT_BILLION_LAUGHS_ATTACK_PROTECTION_ACTIVATION_THRESHOLD_DEFAULT},
- /* Added in Expat 2.6.0. */
- {XML_FEATURE_GE, XML_L("XML_GE"), 0},
- #endif
- {XML_FEATURE_END, NULL, 0}};
- return features;
- }
- #if XML_GE == 1
- XML_Bool XMLCALL
- XML_SetBillionLaughsAttackProtectionMaximumAmplification(
- XML_Parser parser, float maximumAmplificationFactor) {
- if ((parser == NULL) || (parser->m_parentParser != NULL)
- || isnan(maximumAmplificationFactor)
- || (maximumAmplificationFactor < 1.0f)) {
- return XML_FALSE;
- }
- parser->m_accounting.maximumAmplificationFactor = maximumAmplificationFactor;
- return XML_TRUE;
- }
- XML_Bool XMLCALL
- XML_SetBillionLaughsAttackProtectionActivationThreshold(
- XML_Parser parser, unsigned long long activationThresholdBytes) {
- if ((parser == NULL) || (parser->m_parentParser != NULL)) {
- return XML_FALSE;
- }
- parser->m_accounting.activationThresholdBytes = activationThresholdBytes;
- return XML_TRUE;
- }
- #endif /* XML_GE == 1 */
- XML_Bool XMLCALL
- XML_SetReparseDeferralEnabled(XML_Parser parser, XML_Bool enabled) {
- if (parser != NULL && (enabled == XML_TRUE || enabled == XML_FALSE)) {
- parser->m_reparseDeferralEnabled = enabled;
- return XML_TRUE;
- }
- return XML_FALSE;
- }
- /* Initially tag->rawName always points into the parse buffer;
- for those TAG instances opened while the current parse buffer was
- processed, and not yet closed, we need to store tag->rawName in a more
- permanent location, since the parse buffer is about to be discarded.
- */
- static XML_Bool
- storeRawNames(XML_Parser parser) {
- TAG *tag = parser->m_tagStack;
- while (tag) {
- int bufSize;
- int nameLen = sizeof(XML_Char) * (tag->name.strLen + 1);
- size_t rawNameLen;
- char *rawNameBuf = tag->buf + nameLen;
- /* Stop if already stored. Since m_tagStack is a stack, we can stop
- at the first entry that has already been copied; everything
- below it in the stack is already been accounted for in a
- previous call to this function.
- */
- if (tag->rawName == rawNameBuf)
- break;
- /* For reuse purposes we need to ensure that the
- size of tag->buf is a multiple of sizeof(XML_Char).
- */
- rawNameLen = ROUND_UP(tag->rawNameLength, sizeof(XML_Char));
- /* Detect and prevent integer overflow. */
- if (rawNameLen > (size_t)INT_MAX - nameLen)
- return XML_FALSE;
- bufSize = nameLen + (int)rawNameLen;
- if (bufSize > tag->bufEnd - tag->buf) {
- char *temp = (char *)REALLOC(parser, tag->buf, bufSize);
- if (temp == NULL)
- return XML_FALSE;
- /* if tag->name.str points to tag->buf (only when namespace
- processing is off) then we have to update it
- */
- if (tag->name.str == (XML_Char *)tag->buf)
- tag->name.str = (XML_Char *)temp;
- /* if tag->name.localPart is set (when namespace processing is on)
- then update it as well, since it will always point into tag->buf
- */
- if (tag->name.localPart)
- tag->name.localPart
- = (XML_Char *)temp + (tag->name.localPart - (XML_Char *)tag->buf);
- tag->buf = temp;
- tag->bufEnd = temp + bufSize;
- rawNameBuf = temp + nameLen;
- }
- memcpy(rawNameBuf, tag->rawName, tag->rawNameLength);
- tag->rawName = rawNameBuf;
- tag = tag->parent;
- }
- return XML_TRUE;
- }
- static enum XML_Error PTRCALL
- contentProcessor(XML_Parser parser, const char *start, const char *end,
- const char **endPtr) {
- enum XML_Error result = doContent(
- parser, 0, parser->m_encoding, start, end, endPtr,
- (XML_Bool)! parser->m_parsingStatus.finalBuffer, XML_ACCOUNT_DIRECT);
- if (result == XML_ERROR_NONE) {
- if (! storeRawNames(parser))
- return XML_ERROR_NO_MEMORY;
- }
- return result;
- }
- static enum XML_Error PTRCALL
- externalEntityInitProcessor(XML_Parser parser, const char *start,
- const char *end, const char **endPtr) {
- enum XML_Error result = initializeEncoding(parser);
- if (result != XML_ERROR_NONE)
- return result;
- parser->m_processor = externalEntityInitProcessor2;
- return externalEntityInitProcessor2(parser, start, end, endPtr);
- }
- static enum XML_Error PTRCALL
- externalEntityInitProcessor2(XML_Parser parser, const char *start,
- const char *end, const char **endPtr) {
- const char *next = start; /* XmlContentTok doesn't always set the last arg */
- int tok = XmlContentTok(parser->m_encoding, start, end, &next);
- switch (tok) {
- case XML_TOK_BOM:
- #if XML_GE == 1
- if (! accountingDiffTolerated(parser, tok, start, next, __LINE__,
- XML_ACCOUNT_DIRECT)) {
- accountingOnAbort(parser);
- return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
- }
- #endif /* XML_GE == 1 */
- /* If we are at the end of the buffer, this would cause the next stage,
- i.e. externalEntityInitProcessor3, to pass control directly to
- doContent (by detecting XML_TOK_NONE) without processing any xml text
- declaration - causing the error XML_ERROR_MISPLACED_XML_PI in doContent.
- */
- if (next == end && ! parser->m_parsingStatus.finalBuffer) {
- *endPtr = next;
- return XML_ERROR_NONE;
- }
- start = next;
- break;
- case XML_TOK_PARTIAL:
- if (! parser->m_parsingStatus.finalBuffer) {
- *endPtr = start;
- return XML_ERROR_NONE;
- }
- parser->m_eventPtr = start;
- return XML_ERROR_UNCLOSED_TOKEN;
- case XML_TOK_PARTIAL_CHAR:
- if (! parser->m_parsingStatus.finalBuffer) {
- *endPtr = start;
- return XML_ERROR_NONE;
- }
- parser->m_eventPtr = start;
- return XML_ERROR_PARTIAL_CHAR;
- }
- parser->m_processor = externalEntityInitProcessor3;
- return externalEntityInitProcessor3(parser, start, end, endPtr);
- }
- static enum XML_Error PTRCALL
- externalEntityInitProcessor3(XML_Parser parser, const char *start,
- const char *end, const char **endPtr) {
- int tok;
- const char *next = start; /* XmlContentTok doesn't always set the last arg */
- parser->m_eventPtr = start;
- tok = XmlContentTok(parser->m_encoding, start, end, &next);
- /* Note: These bytes are accounted later in:
- - processXmlDecl
- - externalEntityContentProcessor
- */
- parser->m_eventEndPtr = next;
- switch (tok) {
- case XML_TOK_XML_DECL: {
- enum XML_Error result;
- result = processXmlDecl(parser, 1, start, next);
- if (result != XML_ERROR_NONE)
- return result;
- switch (parser->m_parsingStatus.parsing) {
- case XML_SUSPENDED:
- *endPtr = next;
- return XML_ERROR_NONE;
- case XML_FINISHED:
- return XML_ERROR_ABORTED;
- default:
- start = next;
- }
- } break;
- case XML_TOK_PARTIAL:
- if (! parser->m_parsingStatus.finalBuffer) {
- *endPtr = start;
- return XML_ERROR_NONE;
- }
- return XML_ERROR_UNCLOSED_TOKEN;
- case XML_TOK_PARTIAL_CHAR:
- if (! parser->m_parsingStatus.finalBuffer) {
- *endPtr = start;
- return XML_ERROR_NONE;
- }
- return XML_ERROR_PARTIAL_CHAR;
- }
- parser->m_processor = externalEntityContentProcessor;
- parser->m_tagLevel = 1;
- return externalEntityContentProcessor(parser, start, end, endPtr);
- }
- static enum XML_Error PTRCALL
- externalEntityContentProcessor(XML_Parser parser, const char *start,
- const char *end, const char **endPtr) {
- enum XML_Error result
- = doContent(parser, 1, parser->m_encoding, start, end, endPtr,
- (XML_Bool)! parser->m_parsingStatus.finalBuffer,
- XML_ACCOUNT_ENTITY_EXPANSION);
- if (result == XML_ERROR_NONE) {
- if (! storeRawNames(parser))
- return XML_ERROR_NO_MEMORY;
- }
- return result;
- }
- static enum XML_Error
- doContent(XML_Parser parser, int startTagLevel, const ENCODING *enc,
- const char *s, const char *end, const char **nextPtr,
- XML_Bool haveMore, enum XML_Account account) {
- /* save one level of indirection */
- DTD *const dtd = parser->m_dtd;
- const char **eventPP;
- const char **eventEndPP;
- if (enc == parser->m_encoding) {
- eventPP = &parser->m_eventPtr;
- eventEndPP = &parser->m_eventEndPtr;
- } else {
- eventPP = &(parser->m_openInternalEntities->internalEventPtr);
- eventEndPP = &(parser->m_openInternalEntities->internalEventEndPtr);
- }
- *eventPP = s;
- for (;;) {
- const char *next = s; /* XmlContentTok doesn't always set the last arg */
- int tok = XmlContentTok(enc, s, end, &next);
- #if XML_GE == 1
- const char *accountAfter
- = ((tok == XML_TOK_TRAILING_RSQB) || (tok == XML_TOK_TRAILING_CR))
- ? (haveMore ? s /* i.e. 0 bytes */ : end)
- : next;
- if (! accountingDiffTolerated(parser, tok, s, accountAfter, __LINE__,
- account)) {
- accountingOnAbort(parser);
- return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
- }
- #endif
- *eventEndPP = next;
- switch (tok) {
- case XML_TOK_TRAILING_CR:
- if (haveMore) {
- *nextPtr = s;
- return XML_ERROR_NONE;
- }
- *eventEndPP = end;
- if (parser->m_characterDataHandler) {
- XML_Char c = 0xA;
- parser->m_characterDataHandler(parser->m_handlerArg, &c, 1);
- } else if (parser->m_defaultHandler)
- reportDefault(parser, enc, s, end);
- /* We are at the end of the final buffer, should we check for
- XML_SUSPENDED, XML_FINISHED?
- */
- if (startTagLevel == 0)
- return XML_ERROR_NO_ELEMENTS;
- if (parser->m_tagLevel != startTagLevel)
- return XML_ERROR_ASYNC_ENTITY;
- *nextPtr = end;
- return XML_ERROR_NONE;
- case XML_TOK_NONE:
- if (haveMore) {
- *nextPtr = s;
- return XML_ERROR_NONE;
- }
- if (startTagLevel > 0) {
- if (parser->m_tagLevel != startTagLevel)
- return XML_ERROR_ASYNC_ENTITY;
- *nextPtr = s;
- return XML_ERROR_NONE;
- }
- return XML_ERROR_NO_ELEMENTS;
- case XML_TOK_INVALID:
- *eventPP = next;
- return XML_ERROR_INVALID_TOKEN;
- case XML_TOK_PARTIAL:
- if (haveMore) {
- *nextPtr = s;
- return XML_ERROR_NONE;
- }
- return XML_ERROR_UNCLOSED_TOKEN;
- case XML_TOK_PARTIAL_CHAR:
- if (haveMore) {
- *nextPtr = s;
- return XML_ERROR_NONE;
- }
- return XML_ERROR_PARTIAL_CHAR;
- case XML_TOK_ENTITY_REF: {
- const XML_Char *name;
- ENTITY *entity;
- XML_Char ch = (XML_Char)XmlPredefinedEntityName(
- enc, s + enc->minBytesPerChar, next - enc->minBytesPerChar);
- if (ch) {
- #if XML_GE == 1
- /* NOTE: We are replacing 4-6 characters original input for 1 character
- * so there is no amplification and hence recording without
- * protection. */
- accountingDiffTolerated(parser, tok, (char *)&ch,
- ((char *)&ch) + sizeof(XML_Char), __LINE__,
- XML_ACCOUNT_ENTITY_EXPANSION);
- #endif /* XML_GE == 1 */
- if (parser->m_characterDataHandler)
- parser->m_characterDataHandler(parser->m_handlerArg, &ch, 1);
- else if (parser->m_defaultHandler)
- reportDefault(parser, enc, s, next);
- break;
- }
- name = poolStoreString(&dtd->pool, enc, s + enc->minBytesPerChar,
- next - enc->minBytesPerChar);
- if (! name)
- return XML_ERROR_NO_MEMORY;
- entity = (ENTITY *)lookup(parser, &dtd->generalEntities, name, 0);
- poolDiscard(&dtd->pool);
- /* First, determine if a check for an existing declaration is needed;
- if yes, check that the entity exists, and that it is internal,
- otherwise call the skipped entity or default handler.
- */
- if (! dtd->hasParamEntityRefs || dtd->standalone) {
- if (! entity)
- return XML_ERROR_UNDEFINED_ENTITY;
- else if (! entity->is_internal)
- return XML_ERROR_ENTITY_DECLARED_IN_PE;
- } else if (! entity) {
- if (parser->m_skippedEntityHandler)
- parser->m_skippedEntityHandler(parser->m_handlerArg, name, 0);
- else if (parser->m_defaultHandler)
- reportDefault(parser, enc, s, next);
- break;
- }
- if (entity->open)
- return XML_ERROR_RECURSIVE_ENTITY_REF;
- if (entity->notation)
- return XML_ERROR_BINARY_ENTITY_REF;
- if (entity->textPtr) {
- enum XML_Error result;
- if (! parser->m_defaultExpandInternalEntities) {
- if (parser->m_skippedEntityHandler)
- parser->m_skippedEntityHandler(parser->m_handlerArg, entity->name,
- 0);
- else if (parser->m_defaultHandler)
- reportDefault(parser, enc, s, next);
- break;
- }
- result = processInternalEntity(parser, entity, XML_FALSE);
- if (result != XML_ERROR_NONE)
- return result;
- } else if (parser->m_externalEntityRefHandler) {
- const XML_Char *context;
- entity->open = XML_TRUE;
- context = getContext(parser);
- entity->open = XML_FALSE;
- if (! context)
- return XML_ERROR_NO_MEMORY;
- if (! parser->m_externalEntityRefHandler(
- parser->m_externalEntityRefHandlerArg, context, entity->base,
- entity->systemId, entity->publicId))
- return XML_ERROR_EXTERNAL_ENTITY_HANDLING;
- poolDiscard(&parser->m_tempPool);
- } else if (parser->m_defaultHandler)
- reportDefault(parser, enc, s, next);
- break;
- }
- case XML_TOK_START_TAG_NO_ATTS:
- /* fall through */
- case XML_TOK_START_TAG_WITH_ATTS: {
- TAG *tag;
- enum XML_Error result;
- XML_Char *toPtr;
- if (parser->m_freeTagList) {
- tag = parser->m_freeTagList;
- parser->m_freeTagList = parser->m_freeTagList->parent;
- } else {
- tag = (TAG *)MALLOC(parser, sizeof(TAG));
- if (! tag)
- return XML_ERROR_NO_MEMORY;
- tag->buf = (char *)MALLOC(parser, INIT_TAG_BUF_SIZE);
- if (! tag->buf) {
- FREE(parser, tag);
- return XML_ERROR_NO_MEMORY;
- }
- tag->bufEnd = tag->buf + INIT_TAG_BUF_SIZE;
- }
- tag->bindings = NULL;
- tag->parent = parser->m_tagStack;
- parser->m_tagStack = tag;
- tag->name.localPart = NULL;
- tag->name.prefix = NULL;
- tag->rawName = s + enc->minBytesPerChar;
- tag->rawNameLength = XmlNameLength(enc, tag->rawName);
- ++parser->m_tagLevel;
- {
- const char *rawNameEnd = tag->rawName + tag->rawNameLength;
- const char *fromPtr = tag->rawName;
- toPtr = (XML_Char *)tag->buf;
- for (;;) {
- int bufSize;
- int convLen;
- const enum XML_Convert_Result convert_res
- = XmlConvert(enc, &fromPtr, rawNameEnd, (ICHAR **)&toPtr,
- (ICHAR *)tag->bufEnd - 1);
- convLen = (int)(toPtr - (XML_Char *)tag->buf);
- if ((fromPtr >= rawNameEnd)
- || (convert_res == XML_CONVERT_INPUT_INCOMPLETE)) {
- tag->name.strLen = convLen;
- break;
- }
- bufSize = (int)(tag->bufEnd - tag->buf) << 1;
- {
- char *temp = (char *)REALLOC(parser, tag->buf, bufSize);
- if (temp == NULL)
- return XML_ERROR_NO_MEMORY;
- tag->buf = temp;
- tag->bufEnd = temp + bufSize;
- toPtr = (XML_Char *)temp + convLen;
- }
- }
- }
- tag->name.str = (XML_Char *)tag->buf;
- *toPtr = XML_T('\0');
- result
- = storeAtts(parser, enc, s, &(tag->name), &(tag->bindings), account);
- if (result)
- return result;
- if (parser->m_startElementHandler)
- parser->m_startElementHandler(parser->m_handlerArg, tag->name.str,
- (const XML_Char **)parser->m_atts);
- else if (parser->m_defaultHandler)
- reportDefault(parser, enc, s, next);
- poolClear(&parser->m_tempPool);
- break;
- }
- case XML_TOK_EMPTY_ELEMENT_NO_ATTS:
- /* fall through */
- case XML_TOK_EMPTY_ELEMENT_WITH_ATTS: {
- const char *rawName = s + enc->minBytesPerChar;
- enum XML_Error result;
- BINDING *bindings = NULL;
- XML_Bool noElmHandlers = XML_TRUE;
- TAG_NAME name;
- name.str = poolStoreString(&parser->m_tempPool, enc, rawName,
- rawName + XmlNameLength(enc, rawName));
- if (! name.str)
- return XML_ERROR_NO_MEMORY;
- poolFinish(&parser->m_tempPool);
- result = storeAtts(parser, enc, s, &name, &bindings,
- XML_ACCOUNT_NONE /* token spans whole start tag */);
- if (result != XML_ERROR_NONE) {
- freeBindings(parser, bindings);
- return result;
- }
- poolFinish(&parser->m_tempPool);
- if (parser->m_startElementHandler) {
- parser->m_startElementHandler(parser->m_handlerArg, name.str,
- (const XML_Char **)parser->m_atts);
- noElmHandlers = XML_FALSE;
- }
- if (parser->m_endElementHandler) {
- if (parser->m_startElementHandler)
- *eventPP = *eventEndPP;
- parser->m_endElementHandler(parser->m_handlerArg, name.str);
- noElmHandlers = XML_FALSE;
- }
- if (noElmHandlers && parser->m_defaultHandler)
- reportDefault(parser, enc, s, next);
- poolClear(&parser->m_tempPool);
- freeBindings(parser, bindings);
- }
- if ((parser->m_tagLevel == 0)
- && (parser->m_parsingStatus.parsing != XML_FINISHED)) {
- if (parser->m_parsingStatus.parsing == XML_SUSPENDED)
- parser->m_processor = epilogProcessor;
- else
- return epilogProcessor(parser, next, end, nextPtr);
- }
- break;
- case XML_TOK_END_TAG:
- if (parser->m_tagLevel == startTagLevel)
- return XML_ERROR_ASYNC_ENTITY;
- else {
- int len;
- const char *rawName;
- TAG *tag = parser->m_tagStack;
- rawName = s + enc->minBytesPerChar * 2;
- len = XmlNameLength(enc, rawName);
- if (len != tag->rawNameLength
- || memcmp(tag->rawName, rawName, len) != 0) {
- *eventPP = rawName;
- return XML_ERROR_TAG_MISMATCH;
- }
- parser->m_tagStack = tag->parent;
- tag->parent = parser->m_freeTagList;
- parser->m_freeTagList = tag;
- --parser->m_tagLevel;
- if (parser->m_endElementHandler) {
- const XML_Char *localPart;
- const XML_Char *prefix;
- XML_Char *uri;
- localPart = tag->name.localPart;
- if (parser->m_ns && localPart) {
- /* localPart and prefix may have been overwritten in
- tag->name.str, since this points to the binding->uri
- buffer which gets reused; so we have to add them again
- */
- uri = (XML_Char *)tag->name.str + tag->name.uriLen;
- /* don't need to check for space - already done in storeAtts() */
- while (*localPart)
- *uri++ = *localPart++;
- prefix = tag->name.prefix;
- if (parser->m_ns_triplets && prefix) {
- *uri++ = parser->m_namespaceSeparator;
- while (*prefix)
- *uri++ = *prefix++;
- }
- *uri = XML_T('\0');
- }
- parser->m_endElementHandler(parser->m_handlerArg, tag->name.str);
- } else if (parser->m_defaultHandler)
- reportDefault(parser, enc, s, next);
- while (tag->bindings) {
- BINDING *b = tag->bindings;
- if (parser->m_endNamespaceDeclHandler)
- parser->m_endNamespaceDeclHandler(parser->m_handlerArg,
- b->prefix->name);
- tag->bindings = tag->bindings->nextTagBinding;
- b->nextTagBinding = parser->m_freeBindingList;
- parser->m_freeBindingList = b;
- b->prefix->binding = b->prevPrefixBinding;
- }
- if ((parser->m_tagLevel == 0)
- && (parser->m_parsingStatus.parsing != XML_FINISHED)) {
- if (parser->m_parsingStatus.parsing == XML_SUSPENDED)
- parser->m_processor = epilogProcessor;
- else
- return epilogProcessor(parser, next, end, nextPtr);
- }
- }
- break;
- case XML_TOK_CHAR_REF: {
- int n = XmlCharRefNumber(enc, s);
- if (n < 0)
- return XML_ERROR_BAD_CHAR_REF;
- if (parser->m_characterDataHandler) {
- XML_Char buf[XML_ENCODE_MAX];
- parser->m_characterDataHandler(parser->m_handlerArg, buf,
- XmlEncode(n, (ICHAR *)buf));
- } else if (parser->m_defaultHandler)
- reportDefault(parser, enc, s, next);
- } break;
- case XML_TOK_XML_DECL:
- return XML_ERROR_MISPLACED_XML_PI;
- case XML_TOK_DATA_NEWLINE:
- if (parser->m_characterDataHandler) {
- XML_Char c = 0xA;
- parser->m_characterDataHandler(parser->m_handlerArg, &c, 1);
- } else if (parser->m_defaultHandler)
- reportDefault(parser, enc, s, next);
- break;
- case XML_TOK_CDATA_SECT_OPEN: {
- enum XML_Error result;
- if (parser->m_startCdataSectionHandler)
- parser->m_startCdataSectionHandler(parser->m_handlerArg);
- /* BEGIN disabled code */
- /* Suppose you doing a transformation on a document that involves
- changing only the character data. You set up a defaultHandler
- and a characterDataHandler. The defaultHandler simply copies
- characters through. The characterDataHandler does the
- transformation and writes the characters out escaping them as
- necessary. This case will fail to work if we leave out the
- following two lines (because & and < inside CDATA sections will
- be incorrectly escaped).
- However, now we have a start/endCdataSectionHandler, so it seems
- easier to let the user deal with this.
- */
- else if ((0) && parser->m_characterDataHandler)
- parser->m_characterDataHandler(parser->m_handlerArg, parser->m_dataBuf,
- 0);
- /* END disabled code */
- else if (parser->m_defaultHandler)
- reportDefault(parser, enc, s, next);
- result
- = doCdataSection(parser, enc, &next, end, nextPtr, haveMore, account);
- if (result != XML_ERROR_NONE)
- return result;
- else if (! next) {
- parser->m_processor = cdataSectionProcessor;
- return result;
- }
- } break;
- case XML_TOK_TRAILING_RSQB:
- if (haveMore) {
- *nextPtr = s;
- return XML_ERROR_NONE;
- }
- if (parser->m_characterDataHandler) {
- if (MUST_CONVERT(enc, s)) {
- ICHAR *dataPtr = (ICHAR *)parser->m_dataBuf;
- XmlConvert(enc, &s, end, &dataPtr, (ICHAR *)parser->m_dataBufEnd);
- parser->m_characterDataHandler(
- parser->m_handlerArg, parser->m_dataBuf,
- (int)(dataPtr - (ICHAR *)parser->m_dataBuf));
- } else
- parser->m_characterDataHandler(
- parser->m_handlerArg, (const XML_Char *)s,
- (int)((const XML_Char *)end - (const XML_Char *)s));
- } else if (parser->m_defaultHandler)
- reportDefault(parser, enc, s, end);
- /* We are at the end of the final buffer, should we check for
- XML_SUSPENDED, XML_FINISHED?
- */
- if (startTagLevel == 0) {
- *eventPP = end;
- return XML_ERROR_NO_ELEMENTS;
- }
- if (parser->m_tagLevel != startTagLevel) {
- *eventPP = end;
- return XML_ERROR_ASYNC_ENTITY;
- }
- *nextPtr = end;
- return XML_ERROR_NONE;
- case XML_TOK_DATA_CHARS: {
- XML_CharacterDataHandler charDataHandler = parser->m_characterDataHandler;
- if (charDataHandler) {
- if (MUST_CONVERT(enc, s)) {
- for (;;) {
- ICHAR *dataPtr = (ICHAR *)parser->m_dataBuf;
- const enum XML_Convert_Result convert_res = XmlConvert(
- enc, &s, next, &dataPtr, (ICHAR *)parser->m_dataBufEnd);
- *eventEndPP = s;
- charDataHandler(parser->m_handlerArg, parser->m_dataBuf,
- (int)(dataPtr - (ICHAR *)parser->m_dataBuf));
- if ((convert_res == XML_CONVERT_COMPLETED)
- || (convert_res == XML_CONVERT_INPUT_INCOMPLETE))
- break;
- *eventPP = s;
- }
- } else
- charDataHandler(parser->m_handlerArg, (const XML_Char *)s,
- (int)((const XML_Char *)next - (const XML_Char *)s));
- } else if (parser->m_defaultHandler)
- reportDefault(parser, enc, s, next);
- } break;
- case XML_TOK_PI:
- if (! reportProcessingInstruction(parser, enc, s, next))
- return XML_ERROR_NO_MEMORY;
- break;
- case XML_TOK_COMMENT:
- if (! reportComment(parser, enc, s, next))
- return XML_ERROR_NO_MEMORY;
- break;
- default:
- /* All of the tokens produced by XmlContentTok() have their own
- * explicit cases, so this default is not strictly necessary.
- * However it is a useful safety net, so we retain the code and
- * simply exclude it from the coverage tests.
- *
- * LCOV_EXCL_START
- */
- if (parser->m_defaultHandler)
- reportDefault(parser, enc, s, next);
- break;
- /* LCOV_EXCL_STOP */
- }
- *eventPP = s = next;
- switch (parser->m_parsingStatus.parsing) {
- case XML_SUSPENDED:
- *nextPtr = next;
- return XML_ERROR_NONE;
- case XML_FINISHED:
- return XML_ERROR_ABORTED;
- default:;
- }
- }
- /* not reached */
- }
- /* Retire a chain of namespace bindings.
-  *
-  * Walks the list linked through nextTagBinding. For each entry the
-  * application's end-namespace-declaration handler (when one is installed)
-  * is called with the prefix name; this pairs with the start handler call
-  * made when the binding was added. The entry is then pushed onto
-  * parser->m_freeBindingList and its prefix is pointed back at
-  * prevPrefixBinding. Nothing is handed to free() here: the entries stay
-  * on the parser's free list, where they can be reused or freed later.
-  */
- static void
- freeBindings(XML_Parser parser, BINDING *bindings) {
-   BINDING *current;
-   BINDING *following;
-   for (current = bindings; current != NULL; current = following) {
-     if (parser->m_endNamespaceDeclHandler != NULL) {
-       parser->m_endNamespaceDeclHandler(parser->m_handlerArg,
-                                         current->prefix->name);
-     }
-     /* Read the successor only after the handler has run, then relink. */
-     following = current->nextTagBinding;
-     current->nextTagBinding = parser->m_freeBindingList;
-     parser->m_freeBindingList = current;
-     current->prefix->binding = current->prevPrefixBinding;
-   }
- }
- /* Precondition: all arguments must be non-NULL;
- Purpose:
- - normalize attributes
- - check attributes for well-formedness
- - generate namespace aware attribute names (URI, prefix)
- - build list of attributes for startElementHandler
- - default attributes
- - process namespace declarations (check and report them)
- - generate namespace aware element name (URI, prefix)
- Parameters:
- - parser: parser whose m_atts array (and m_attInfo when XML_ATTR_INFO is
- defined), m_nsAtts hash table and m_tempPool are used and grown here
- - enc: encoding handed to the tokenizer and string-storage helpers
- - attStr: raw input passed to XmlGetAttributes()
- - tagNamePtr: element name; str is read for the element type lookup and,
- when namespace processing is on and a binding applies, localPart,
- uriLen, prefix, prefixLen and str are rewritten for the expanded name
- - bindingsPtr: list head passed to addBinding() for namespace declarations
- - account: forwarded to storeAttributeValue()
- Returns XML_ERROR_NONE on success, otherwise XML_ERROR_NO_MEMORY,
- XML_ERROR_DUPLICATE_ATTRIBUTE, XML_ERROR_UNBOUND_PREFIX, or the error
- reported by storeAttributeValue() or addBinding().
- */
- static enum XML_Error
- storeAtts(XML_Parser parser, const ENCODING *enc, const char *attStr,
- TAG_NAME *tagNamePtr, BINDING **bindingsPtr,
- enum XML_Account account) {
- DTD *const dtd = parser->m_dtd; /* save one level of indirection */
- ELEMENT_TYPE *elementType;
- int nDefaultAtts;
- const XML_Char **appAtts; /* the attribute list for the application */
- int attIndex = 0;
- int prefixLen;
- int i;
- int n;
- XML_Char *uri;
- int nPrefixes = 0;
- BINDING *binding;
- const XML_Char *localPart;
- /* lookup the element type name */
- elementType
- = (ELEMENT_TYPE *)lookup(parser, &dtd->elementTypes, tagNamePtr->str, 0);
- if (! elementType) {
- const XML_Char *name = poolCopyString(&dtd->pool, tagNamePtr->str);
- if (! name)
- return XML_ERROR_NO_MEMORY;
- elementType = (ELEMENT_TYPE *)lookup(parser, &dtd->elementTypes, name,
- sizeof(ELEMENT_TYPE));
- if (! elementType)
- return XML_ERROR_NO_MEMORY;
- if (parser->m_ns && ! setElementTypePrefix(parser, elementType))
- return XML_ERROR_NO_MEMORY;
- }
- nDefaultAtts = elementType->nDefaultAtts;
- /* get the attributes from the tokenizer */
- n = XmlGetAttributes(enc, attStr, parser->m_attsSize, parser->m_atts);
- /* Detect and prevent integer overflow */
- if (n > INT_MAX - nDefaultAtts) {
- return XML_ERROR_NO_MEMORY;
- }
- if (n + nDefaultAtts > parser->m_attsSize) {
- int oldAttsSize = parser->m_attsSize;
- ATTRIBUTE *temp;
- #ifdef XML_ATTR_INFO
- XML_AttrInfo *temp2;
- #endif
- /* Detect and prevent integer overflow */
- if ((nDefaultAtts > INT_MAX - INIT_ATTS_SIZE)
- || (n > INT_MAX - (nDefaultAtts + INIT_ATTS_SIZE))) {
- return XML_ERROR_NO_MEMORY;
- }
- parser->m_attsSize = n + nDefaultAtts + INIT_ATTS_SIZE;
- /* Detect and prevent integer overflow.
- * The preprocessor guard addresses the "always false" warning
- * from -Wtype-limits on platforms where
- * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
- #if UINT_MAX >= SIZE_MAX
- if ((unsigned)parser->m_attsSize > (size_t)(-1) / sizeof(ATTRIBUTE)) {
- parser->m_attsSize = oldAttsSize;
- return XML_ERROR_NO_MEMORY;
- }
- #endif
- temp = (ATTRIBUTE *)REALLOC(parser, (void *)parser->m_atts,
- parser->m_attsSize * sizeof(ATTRIBUTE));
- if (temp == NULL) {
- parser->m_attsSize = oldAttsSize;
- return XML_ERROR_NO_MEMORY;
- }
- parser->m_atts = temp;
- #ifdef XML_ATTR_INFO
- /* Detect and prevent integer overflow.
- * The preprocessor guard addresses the "always false" warning
- * from -Wtype-limits on platforms where
- * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
- # if UINT_MAX >= SIZE_MAX
- if ((unsigned)parser->m_attsSize > (size_t)(-1) / sizeof(XML_AttrInfo)) {
- parser->m_attsSize = oldAttsSize;
- return XML_ERROR_NO_MEMORY;
- }
- # endif
- temp2 = (XML_AttrInfo *)REALLOC(parser, (void *)parser->m_attInfo,
- parser->m_attsSize * sizeof(XML_AttrInfo));
- if (temp2 == NULL) {
- parser->m_attsSize = oldAttsSize;
- return XML_ERROR_NO_MEMORY;
- }
- parser->m_attInfo = temp2;
- #endif
- if (n > oldAttsSize) /* NOTE(review): presumably the first call could only fill oldAttsSize entries, hence the second pass */
- XmlGetAttributes(enc, attStr, n, parser->m_atts);
- }
- appAtts = (const XML_Char **)parser->m_atts;
- for (i = 0; i < n; i++) {
- ATTRIBUTE *currAtt = &parser->m_atts[i];
- #ifdef XML_ATTR_INFO
- XML_AttrInfo *currAttInfo = &parser->m_attInfo[i];
- #endif
- /* add the name and value to the attribute list */
- ATTRIBUTE_ID *attId
- = getAttributeId(parser, enc, currAtt->name,
- currAtt->name + XmlNameLength(enc, currAtt->name));
- if (! attId)
- return XML_ERROR_NO_MEMORY;
- #ifdef XML_ATTR_INFO
- currAttInfo->nameStart
- = parser->m_parseEndByteIndex - (parser->m_parseEndPtr - currAtt->name);
- currAttInfo->nameEnd
- = currAttInfo->nameStart + XmlNameLength(enc, currAtt->name);
- currAttInfo->valueStart = parser->m_parseEndByteIndex
- - (parser->m_parseEndPtr - currAtt->valuePtr);
- currAttInfo->valueEnd = parser->m_parseEndByteIndex
- - (parser->m_parseEndPtr - currAtt->valueEnd);
- #endif
- /* Detect duplicate attributes by their QNames. This does not work when
- namespace processing is turned on and different prefixes for the same
- namespace are used. For this case we have a check further down.
- The XML_Char stored just before attId->name is the marker: non-zero
- means the attribute was already seen for this tag (1 = seen, 2 =
- prefixed name that still has to be expanded). The markers of all
- listed attributes and bindings are reset to 0 further down, before
- any successful return.
- */
- if ((attId->name)[-1]) {
- if (enc == parser->m_encoding)
- parser->m_eventPtr = parser->m_atts[i].name;
- return XML_ERROR_DUPLICATE_ATTRIBUTE;
- }
- (attId->name)[-1] = 1;
- appAtts[attIndex++] = attId->name;
- if (! parser->m_atts[i].normalized) {
- enum XML_Error result;
- XML_Bool isCdata = XML_TRUE;
- /* figure out whether declared as other than CDATA */
- if (attId->maybeTokenized) {
- int j;
- for (j = 0; j < nDefaultAtts; j++) {
- if (attId == elementType->defaultAtts[j].id) {
- isCdata = elementType->defaultAtts[j].isCdata;
- break;
- }
- }
- }
- /* normalize the attribute value */
- result = storeAttributeValue(
- parser, enc, isCdata, parser->m_atts[i].valuePtr,
- parser->m_atts[i].valueEnd, &parser->m_tempPool, account);
- if (result)
- return result;
- appAtts[attIndex] = poolStart(&parser->m_tempPool);
- poolFinish(&parser->m_tempPool);
- } else {
- /* the value did not need normalizing */
- appAtts[attIndex] = poolStoreString(&parser->m_tempPool, enc,
- parser->m_atts[i].valuePtr,
- parser->m_atts[i].valueEnd);
- if (appAtts[attIndex] == 0)
- return XML_ERROR_NO_MEMORY;
- poolFinish(&parser->m_tempPool);
- }
- /* handle prefixed attribute names */
- if (attId->prefix) {
- if (attId->xmlns) {
- /* deal with namespace declarations here */
- enum XML_Error result = addBinding(parser, attId->prefix, attId,
- appAtts[attIndex], bindingsPtr);
- if (result)
- return result;
- --attIndex; /* give the name slot back: the declaration is not kept in appAtts */
- } else {
- /* deal with other prefixed names later */
- attIndex++;
- nPrefixes++;
- (attId->name)[-1] = 2;
- }
- } else
- attIndex++;
- }
- /* set-up for XML_GetSpecifiedAttributeCount and XML_GetIdAttributeIndex */
- parser->m_nSpecifiedAtts = attIndex;
- if (elementType->idAtt && (elementType->idAtt->name)[-1]) {
- for (i = 0; i < attIndex; i += 2) /* names sit at even indices, values at odd ones */
- if (appAtts[i] == elementType->idAtt->name) {
- parser->m_idAttIndex = i;
- break;
- }
- } else
- parser->m_idAttIndex = -1;
- /* do attribute defaulting */
- for (i = 0; i < nDefaultAtts; i++) {
- const DEFAULT_ATTRIBUTE *da = elementType->defaultAtts + i;
- if (! (da->id->name)[-1] && da->value) {
- if (da->id->prefix) {
- if (da->id->xmlns) {
- enum XML_Error result = addBinding(parser, da->id->prefix, da->id,
- da->value, bindingsPtr);
- if (result)
- return result;
- } else {
- (da->id->name)[-1] = 2;
- nPrefixes++;
- appAtts[attIndex++] = da->id->name;
- appAtts[attIndex++] = da->value;
- }
- } else {
- (da->id->name)[-1] = 1;
- appAtts[attIndex++] = da->id->name;
- appAtts[attIndex++] = da->value;
- }
- }
- }
- appAtts[attIndex] = 0; /* terminate the name/value list */
- /* expand prefixed attribute names, check for duplicates,
- and clear flags that say whether attributes were specified */
- i = 0;
- if (nPrefixes) {
- int j; /* hash table index */
- unsigned long version = parser->m_nsAttsVersion;
- /* Detect and prevent invalid shift */
- if (parser->m_nsAttsPower >= sizeof(unsigned int) * 8 /* bits per byte */) {
- return XML_ERROR_NO_MEMORY;
- }
- unsigned int nsAttsSize = 1u << parser->m_nsAttsPower;
- unsigned char oldNsAttsPower = parser->m_nsAttsPower;
- /* size of hash table must be at least 2 * (# of prefixed attributes) */
- if ((nPrefixes << 1)
- >> parser->m_nsAttsPower) { /* true for m_nsAttsPower = 0 */
- NS_ATT *temp;
- /* hash table size must also be a power of 2 and >= 8 */
- while (nPrefixes >> parser->m_nsAttsPower++)
- ;
- if (parser->m_nsAttsPower < 3)
- parser->m_nsAttsPower = 3;
- /* Detect and prevent invalid shift */
- if (parser->m_nsAttsPower >= sizeof(nsAttsSize) * 8 /* bits per byte */) {
- /* Restore actual size of memory in m_nsAtts */
- parser->m_nsAttsPower = oldNsAttsPower;
- return XML_ERROR_NO_MEMORY;
- }
- nsAttsSize = 1u << parser->m_nsAttsPower;
- /* Detect and prevent integer overflow.
- * The preprocessor guard addresses the "always false" warning
- * from -Wtype-limits on platforms where
- * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
- #if UINT_MAX >= SIZE_MAX
- if (nsAttsSize > (size_t)(-1) / sizeof(NS_ATT)) {
- /* Restore actual size of memory in m_nsAtts */
- parser->m_nsAttsPower = oldNsAttsPower;
- return XML_ERROR_NO_MEMORY;
- }
- #endif
- temp = (NS_ATT *)REALLOC(parser, parser->m_nsAtts,
- nsAttsSize * sizeof(NS_ATT));
- if (! temp) {
- /* Restore actual size of memory in m_nsAtts */
- parser->m_nsAttsPower = oldNsAttsPower;
- return XML_ERROR_NO_MEMORY;
- }
- parser->m_nsAtts = temp;
- version = 0; /* force re-initialization of m_nsAtts hash table */
- }
- /* using a version flag saves us from initializing m_nsAtts every time */
- if (! version) { /* initialize version flags when version wraps around */
- version = INIT_ATTS_VERSION;
- for (j = nsAttsSize; j != 0;)
- parser->m_nsAtts[--j].version = version;
- }
- parser->m_nsAttsVersion = --version;
- /* expand prefixed names and check for duplicates */
- for (; i < attIndex; i += 2) {
- const XML_Char *s = appAtts[i];
- if (s[-1] == 2) { /* prefixed */
- ATTRIBUTE_ID *id;
- const BINDING *b;
- unsigned long uriHash;
- struct siphash sip_state;
- struct sipkey sip_key;
- copy_salt_to_sipkey(parser, &sip_key);
- sip24_init(&sip_state, &sip_key);
- ((XML_Char *)s)[-1] = 0; /* clear flag */
- id = (ATTRIBUTE_ID *)lookup(parser, &dtd->attributeIds, s, 0);
- if (! id || ! id->prefix) {
- /* This code is walking through the appAtts array, dealing
- * with (in this case) a prefixed attribute name. To be in
- * the array, the attribute must have already been bound, so
- * has to have passed through the hash table lookup once
- * already. That implies that an entry for it already
- * exists, so the lookup above will return a pointer to
- * already allocated memory. There is no opportunity for
- * the allocator to fail, so the condition above cannot be
- * fulfilled.
- *
- * Since it is difficult to be certain that the above
- * analysis is complete, we retain the test and merely
- * remove the code from coverage tests.
- */
- return XML_ERROR_NO_MEMORY; /* LCOV_EXCL_LINE */
- }
- b = id->prefix->binding;
- if (! b)
- return XML_ERROR_UNBOUND_PREFIX;
- for (j = 0; j < b->uriLen; j++) {
- const XML_Char c = b->uri[j];
- if (! poolAppendChar(&parser->m_tempPool, c))
- return XML_ERROR_NO_MEMORY;
- }
- sip24_update(&sip_state, b->uri, b->uriLen * sizeof(XML_Char));
- while (*s++ != XML_T(ASCII_COLON))
- ;
- sip24_update(&sip_state, s, keylen(s) * sizeof(XML_Char));
- do { /* copies null terminator */
- if (! poolAppendChar(&parser->m_tempPool, *s))
- return XML_ERROR_NO_MEMORY;
- } while (*s++);
- uriHash = (unsigned long)sip24_final(&sip_state);
- { /* Check hash table for duplicate of expanded name (uriName).
- Derived from code in lookup(parser, HASH_TABLE *table, ...).
- */
- unsigned char step = 0;
- unsigned long mask = nsAttsSize - 1;
- j = uriHash & mask; /* index into hash table */
- while (parser->m_nsAtts[j].version == version) {
- /* for speed we compare stored hash values first */
- if (uriHash == parser->m_nsAtts[j].hash) {
- const XML_Char *s1 = poolStart(&parser->m_tempPool);
- const XML_Char *s2 = parser->m_nsAtts[j].uriName;
- /* s1 is null terminated, but not s2 */
- for (; *s1 == *s2 && *s1 != 0; s1++, s2++)
- ;
- if (*s1 == 0)
- return XML_ERROR_DUPLICATE_ATTRIBUTE;
- }
- if (! step)
- step = PROBE_STEP(uriHash, mask, parser->m_nsAttsPower);
- j < step ? (j += nsAttsSize - step) : (j -= step);
- }
- }
- if (parser->m_ns_triplets) { /* append namespace separator and prefix */
- parser->m_tempPool.ptr[-1] = parser->m_namespaceSeparator;
- s = b->prefix->name;
- do {
- if (! poolAppendChar(&parser->m_tempPool, *s))
- return XML_ERROR_NO_MEMORY;
- } while (*s++);
- }
- /* store expanded name in attribute list */
- s = poolStart(&parser->m_tempPool);
- poolFinish(&parser->m_tempPool);
- appAtts[i] = s;
- /* fill empty slot with new version, uriName and hash value */
- parser->m_nsAtts[j].version = version;
- parser->m_nsAtts[j].hash = uriHash;
- parser->m_nsAtts[j].uriName = s;
- if (! --nPrefixes) { /* last prefixed name done; the loop after this block clears the remaining flags */
- i += 2;
- break;
- }
- } else /* not prefixed */
- ((XML_Char *)s)[-1] = 0; /* clear flag */
- }
- }
- /* clear flags for the remaining attributes */
- for (; i < attIndex; i += 2)
- ((XML_Char *)(appAtts[i]))[-1] = 0;
- for (binding = *bindingsPtr; binding; binding = binding->nextTagBinding)
- binding->attId->name[-1] = 0;
- if (! parser->m_ns)
- return XML_ERROR_NONE;
- /* expand the element type name */
- if (elementType->prefix) {
- binding = elementType->prefix->binding;
- if (! binding)
- return XML_ERROR_UNBOUND_PREFIX;
- localPart = tagNamePtr->str;
- while (*localPart++ != XML_T(ASCII_COLON))
- ;
- } else if (dtd->defaultPrefix.binding) {
- binding = dtd->defaultPrefix.binding;
- localPart = tagNamePtr->str;
- } else
- return XML_ERROR_NONE;
- prefixLen = 0;
- if (parser->m_ns_triplets && binding->prefix->name) {
- for (; binding->prefix->name[prefixLen++];)
- ; /* prefixLen includes null terminator */
- }
- tagNamePtr->localPart = localPart;
- tagNamePtr->uriLen = binding->uriLen;
- tagNamePtr->prefix = binding->prefix->name;
- tagNamePtr->prefixLen = prefixLen;
- for (i = 0; localPart[i++];)
- ; /* i includes null terminator */
- /* Detect and prevent integer overflow */
- if (binding->uriLen > INT_MAX - prefixLen
- || i > INT_MAX - (binding->uriLen + prefixLen)) {
- return XML_ERROR_NO_MEMORY;
- }
- n = i + binding->uriLen + prefixLen;
- if (n > binding->uriAlloc) {
- TAG *p;
- /* Detect and prevent integer overflow */
- if (n > INT_MAX - EXPAND_SPARE) {
- return XML_ERROR_NO_MEMORY;
- }
- /* Detect and prevent integer overflow.
- * The preprocessor guard addresses the "always false" warning
- * from -Wtype-limits on platforms where
- * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
- #if UINT_MAX >= SIZE_MAX
- if ((unsigned)(n + EXPAND_SPARE) > (size_t)(-1) / sizeof(XML_Char)) {
- return XML_ERROR_NO_MEMORY;
- }
- #endif
- uri = (XML_Char *)MALLOC(parser, (n + EXPAND_SPARE) * sizeof(XML_Char));
- if (! uri)
- return XML_ERROR_NO_MEMORY;
- binding->uriAlloc = n + EXPAND_SPARE;
- memcpy(uri, binding->uri, binding->uriLen * sizeof(XML_Char));
- for (p = parser->m_tagStack; p; p = p->parent)
- if (p->name.str == binding->uri)
- p->name.str = uri;
- FREE(parser, binding->uri);
- binding->uri = uri;
- }
- /* if m_namespaceSeparator != '\0' then uri includes it already */
- uri = binding->uri + binding->uriLen;
- memcpy(uri, localPart, i * sizeof(XML_Char));
- /* we always have a namespace separator between localPart and prefix */
- if (prefixLen) {
- uri += i - 1;
- *uri = parser->m_namespaceSeparator; /* replace null terminator */
- memcpy(uri + 1, binding->prefix->name, prefixLen * sizeof(XML_Char));
- }
- tagNamePtr->str = binding->uri;
- return XML_ERROR_NONE;
- }
- /* Tell whether a character belongs to the RFC 3986 URI character set.
-  *
-  * The accepted set is taken from the ABNF grammar in
-  * https://datatracker.ietf.org/doc/html/rfc3986#appendix-A :
-  * ALPHA, DIGIT, the '%' of "pct-encoded", "unreserved" (- . _ ~),
-  * "gen-delims" (: / ? # [ ] @) and "sub-delims" (! $ & ' ( ) * + , ; =).
-  *
-  * Returns XML_TRUE for a member of that set and XML_FALSE for any other
-  * value, including the null character.
-  */
- static XML_Bool
- is_rfc3986_uri_char(XML_Char candidate) {
-   /* Order: ALPHA upper, ALPHA lower, DIGIT, '%', unreserved, gen-delims,
-    * sub-delims. The terminating null only ends the scan; it is never
-    * compared against the candidate. */
-   static const char uriChars[]
-       = "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789%-._~:/?#[]@!$&'()*+,;=";
-   const char *cursor;
-   for (cursor = uriChars; *cursor != '\0'; cursor++) {
-     if (candidate == (XML_Char)*cursor)
-       return XML_TRUE;
-   }
-   return XML_FALSE;
- }
- /* addBinding() overwrites the value of prefix->binding without checking.
- Therefore one must keep track of the old value outside of addBinding().
- */
- static enum XML_Error
- addBinding(XML_Parser parser, PREFIX *prefix, const ATTRIBUTE_ID *attId,
- const XML_Char *uri, BINDING **bindingsPtr) {
- // "http://www.w3.org/XML/1998/namespace"
- static const XML_Char xmlNamespace[]
- = {ASCII_h, ASCII_t, ASCII_t, ASCII_p, ASCII_COLON,
- ASCII_SLASH, ASCII_SLASH, ASCII_w, ASCII_w, ASCII_w,
- ASCII_PERIOD, ASCII_w, ASCII_3, ASCII_PERIOD, ASCII_o,
- ASCII_r, ASCII_g, ASCII_SLASH, ASCII_X, ASCII_M,
- ASCII_L, ASCII_SLASH, ASCII_1, ASCII_9, ASCII_9,
- ASCII_8, ASCII_SLASH, ASCII_n, ASCII_a, ASCII_m,
- ASCII_e, ASCII_s, ASCII_p, ASCII_a, ASCII_c,
- ASCII_e, '\0'};
- static const int xmlLen = (int)sizeof(xmlNamespace) / sizeof(XML_Char) - 1;
- // "http://www.w3.org/2000/xmlns/"
- static const XML_Char xmlnsNamespace[]
- = {ASCII_h, ASCII_t, ASCII_t, ASCII_p, ASCII_COLON, ASCII_SLASH,
- ASCII_SLASH, ASCII_w, ASCII_w, ASCII_w, ASCII_PERIOD, ASCII_w,
- ASCII_3, ASCII_PERIOD, ASCII_o, ASCII_r, ASCII_g, ASCII_SLASH,
- ASCII_2, ASCII_0, ASCII_0, ASCII_0, ASCII_SLASH, ASCII_x,
- ASCII_m, ASCII_l, ASCII_n, ASCII_s, ASCII_SLASH, '\0'};
- static const int xmlnsLen
- = (int)sizeof(xmlnsNamespace) / sizeof(XML_Char) - 1;
- XML_Bool mustBeXML = XML_FALSE;
- XML_Bool isXML = XML_TRUE;
- XML_Bool isXMLNS = XML_TRUE;
- BINDING *b;
- int len;
- /* empty URI is only valid for default namespace per XML NS 1.0 (not 1.1) */
- if (*uri == XML_T('\0') && prefix->name)
- return XML_ERROR_UNDECLARING_PREFIX;
- if (prefix->name && prefix->name[0] == XML_T(ASCII_x)
- && prefix->name[1] == XML_T(ASCII_m)
- && prefix->name[2] == XML_T(ASCII_l)) {
- /* Not allowed to bind xmlns */
- if (prefix->name[3] == XML_T(ASCII_n) && prefix->name[4] == XML_T(ASCII_s)
- && prefix->name[5] == XML_T('\0'))
- return XML_ERROR_RESERVED_PREFIX_XMLNS;
- if (prefix->name[3] == XML_T('\0'))
- mustBeXML = XML_TRUE;
- }
- for (len = 0; uri[len]; len++) {
- if (isXML && (len > xmlLen || uri[len] != xmlNamespace[len]))
- isXML = XML_FALSE;
- if (! mustBeXML && isXMLNS
- && (len > xmlnsLen || uri[len] != xmlnsNamespace[len]))
- isXMLNS = XML_FALSE;
- // NOTE: While Expat does not validate namespace URIs against RFC 3986
- // today (and is not REQUIRED to do so with regard to the XML 1.0
- // namespaces specification) we have to at least make sure, that
- // the application on top of Expat (that is likely splitting expanded
- // element names ("qualified names") of form
- // "[uri sep] local [sep prefix] '\0'" back into 1, 2 or 3 pieces
- // in its element handler code) cannot be confused by an attacker
- // putting additional namespace separator characters into namespace
- // declarations. That would be ambiguous and not to be expected.
- //
- // While the HTML API docs of function XML_ParserCreateNS have been
- // advising against use of a namespace separator character that can
- // appear in a URI for >20 years now, some widespread applications
- // are using URI characters (':' (colon) in particular) for a
- // namespace separator, in practice. To keep these applications
- // functional, we only reject namespaces URIs containing the
- // application-chosen namespace separator if the chosen separator
- // is a non-URI character with regard to RFC 3986.
- if (parser->m_ns && (uri[len] == parser->m_namespaceSeparator)
- && ! is_rfc3986_uri_char(uri[len])) {
- return XML_ERROR_SYNTAX;
- }
- }
- isXML = isXML && len == xmlLen;
- isXMLNS = isXMLNS && len == xmlnsLen;
- if (mustBeXML != isXML)
- return mustBeXML ? XML_ERROR_RESERVED_PREFIX_XML
- : XML_ERROR_RESERVED_NAMESPACE_URI;
- if (isXMLNS)
- return XML_ERROR_RESERVED_NAMESPACE_URI;
- if (parser->m_namespaceSeparator)
- len++;
- if (parser->m_freeBindingList) {
- b = parser->m_freeBindingList;
- if (len > b->uriAlloc) {
- /* Detect and prevent integer overflow */
- if (len > INT_MAX - EXPAND_SPARE) {
- return XML_ERROR_NO_MEMORY;
- }
- /* Detect and prevent integer overflow.
- * The preprocessor guard addresses the "always false" warning
- * from -Wtype-limits on platforms where
- * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
- #if UINT_MAX >= SIZE_MAX
- if ((unsigned)(len + EXPAND_SPARE) > (size_t)(-1) / sizeof(XML_Char)) {
- return XML_ERROR_NO_MEMORY;
- }
- #endif
- XML_Char *temp = (XML_Char *)REALLOC(
- parser, b->uri, sizeof(XML_Char) * (len + EXPAND_SPARE));
- if (temp == NULL)
- return XML_ERROR_NO_MEMORY;
- b->uri = temp;
- b->uriAlloc = len + EXPAND_SPARE;
- }
- parser->m_freeBindingList = b->nextTagBinding;
- } else {
- b = (BINDING *)MALLOC(parser, sizeof(BINDING));
- if (! b)
- return XML_ERROR_NO_MEMORY;
- /* Detect and prevent integer overflow */
- if (len > INT_MAX - EXPAND_SPARE) {
- return XML_ERROR_NO_MEMORY;
- }
- /* Detect and prevent integer overflow.
- * The preprocessor guard addresses the "always false" warning
- * from -Wtype-limits on platforms where
- * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
- #if UINT_MAX >= SIZE_MAX
- if ((unsigned)(len + EXPAND_SPARE) > (size_t)(-1) / sizeof(XML_Char)) {
- return XML_ERROR_NO_MEMORY;
- }
- #endif
- b->uri
- = (XML_Char *)MALLOC(parser, sizeof(XML_Char) * (len + EXPAND_SPARE));
- if (! b->uri) {
- FREE(parser, b);
- return XML_ERROR_NO_MEMORY;
- }
- b->uriAlloc = len + EXPAND_SPARE;
- }
- b->uriLen = len;
- memcpy(b->uri, uri, len * sizeof(XML_Char));
- if (parser->m_namespaceSeparator)
- b->uri[len - 1] = parser->m_namespaceSeparator;
- b->prefix = prefix;
- b->attId = attId;
- b->prevPrefixBinding = prefix->binding;
- /* NULL binding when default namespace undeclared */
- if (*uri == XML_T('\0') && prefix == &parser->m_dtd->defaultPrefix)
- prefix->binding = NULL;
- else
- prefix->binding = b;
- b->nextTagBinding = *bindingsPtr;
- *bindingsPtr = b;
- /* if attId == NULL then we are not starting a namespace scope */
- if (attId && parser->m_startNamespaceDeclHandler)
- parser->m_startNamespaceDeclHandler(parser->m_handlerArg, prefix->name,
- prefix->binding ? uri : 0);
- return XML_ERROR_NONE;
- }
- /* The idea here is to avoid using stack for each CDATA section when
- the whole file is parsed with one call.
- */
- static enum XML_Error PTRCALL
- cdataSectionProcessor(XML_Parser parser, const char *start, const char *end,
- const char **endPtr) {
- enum XML_Error result = doCdataSection(
- parser, parser->m_encoding, &start, end, endPtr,
- (XML_Bool)! parser->m_parsingStatus.finalBuffer, XML_ACCOUNT_DIRECT);
- if (result != XML_ERROR_NONE)
- return result;
- if (start) {
- if (parser->m_parentParser) { /* we are parsing an external entity */
- parser->m_processor = externalEntityContentProcessor;
- return externalEntityContentProcessor(parser, start, end, endPtr);
- } else {
- parser->m_processor = contentProcessor;
- return contentProcessor(parser, start, end, endPtr);
- }
- }
- return result;
- }
- /* startPtr gets set to non-null if the section is closed, and to null if
- the section is not yet closed.
- */
- static enum XML_Error
- doCdataSection(XML_Parser parser, const ENCODING *enc, const char **startPtr,
- const char *end, const char **nextPtr, XML_Bool haveMore,
- enum XML_Account account) {
- const char *s = *startPtr;
- const char **eventPP;
- const char **eventEndPP;
- if (enc == parser->m_encoding) {
- eventPP = &parser->m_eventPtr;
- *eventPP = s;
- eventEndPP = &parser->m_eventEndPtr;
- } else {
- eventPP = &(parser->m_openInternalEntities->internalEventPtr);
- eventEndPP = &(parser->m_openInternalEntities->internalEventEndPtr);
- }
- *eventPP = s;
- *startPtr = NULL;
- for (;;) {
- const char *next = s; /* in case of XML_TOK_NONE or XML_TOK_PARTIAL */
- int tok = XmlCdataSectionTok(enc, s, end, &next);
- #if XML_GE == 1
- if (! accountingDiffTolerated(parser, tok, s, next, __LINE__, account)) {
- accountingOnAbort(parser);
- return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
- }
- #else
- UNUSED_P(account);
- #endif
- *eventEndPP = next;
- switch (tok) {
- case XML_TOK_CDATA_SECT_CLOSE:
- if (parser->m_endCdataSectionHandler)
- parser->m_endCdataSectionHandler(parser->m_handlerArg);
- /* BEGIN disabled code */
- /* see comment under XML_TOK_CDATA_SECT_OPEN */
- else if ((0) && parser->m_characterDataHandler)
- parser->m_characterDataHandler(parser->m_handlerArg, parser->m_dataBuf,
- 0);
- /* END disabled code */
- else if (parser->m_defaultHandler)
- reportDefault(parser, enc, s, next);
- *startPtr = next;
- *nextPtr = next;
- if (parser->m_parsingStatus.parsing == XML_FINISHED)
- return XML_ERROR_ABORTED;
- else
- return XML_ERROR_NONE;
- case XML_TOK_DATA_NEWLINE:
- if (parser->m_characterDataHandler) {
- XML_Char c = 0xA;
- parser->m_characterDataHandler(parser->m_handlerArg, &c, 1);
- } else if (parser->m_defaultHandler)
- reportDefault(parser, enc, s, next);
- break;
- case XML_TOK_DATA_CHARS: {
- XML_CharacterDataHandler charDataHandler = parser->m_characterDataHandler;
- if (charDataHandler) {
- if (MUST_CONVERT(enc, s)) {
- for (;;) {
- ICHAR *dataPtr = (ICHAR *)parser->m_dataBuf;
- const enum XML_Convert_Result convert_res = XmlConvert(
- enc, &s, next, &dataPtr, (ICHAR *)parser->m_dataBufEnd);
- *eventEndPP = next;
- charDataHandler(parser->m_handlerArg, parser->m_dataBuf,
- (int)(dataPtr - (ICHAR *)parser->m_dataBuf));
- if ((convert_res == XML_CONVERT_COMPLETED)
- || (convert_res == XML_CONVERT_INPUT_INCOMPLETE))
- break;
- *eventPP = s;
- }
- } else
- charDataHandler(parser->m_handlerArg, (const XML_Char *)s,
- (int)((const XML_Char *)next - (const XML_Char *)s));
- } else if (parser->m_defaultHandler)
- reportDefault(parser, enc, s, next);
- } break;
- case XML_TOK_INVALID:
- *eventPP = next;
- return XML_ERROR_INVALID_TOKEN;
- case XML_TOK_PARTIAL_CHAR:
- if (haveMore) {
- *nextPtr = s;
- return XML_ERROR_NONE;
- }
- return XML_ERROR_PARTIAL_CHAR;
- case XML_TOK_PARTIAL:
- case XML_TOK_NONE:
- if (haveMore) {
- *nextPtr = s;
- return XML_ERROR_NONE;
- }
- return XML_ERROR_UNCLOSED_CDATA_SECTION;
- default:
- /* Every token returned by XmlCdataSectionTok() has its own
- * explicit case, so this default case will never be executed.
- * We retain it as a safety net and exclude it from the coverage
- * statistics.
- *
- * LCOV_EXCL_START
- */
- *eventPP = next;
- return XML_ERROR_UNEXPECTED_STATE;
- /* LCOV_EXCL_STOP */
- }
- *eventPP = s = next;
- switch (parser->m_parsingStatus.parsing) {
- case XML_SUSPENDED:
- *nextPtr = next;
- return XML_ERROR_NONE;
- case XML_FINISHED:
- return XML_ERROR_ABORTED;
- default:;
- }
- }
- /* not reached */
- }
- #ifdef XML_DTD
- /* The idea here is to avoid using stack for each IGNORE section when
- the whole file is parsed with one call.
- */
- static enum XML_Error PTRCALL
- ignoreSectionProcessor(XML_Parser parser, const char *start, const char *end,
- const char **endPtr) {
- enum XML_Error result
- = doIgnoreSection(parser, parser->m_encoding, &start, end, endPtr,
- (XML_Bool)! parser->m_parsingStatus.finalBuffer);
- if (result != XML_ERROR_NONE)
- return result;
- if (start) {
- parser->m_processor = prologProcessor;
- return prologProcessor(parser, start, end, endPtr);
- }
- return result;
- }
- /* startPtr gets set to non-null is the section is closed, and to null
- if the section is not yet closed.
- */
- static enum XML_Error
- doIgnoreSection(XML_Parser parser, const ENCODING *enc, const char **startPtr,
- const char *end, const char **nextPtr, XML_Bool haveMore) {
- const char *next = *startPtr; /* in case of XML_TOK_NONE or XML_TOK_PARTIAL */
- int tok;
- const char *s = *startPtr;
- const char **eventPP;
- const char **eventEndPP;
- if (enc == parser->m_encoding) {
- eventPP = &parser->m_eventPtr;
- *eventPP = s;
- eventEndPP = &parser->m_eventEndPtr;
- } else {
- /* It's not entirely clear, but it seems the following two lines
- * of code cannot be executed. The only occasions on which 'enc'
- * is not 'encoding' are when this function is called
- * from the internal entity processing, and IGNORE sections are an
- * error in internal entities.
- *
- * Since it really isn't clear that this is true, we keep the code
- * and just remove it from our coverage tests.
- *
- * LCOV_EXCL_START
- */
- eventPP = &(parser->m_openInternalEntities->internalEventPtr);
- eventEndPP = &(parser->m_openInternalEntities->internalEventEndPtr);
- /* LCOV_EXCL_STOP */
- }
- *eventPP = s;
- *startPtr = NULL;
- tok = XmlIgnoreSectionTok(enc, s, end, &next);
- # if XML_GE == 1
- if (! accountingDiffTolerated(parser, tok, s, next, __LINE__,
- XML_ACCOUNT_DIRECT)) {
- accountingOnAbort(parser);
- return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
- }
- # endif
- *eventEndPP = next;
- switch (tok) {
- case XML_TOK_IGNORE_SECT:
- if (parser->m_defaultHandler)
- reportDefault(parser, enc, s, next);
- *startPtr = next;
- *nextPtr = next;
- if (parser->m_parsingStatus.parsing == XML_FINISHED)
- return XML_ERROR_ABORTED;
- else
- return XML_ERROR_NONE;
- case XML_TOK_INVALID:
- *eventPP = next;
- return XML_ERROR_INVALID_TOKEN;
- case XML_TOK_PARTIAL_CHAR:
- if (haveMore) {
- *nextPtr = s;
- return XML_ERROR_NONE;
- }
- return XML_ERROR_PARTIAL_CHAR;
- case XML_TOK_PARTIAL:
- case XML_TOK_NONE:
- if (haveMore) {
- *nextPtr = s;
- return XML_ERROR_NONE;
- }
- return XML_ERROR_SYNTAX; /* XML_ERROR_UNCLOSED_IGNORE_SECTION */
- default:
- /* All of the tokens that XmlIgnoreSectionTok() returns have
- * explicit cases to handle them, so this default case is never
- * executed. We keep it as a safety net anyway, and remove it
- * from our test coverage statistics.
- *
- * LCOV_EXCL_START
- */
- *eventPP = next;
- return XML_ERROR_UNEXPECTED_STATE;
- /* LCOV_EXCL_STOP */
- }
- /* not reached */
- }
- #endif /* XML_DTD */
- static enum XML_Error
- initializeEncoding(XML_Parser parser) {
- const char *s;
- #ifdef XML_UNICODE
- char encodingBuf[128];
- /* See comments about `protocolEncodingName` in parserInit() */
- if (! parser->m_protocolEncodingName)
- s = NULL;
- else {
- int i;
- for (i = 0; parser->m_protocolEncodingName[i]; i++) {
- if (i == sizeof(encodingBuf) - 1
- || (parser->m_protocolEncodingName[i] & ~0x7f) != 0) {
- encodingBuf[0] = '\0';
- break;
- }
- encodingBuf[i] = (char)parser->m_protocolEncodingName[i];
- }
- encodingBuf[i] = '\0';
- s = encodingBuf;
- }
- #else
- s = parser->m_protocolEncodingName;
- #endif
- if ((parser->m_ns ? XmlInitEncodingNS : XmlInitEncoding)(
- &parser->m_initEncoding, &parser->m_encoding, s))
- return XML_ERROR_NONE;
- return handleUnknownEncoding(parser, parser->m_protocolEncodingName);
- }
- static enum XML_Error
- processXmlDecl(XML_Parser parser, int isGeneralTextEntity, const char *s,
- const char *next) {
- const char *encodingName = NULL;
- const XML_Char *storedEncName = NULL;
- const ENCODING *newEncoding = NULL;
- const char *version = NULL;
- const char *versionend = NULL;
- const XML_Char *storedversion = NULL;
- int standalone = -1;
- #if XML_GE == 1
- if (! accountingDiffTolerated(parser, XML_TOK_XML_DECL, s, next, __LINE__,
- XML_ACCOUNT_DIRECT)) {
- accountingOnAbort(parser);
- return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
- }
- #endif
- if (! (parser->m_ns ? XmlParseXmlDeclNS : XmlParseXmlDecl)(
- isGeneralTextEntity, parser->m_encoding, s, next, &parser->m_eventPtr,
- &version, &versionend, &encodingName, &newEncoding, &standalone)) {
- if (isGeneralTextEntity)
- return XML_ERROR_TEXT_DECL;
- else
- return XML_ERROR_XML_DECL;
- }
- if (! isGeneralTextEntity && standalone == 1) {
- parser->m_dtd->standalone = XML_TRUE;
- #ifdef XML_DTD
- if (parser->m_paramEntityParsing
- == XML_PARAM_ENTITY_PARSING_UNLESS_STANDALONE)
- parser->m_paramEntityParsing = XML_PARAM_ENTITY_PARSING_NEVER;
- #endif /* XML_DTD */
- }
- if (parser->m_xmlDeclHandler) {
- if (encodingName != NULL) {
- storedEncName = poolStoreString(
- &parser->m_temp2Pool, parser->m_encoding, encodingName,
- encodingName + XmlNameLength(parser->m_encoding, encodingName));
- if (! storedEncName)
- return XML_ERROR_NO_MEMORY;
- poolFinish(&parser->m_temp2Pool);
- }
- if (version) {
- storedversion
- = poolStoreString(&parser->m_temp2Pool, parser->m_encoding, version,
- versionend - parser->m_encoding->minBytesPerChar);
- if (! storedversion)
- return XML_ERROR_NO_MEMORY;
- }
- parser->m_xmlDeclHandler(parser->m_handlerArg, storedversion, storedEncName,
- standalone);
- } else if (parser->m_defaultHandler)
- reportDefault(parser, parser->m_encoding, s, next);
- if (parser->m_protocolEncodingName == NULL) {
- if (newEncoding) {
- /* Check that the specified encoding does not conflict with what
- * the parser has already deduced. Do we have the same number
- * of bytes in the smallest representation of a character? If
- * this is UTF-16, is it the same endianness?
- */
- if (newEncoding->minBytesPerChar != parser->m_encoding->minBytesPerChar
- || (newEncoding->minBytesPerChar == 2
- && newEncoding != parser->m_encoding)) {
- parser->m_eventPtr = encodingName;
- return XML_ERROR_INCORRECT_ENCODING;
- }
- parser->m_encoding = newEncoding;
- } else if (encodingName) {
- enum XML_Error result;
- if (! storedEncName) {
- storedEncName = poolStoreString(
- &parser->m_temp2Pool, parser->m_encoding, encodingName,
- encodingName + XmlNameLength(parser->m_encoding, encodingName));
- if (! storedEncName)
- return XML_ERROR_NO_MEMORY;
- }
- result = handleUnknownEncoding(parser, storedEncName);
- poolClear(&parser->m_temp2Pool);
- if (result == XML_ERROR_UNKNOWN_ENCODING)
- parser->m_eventPtr = encodingName;
- return result;
- }
- }
- if (storedEncName || storedversion)
- poolClear(&parser->m_temp2Pool);
- return XML_ERROR_NONE;
- }
- static enum XML_Error
- handleUnknownEncoding(XML_Parser parser, const XML_Char *encodingName) {
- if (parser->m_unknownEncodingHandler) {
- XML_Encoding info;
- int i;
- for (i = 0; i < 256; i++)
- info.map[i] = -1;
- info.convert = NULL;
- info.data = NULL;
- info.release = NULL;
- if (parser->m_unknownEncodingHandler(parser->m_unknownEncodingHandlerData,
- encodingName, &info)) {
- ENCODING *enc;
- parser->m_unknownEncodingMem = MALLOC(parser, XmlSizeOfUnknownEncoding());
- if (! parser->m_unknownEncodingMem) {
- if (info.release)
- info.release(info.data);
- return XML_ERROR_NO_MEMORY;
- }
- enc = (parser->m_ns ? XmlInitUnknownEncodingNS : XmlInitUnknownEncoding)(
- parser->m_unknownEncodingMem, info.map, info.convert, info.data);
- if (enc) {
- parser->m_unknownEncodingData = info.data;
- parser->m_unknownEncodingRelease = info.release;
- parser->m_encoding = enc;
- return XML_ERROR_NONE;
- }
- }
- if (info.release != NULL)
- info.release(info.data);
- }
- return XML_ERROR_UNKNOWN_ENCODING;
- }
- static enum XML_Error PTRCALL
- prologInitProcessor(XML_Parser parser, const char *s, const char *end,
- const char **nextPtr) {
- enum XML_Error result = initializeEncoding(parser);
- if (result != XML_ERROR_NONE)
- return result;
- parser->m_processor = prologProcessor;
- return prologProcessor(parser, s, end, nextPtr);
- }
- #ifdef XML_DTD
- static enum XML_Error PTRCALL
- externalParEntInitProcessor(XML_Parser parser, const char *s, const char *end,
- const char **nextPtr) {
- enum XML_Error result = initializeEncoding(parser);
- if (result != XML_ERROR_NONE)
- return result;
- /* we know now that XML_Parse(Buffer) has been called,
- so we consider the external parameter entity read */
- parser->m_dtd->paramEntityRead = XML_TRUE;
- if (parser->m_prologState.inEntityValue) {
- parser->m_processor = entityValueInitProcessor;
- return entityValueInitProcessor(parser, s, end, nextPtr);
- } else {
- parser->m_processor = externalParEntProcessor;
- return externalParEntProcessor(parser, s, end, nextPtr);
- }
- }
- static enum XML_Error PTRCALL
- entityValueInitProcessor(XML_Parser parser, const char *s, const char *end,
- const char **nextPtr) {
- int tok;
- const char *start = s;
- const char *next = start;
- parser->m_eventPtr = start;
- for (;;) {
- tok = XmlPrologTok(parser->m_encoding, start, end, &next);
- /* Note: Except for XML_TOK_BOM below, these bytes are accounted later in:
- - storeEntityValue
- - processXmlDecl
- */
- parser->m_eventEndPtr = next;
- if (tok <= 0) {
- if (! parser->m_parsingStatus.finalBuffer && tok != XML_TOK_INVALID) {
- *nextPtr = s;
- return XML_ERROR_NONE;
- }
- switch (tok) {
- case XML_TOK_INVALID:
- return XML_ERROR_INVALID_TOKEN;
- case XML_TOK_PARTIAL:
- return XML_ERROR_UNCLOSED_TOKEN;
- case XML_TOK_PARTIAL_CHAR:
- return XML_ERROR_PARTIAL_CHAR;
- case XML_TOK_NONE: /* start == end */
- default:
- break;
- }
- /* found end of entity value - can store it now */
- return storeEntityValue(parser, parser->m_encoding, s, end,
- XML_ACCOUNT_DIRECT);
- } else if (tok == XML_TOK_XML_DECL) {
- enum XML_Error result;
- result = processXmlDecl(parser, 0, start, next);
- if (result != XML_ERROR_NONE)
- return result;
- /* At this point, m_parsingStatus.parsing cannot be XML_SUSPENDED. For
- * that to happen, a parameter entity parsing handler must have attempted
- * to suspend the parser, which fails and raises an error. The parser can
- * be aborted, but can't be suspended.
- */
- if (parser->m_parsingStatus.parsing == XML_FINISHED)
- return XML_ERROR_ABORTED;
- *nextPtr = next;
- /* stop scanning for text declaration - we found one */
- parser->m_processor = entityValueProcessor;
- return entityValueProcessor(parser, next, end, nextPtr);
- }
- /* XmlPrologTok has now set the encoding based on the BOM it found, and we
- must move s and nextPtr forward to consume the BOM.
- If we didn't, and got XML_TOK_NONE from the next XmlPrologTok call, we
- would leave the BOM in the buffer and return. On the next call to this
- function, our XmlPrologTok call would return XML_TOK_INVALID, since it
- is not valid to have multiple BOMs.
- */
- else if (tok == XML_TOK_BOM) {
- # if XML_GE == 1
- if (! accountingDiffTolerated(parser, tok, s, next, __LINE__,
- XML_ACCOUNT_DIRECT)) {
- accountingOnAbort(parser);
- return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
- }
- # endif
- *nextPtr = next;
- s = next;
- }
- /* If we get this token, we have the start of what might be a
- normal tag, but not a declaration (i.e. it doesn't begin with
- "<!"). In a DTD context, that isn't legal.
- */
- else if (tok == XML_TOK_INSTANCE_START) {
- *nextPtr = next;
- return XML_ERROR_SYNTAX;
- }
- start = next;
- parser->m_eventPtr = start;
- }
- }
- static enum XML_Error PTRCALL
- externalParEntProcessor(XML_Parser parser, const char *s, const char *end,
- const char **nextPtr) {
- const char *next = s;
- int tok;
- tok = XmlPrologTok(parser->m_encoding, s, end, &next);
- if (tok <= 0) {
- if (! parser->m_parsingStatus.finalBuffer && tok != XML_TOK_INVALID) {
- *nextPtr = s;
- return XML_ERROR_NONE;
- }
- switch (tok) {
- case XML_TOK_INVALID:
- return XML_ERROR_INVALID_TOKEN;
- case XML_TOK_PARTIAL:
- return XML_ERROR_UNCLOSED_TOKEN;
- case XML_TOK_PARTIAL_CHAR:
- return XML_ERROR_PARTIAL_CHAR;
- case XML_TOK_NONE: /* start == end */
- default:
- break;
- }
- }
- /* This would cause the next stage, i.e. doProlog to be passed XML_TOK_BOM.
- However, when parsing an external subset, doProlog will not accept a BOM
- as valid, and report a syntax error, so we have to skip the BOM, and
- account for the BOM bytes.
- */
- else if (tok == XML_TOK_BOM) {
- if (! accountingDiffTolerated(parser, tok, s, next, __LINE__,
- XML_ACCOUNT_DIRECT)) {
- accountingOnAbort(parser);
- return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
- }
- s = next;
- tok = XmlPrologTok(parser->m_encoding, s, end, &next);
- }
- parser->m_processor = prologProcessor;
- return doProlog(parser, parser->m_encoding, s, end, tok, next, nextPtr,
- (XML_Bool)! parser->m_parsingStatus.finalBuffer, XML_TRUE,
- XML_ACCOUNT_DIRECT);
- }
- static enum XML_Error PTRCALL
- entityValueProcessor(XML_Parser parser, const char *s, const char *end,
- const char **nextPtr) {
- const char *start = s;
- const char *next = s;
- const ENCODING *enc = parser->m_encoding;
- int tok;
- for (;;) {
- tok = XmlPrologTok(enc, start, end, &next);
- /* Note: These bytes are accounted later in:
- - storeEntityValue
- */
- if (tok <= 0) {
- if (! parser->m_parsingStatus.finalBuffer && tok != XML_TOK_INVALID) {
- *nextPtr = s;
- return XML_ERROR_NONE;
- }
- switch (tok) {
- case XML_TOK_INVALID:
- return XML_ERROR_INVALID_TOKEN;
- case XML_TOK_PARTIAL:
- return XML_ERROR_UNCLOSED_TOKEN;
- case XML_TOK_PARTIAL_CHAR:
- return XML_ERROR_PARTIAL_CHAR;
- case XML_TOK_NONE: /* start == end */
- default:
- break;
- }
- /* found end of entity value - can store it now */
- return storeEntityValue(parser, enc, s, end, XML_ACCOUNT_DIRECT);
- }
- start = next;
- }
- }
- #endif /* XML_DTD */
- static enum XML_Error PTRCALL
- prologProcessor(XML_Parser parser, const char *s, const char *end,
- const char **nextPtr) {
- const char *next = s;
- int tok = XmlPrologTok(parser->m_encoding, s, end, &next);
- return doProlog(parser, parser->m_encoding, s, end, tok, next, nextPtr,
- (XML_Bool)! parser->m_parsingStatus.finalBuffer, XML_TRUE,
- XML_ACCOUNT_DIRECT);
- }
- static enum XML_Error
- doProlog(XML_Parser parser, const ENCODING *enc, const char *s, const char *end,
- int tok, const char *next, const char **nextPtr, XML_Bool haveMore,
- XML_Bool allowClosingDoctype, enum XML_Account account) {
- #ifdef XML_DTD
- static const XML_Char externalSubsetName[] = {ASCII_HASH, '\0'};
- #endif /* XML_DTD */
- static const XML_Char atypeCDATA[]
- = {ASCII_C, ASCII_D, ASCII_A, ASCII_T, ASCII_A, '\0'};
- static const XML_Char atypeID[] = {ASCII_I, ASCII_D, '\0'};
- static const XML_Char atypeIDREF[]
- = {ASCII_I, ASCII_D, ASCII_R, ASCII_E, ASCII_F, '\0'};
- static const XML_Char atypeIDREFS[]
- = {ASCII_I, ASCII_D, ASCII_R, ASCII_E, ASCII_F, ASCII_S, '\0'};
- static const XML_Char atypeENTITY[]
- = {ASCII_E, ASCII_N, ASCII_T, ASCII_I, ASCII_T, ASCII_Y, '\0'};
- static const XML_Char atypeENTITIES[]
- = {ASCII_E, ASCII_N, ASCII_T, ASCII_I, ASCII_T,
- ASCII_I, ASCII_E, ASCII_S, '\0'};
- static const XML_Char atypeNMTOKEN[]
- = {ASCII_N, ASCII_M, ASCII_T, ASCII_O, ASCII_K, ASCII_E, ASCII_N, '\0'};
- static const XML_Char atypeNMTOKENS[]
- = {ASCII_N, ASCII_M, ASCII_T, ASCII_O, ASCII_K,
- ASCII_E, ASCII_N, ASCII_S, '\0'};
- static const XML_Char notationPrefix[]
- = {ASCII_N, ASCII_O, ASCII_T, ASCII_A, ASCII_T,
- ASCII_I, ASCII_O, ASCII_N, ASCII_LPAREN, '\0'};
- static const XML_Char enumValueSep[] = {ASCII_PIPE, '\0'};
- static const XML_Char enumValueStart[] = {ASCII_LPAREN, '\0'};
- #ifndef XML_DTD
- UNUSED_P(account);
- #endif
- /* save one level of indirection */
- DTD *const dtd = parser->m_dtd;
- const char **eventPP;
- const char **eventEndPP;
- enum XML_Content_Quant quant;
- if (enc == parser->m_encoding) {
- eventPP = &parser->m_eventPtr;
- eventEndPP = &parser->m_eventEndPtr;
- } else {
- eventPP = &(parser->m_openInternalEntities->internalEventPtr);
- eventEndPP = &(parser->m_openInternalEntities->internalEventEndPtr);
- }
- for (;;) {
- int role;
- XML_Bool handleDefault = XML_TRUE;
- *eventPP = s;
- *eventEndPP = next;
- if (tok <= 0) {
- if (haveMore && tok != XML_TOK_INVALID) {
- *nextPtr = s;
- return XML_ERROR_NONE;
- }
- switch (tok) {
- case XML_TOK_INVALID:
- *eventPP = next;
- return XML_ERROR_INVALID_TOKEN;
- case XML_TOK_PARTIAL:
- return XML_ERROR_UNCLOSED_TOKEN;
- case XML_TOK_PARTIAL_CHAR:
- return XML_ERROR_PARTIAL_CHAR;
- case -XML_TOK_PROLOG_S:
- tok = -tok;
- break;
- case XML_TOK_NONE:
- #ifdef XML_DTD
- /* for internal PE NOT referenced between declarations */
- if (enc != parser->m_encoding
- && ! parser->m_openInternalEntities->betweenDecl) {
- *nextPtr = s;
- return XML_ERROR_NONE;
- }
- /* WFC: PE Between Declarations - must check that PE contains
- complete markup, not only for external PEs, but also for
- internal PEs if the reference occurs between declarations.
- */
- if (parser->m_isParamEntity || enc != parser->m_encoding) {
- if (XmlTokenRole(&parser->m_prologState, XML_TOK_NONE, end, end, enc)
- == XML_ROLE_ERROR)
- return XML_ERROR_INCOMPLETE_PE;
- *nextPtr = s;
- return XML_ERROR_NONE;
- }
- #endif /* XML_DTD */
- return XML_ERROR_NO_ELEMENTS;
- default:
- tok = -tok;
- next = end;
- break;
- }
- }
- role = XmlTokenRole(&parser->m_prologState, tok, s, next, enc);
- #if XML_GE == 1
- switch (role) {
- case XML_ROLE_INSTANCE_START: // bytes accounted in contentProcessor
- case XML_ROLE_XML_DECL: // bytes accounted in processXmlDecl
- # ifdef XML_DTD
- case XML_ROLE_TEXT_DECL: // bytes accounted in processXmlDecl
- # endif
- break;
- default:
- if (! accountingDiffTolerated(parser, tok, s, next, __LINE__, account)) {
- accountingOnAbort(parser);
- return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
- }
- }
- #endif
- switch (role) {
- case XML_ROLE_XML_DECL: {
- enum XML_Error result = processXmlDecl(parser, 0, s, next);
- if (result != XML_ERROR_NONE)
- return result;
- enc = parser->m_encoding;
- handleDefault = XML_FALSE;
- } break;
- case XML_ROLE_DOCTYPE_NAME:
- if (parser->m_startDoctypeDeclHandler) {
- parser->m_doctypeName
- = poolStoreString(&parser->m_tempPool, enc, s, next);
- if (! parser->m_doctypeName)
- return XML_ERROR_NO_MEMORY;
- poolFinish(&parser->m_tempPool);
- parser->m_doctypePubid = NULL;
- handleDefault = XML_FALSE;
- }
- parser->m_doctypeSysid = NULL; /* always initialize to NULL */
- break;
- case XML_ROLE_DOCTYPE_INTERNAL_SUBSET:
- if (parser->m_startDoctypeDeclHandler) {
- parser->m_startDoctypeDeclHandler(
- parser->m_handlerArg, parser->m_doctypeName, parser->m_doctypeSysid,
- parser->m_doctypePubid, 1);
- parser->m_doctypeName = NULL;
- poolClear(&parser->m_tempPool);
- handleDefault = XML_FALSE;
- }
- break;
- #ifdef XML_DTD
- case XML_ROLE_TEXT_DECL: {
- enum XML_Error result = processXmlDecl(parser, 1, s, next);
- if (result != XML_ERROR_NONE)
- return result;
- enc = parser->m_encoding;
- handleDefault = XML_FALSE;
- } break;
- #endif /* XML_DTD */
- case XML_ROLE_DOCTYPE_PUBLIC_ID:
- #ifdef XML_DTD
- parser->m_useForeignDTD = XML_FALSE;
- parser->m_declEntity = (ENTITY *)lookup(
- parser, &dtd->paramEntities, externalSubsetName, sizeof(ENTITY));
- if (! parser->m_declEntity)
- return XML_ERROR_NO_MEMORY;
- #endif /* XML_DTD */
- dtd->hasParamEntityRefs = XML_TRUE;
- if (parser->m_startDoctypeDeclHandler) {
- XML_Char *pubId;
- if (! XmlIsPublicId(enc, s, next, eventPP))
- return XML_ERROR_PUBLICID;
- pubId = poolStoreString(&parser->m_tempPool, enc,
- s + enc->minBytesPerChar,
- next - enc->minBytesPerChar);
- if (! pubId)
- return XML_ERROR_NO_MEMORY;
- normalizePublicId(pubId);
- poolFinish(&parser->m_tempPool);
- parser->m_doctypePubid = pubId;
- handleDefault = XML_FALSE;
- goto alreadyChecked;
- }
- /* fall through */
- case XML_ROLE_ENTITY_PUBLIC_ID:
- if (! XmlIsPublicId(enc, s, next, eventPP))
- return XML_ERROR_PUBLICID;
- alreadyChecked:
- if (dtd->keepProcessing && parser->m_declEntity) {
- XML_Char *tem
- = poolStoreString(&dtd->pool, enc, s + enc->minBytesPerChar,
- next - enc->minBytesPerChar);
- if (! tem)
- return XML_ERROR_NO_MEMORY;
- normalizePublicId(tem);
- parser->m_declEntity->publicId = tem;
- poolFinish(&dtd->pool);
- /* Don't suppress the default handler if we fell through from
- * the XML_ROLE_DOCTYPE_PUBLIC_ID case.
- */
- if (parser->m_entityDeclHandler && role == XML_ROLE_ENTITY_PUBLIC_ID)
- handleDefault = XML_FALSE;
- }
- break;
- case XML_ROLE_DOCTYPE_CLOSE:
- if (allowClosingDoctype != XML_TRUE) {
- /* Must not close doctype from within expanded parameter entities */
- return XML_ERROR_INVALID_TOKEN;
- }
- if (parser->m_doctypeName) {
- parser->m_startDoctypeDeclHandler(
- parser->m_handlerArg, parser->m_doctypeName, parser->m_doctypeSysid,
- parser->m_doctypePubid, 0);
- poolClear(&parser->m_tempPool);
- handleDefault = XML_FALSE;
- }
- /* parser->m_doctypeSysid will be non-NULL in the case of a previous
- XML_ROLE_DOCTYPE_SYSTEM_ID, even if parser->m_startDoctypeDeclHandler
- was not set, indicating an external subset
- */
- #ifdef XML_DTD
- if (parser->m_doctypeSysid || parser->m_useForeignDTD) {
- XML_Bool hadParamEntityRefs = dtd->hasParamEntityRefs;
- dtd->hasParamEntityRefs = XML_TRUE;
- if (parser->m_paramEntityParsing
- && parser->m_externalEntityRefHandler) {
- ENTITY *entity = (ENTITY *)lookup(parser, &dtd->paramEntities,
- externalSubsetName, sizeof(ENTITY));
- if (! entity) {
- /* The external subset name "#" will have already been
- * inserted into the hash table at the start of the
- * external entity parsing, so no allocation will happen
- * and lookup() cannot fail.
- */
- return XML_ERROR_NO_MEMORY; /* LCOV_EXCL_LINE */
- }
- if (parser->m_useForeignDTD)
- entity->base = parser->m_curBase;
- dtd->paramEntityRead = XML_FALSE;
- if (! parser->m_externalEntityRefHandler(
- parser->m_externalEntityRefHandlerArg, 0, entity->base,
- entity->systemId, entity->publicId))
- return XML_ERROR_EXTERNAL_ENTITY_HANDLING;
- if (dtd->paramEntityRead) {
- if (! dtd->standalone && parser->m_notStandaloneHandler
- && ! parser->m_notStandaloneHandler(parser->m_handlerArg))
- return XML_ERROR_NOT_STANDALONE;
- }
- /* if we didn't read the foreign DTD then this means that there
- is no external subset and we must reset dtd->hasParamEntityRefs
- */
- else if (! parser->m_doctypeSysid)
- dtd->hasParamEntityRefs = hadParamEntityRefs;
- /* end of DTD - no need to update dtd->keepProcessing */
- }
- parser->m_useForeignDTD = XML_FALSE;
- }
- #endif /* XML_DTD */
- if (parser->m_endDoctypeDeclHandler) {
- parser->m_endDoctypeDeclHandler(parser->m_handlerArg);
- handleDefault = XML_FALSE;
- }
- break;
- case XML_ROLE_INSTANCE_START:
- #ifdef XML_DTD
- /* if there is no DOCTYPE declaration then now is the
- last chance to read the foreign DTD
- */
- if (parser->m_useForeignDTD) {
- XML_Bool hadParamEntityRefs = dtd->hasParamEntityRefs;
- dtd->hasParamEntityRefs = XML_TRUE;
- if (parser->m_paramEntityParsing
- && parser->m_externalEntityRefHandler) {
- ENTITY *entity = (ENTITY *)lookup(parser, &dtd->paramEntities,
- externalSubsetName, sizeof(ENTITY));
- if (! entity)
- return XML_ERROR_NO_MEMORY;
- entity->base = parser->m_curBase;
- dtd->paramEntityRead = XML_FALSE;
- if (! parser->m_externalEntityRefHandler(
- parser->m_externalEntityRefHandlerArg, 0, entity->base,
- entity->systemId, entity->publicId))
- return XML_ERROR_EXTERNAL_ENTITY_HANDLING;
- if (dtd->paramEntityRead) {
- if (! dtd->standalone && parser->m_notStandaloneHandler
- && ! parser->m_notStandaloneHandler(parser->m_handlerArg))
- return XML_ERROR_NOT_STANDALONE;
- }
- /* if we didn't read the foreign DTD then this means that there
- is no external subset and we must reset dtd->hasParamEntityRefs
- */
- else
- dtd->hasParamEntityRefs = hadParamEntityRefs;
- /* end of DTD - no need to update dtd->keepProcessing */
- }
- }
- #endif /* XML_DTD */
- parser->m_processor = contentProcessor;
- return contentProcessor(parser, s, end, nextPtr);
- case XML_ROLE_ATTLIST_ELEMENT_NAME:
- parser->m_declElementType = getElementType(parser, enc, s, next);
- if (! parser->m_declElementType)
- return XML_ERROR_NO_MEMORY;
- goto checkAttListDeclHandler;
- case XML_ROLE_ATTRIBUTE_NAME:
- parser->m_declAttributeId = getAttributeId(parser, enc, s, next);
- if (! parser->m_declAttributeId)
- return XML_ERROR_NO_MEMORY;
- parser->m_declAttributeIsCdata = XML_FALSE;
- parser->m_declAttributeType = NULL;
- parser->m_declAttributeIsId = XML_FALSE;
- goto checkAttListDeclHandler;
- case XML_ROLE_ATTRIBUTE_TYPE_CDATA:
- parser->m_declAttributeIsCdata = XML_TRUE;
- parser->m_declAttributeType = atypeCDATA;
- goto checkAttListDeclHandler;
- case XML_ROLE_ATTRIBUTE_TYPE_ID:
- parser->m_declAttributeIsId = XML_TRUE;
- parser->m_declAttributeType = atypeID;
- goto checkAttListDeclHandler;
- case XML_ROLE_ATTRIBUTE_TYPE_IDREF:
- parser->m_declAttributeType = atypeIDREF;
- goto checkAttListDeclHandler;
- case XML_ROLE_ATTRIBUTE_TYPE_IDREFS:
- parser->m_declAttributeType = atypeIDREFS;
- goto checkAttListDeclHandler;
- case XML_ROLE_ATTRIBUTE_TYPE_ENTITY:
- parser->m_declAttributeType = atypeENTITY;
- goto checkAttListDeclHandler;
- case XML_ROLE_ATTRIBUTE_TYPE_ENTITIES:
- parser->m_declAttributeType = atypeENTITIES;
- goto checkAttListDeclHandler;
- case XML_ROLE_ATTRIBUTE_TYPE_NMTOKEN:
- parser->m_declAttributeType = atypeNMTOKEN;
- goto checkAttListDeclHandler;
- case XML_ROLE_ATTRIBUTE_TYPE_NMTOKENS:
- parser->m_declAttributeType = atypeNMTOKENS;
- checkAttListDeclHandler:
- if (dtd->keepProcessing && parser->m_attlistDeclHandler)
- handleDefault = XML_FALSE;
- break;
- case XML_ROLE_ATTRIBUTE_ENUM_VALUE:
- case XML_ROLE_ATTRIBUTE_NOTATION_VALUE:
- if (dtd->keepProcessing && parser->m_attlistDeclHandler) {
- const XML_Char *prefix;
- if (parser->m_declAttributeType) {
- prefix = enumValueSep;
- } else {
- prefix = (role == XML_ROLE_ATTRIBUTE_NOTATION_VALUE ? notationPrefix
- : enumValueStart);
- }
- if (! poolAppendString(&parser->m_tempPool, prefix))
- return XML_ERROR_NO_MEMORY;
- if (! poolAppend(&parser->m_tempPool, enc, s, next))
- return XML_ERROR_NO_MEMORY;
- parser->m_declAttributeType = parser->m_tempPool.start;
- handleDefault = XML_FALSE;
- }
- break;
- case XML_ROLE_IMPLIED_ATTRIBUTE_VALUE:
- case XML_ROLE_REQUIRED_ATTRIBUTE_VALUE:
- if (dtd->keepProcessing) {
- if (! defineAttribute(parser->m_declElementType,
- parser->m_declAttributeId,
- parser->m_declAttributeIsCdata,
- parser->m_declAttributeIsId, 0, parser))
- return XML_ERROR_NO_MEMORY;
- if (parser->m_attlistDeclHandler && parser->m_declAttributeType) {
- if (*parser->m_declAttributeType == XML_T(ASCII_LPAREN)
- || (*parser->m_declAttributeType == XML_T(ASCII_N)
- && parser->m_declAttributeType[1] == XML_T(ASCII_O))) {
- /* Enumerated or Notation type */
- if (! poolAppendChar(&parser->m_tempPool, XML_T(ASCII_RPAREN))
- || ! poolAppendChar(&parser->m_tempPool, XML_T('\0')))
- return XML_ERROR_NO_MEMORY;
- parser->m_declAttributeType = parser->m_tempPool.start;
- poolFinish(&parser->m_tempPool);
- }
- *eventEndPP = s;
- parser->m_attlistDeclHandler(
- parser->m_handlerArg, parser->m_declElementType->name,
- parser->m_declAttributeId->name, parser->m_declAttributeType, 0,
- role == XML_ROLE_REQUIRED_ATTRIBUTE_VALUE);
- handleDefault = XML_FALSE;
- }
- }
- poolClear(&parser->m_tempPool);
- break;
- case XML_ROLE_DEFAULT_ATTRIBUTE_VALUE:
- case XML_ROLE_FIXED_ATTRIBUTE_VALUE:
- if (dtd->keepProcessing) {
- const XML_Char *attVal;
- enum XML_Error result = storeAttributeValue(
- parser, enc, parser->m_declAttributeIsCdata,
- s + enc->minBytesPerChar, next - enc->minBytesPerChar, &dtd->pool,
- XML_ACCOUNT_NONE);
- if (result)
- return result;
- attVal = poolStart(&dtd->pool);
- poolFinish(&dtd->pool);
- /* ID attributes aren't allowed to have a default */
- if (! defineAttribute(
- parser->m_declElementType, parser->m_declAttributeId,
- parser->m_declAttributeIsCdata, XML_FALSE, attVal, parser))
- return XML_ERROR_NO_MEMORY;
- if (parser->m_attlistDeclHandler && parser->m_declAttributeType) {
- if (*parser->m_declAttributeType == XML_T(ASCII_LPAREN)
- || (*parser->m_declAttributeType == XML_T(ASCII_N)
- && parser->m_declAttributeType[1] == XML_T(ASCII_O))) {
- /* Enumerated or Notation type */
- if (! poolAppendChar(&parser->m_tempPool, XML_T(ASCII_RPAREN))
- || ! poolAppendChar(&parser->m_tempPool, XML_T('\0')))
- return XML_ERROR_NO_MEMORY;
- parser->m_declAttributeType = parser->m_tempPool.start;
- poolFinish(&parser->m_tempPool);
- }
- *eventEndPP = s;
- parser->m_attlistDeclHandler(
- parser->m_handlerArg, parser->m_declElementType->name,
- parser->m_declAttributeId->name, parser->m_declAttributeType,
- attVal, role == XML_ROLE_FIXED_ATTRIBUTE_VALUE);
- poolClear(&parser->m_tempPool);
- handleDefault = XML_FALSE;
- }
- }
- break;
- case XML_ROLE_ENTITY_VALUE:
- if (dtd->keepProcessing) {
- #if XML_GE == 1
- // This will store the given replacement text in
- // parser->m_declEntity->textPtr.
- enum XML_Error result
- = storeEntityValue(parser, enc, s + enc->minBytesPerChar,
- next - enc->minBytesPerChar, XML_ACCOUNT_NONE);
- if (parser->m_declEntity) {
- parser->m_declEntity->textPtr = poolStart(&dtd->entityValuePool);
- parser->m_declEntity->textLen
- = (int)(poolLength(&dtd->entityValuePool));
- poolFinish(&dtd->entityValuePool);
- if (parser->m_entityDeclHandler) {
- *eventEndPP = s;
- parser->m_entityDeclHandler(
- parser->m_handlerArg, parser->m_declEntity->name,
- parser->m_declEntity->is_param, parser->m_declEntity->textPtr,
- parser->m_declEntity->textLen, parser->m_curBase, 0, 0, 0);
- handleDefault = XML_FALSE;
- }
- } else
- poolDiscard(&dtd->entityValuePool);
- if (result != XML_ERROR_NONE)
- return result;
- #else
- // This will store "&entity123;" in parser->m_declEntity->textPtr
- // to end up as "&entity123;" in the handler.
- if (parser->m_declEntity != NULL) {
- const enum XML_Error result
- = storeSelfEntityValue(parser, parser->m_declEntity);
- if (result != XML_ERROR_NONE)
- return result;
- if (parser->m_entityDeclHandler) {
- *eventEndPP = s;
- parser->m_entityDeclHandler(
- parser->m_handlerArg, parser->m_declEntity->name,
- parser->m_declEntity->is_param, parser->m_declEntity->textPtr,
- parser->m_declEntity->textLen, parser->m_curBase, 0, 0, 0);
- handleDefault = XML_FALSE;
- }
- }
- #endif
- }
- break;
- case XML_ROLE_DOCTYPE_SYSTEM_ID:
- #ifdef XML_DTD
- parser->m_useForeignDTD = XML_FALSE;
- #endif /* XML_DTD */
- dtd->hasParamEntityRefs = XML_TRUE;
- if (parser->m_startDoctypeDeclHandler) {
- parser->m_doctypeSysid = poolStoreString(&parser->m_tempPool, enc,
- s + enc->minBytesPerChar,
- next - enc->minBytesPerChar);
- if (parser->m_doctypeSysid == NULL)
- return XML_ERROR_NO_MEMORY;
- poolFinish(&parser->m_tempPool);
- handleDefault = XML_FALSE;
- }
- #ifdef XML_DTD
- else
- /* use externalSubsetName to make parser->m_doctypeSysid non-NULL
- for the case where no parser->m_startDoctypeDeclHandler is set */
- parser->m_doctypeSysid = externalSubsetName;
- #endif /* XML_DTD */
- if (! dtd->standalone
- #ifdef XML_DTD
- && ! parser->m_paramEntityParsing
- #endif /* XML_DTD */
- && parser->m_notStandaloneHandler
- && ! parser->m_notStandaloneHandler(parser->m_handlerArg))
- return XML_ERROR_NOT_STANDALONE;
- #ifndef XML_DTD
- break;
- #else /* XML_DTD */
- if (! parser->m_declEntity) {
- parser->m_declEntity = (ENTITY *)lookup(
- parser, &dtd->paramEntities, externalSubsetName, sizeof(ENTITY));
- if (! parser->m_declEntity)
- return XML_ERROR_NO_MEMORY;
- parser->m_declEntity->publicId = NULL;
- }
- #endif /* XML_DTD */
- /* fall through */
- case XML_ROLE_ENTITY_SYSTEM_ID:
- if (dtd->keepProcessing && parser->m_declEntity) {
- parser->m_declEntity->systemId
- = poolStoreString(&dtd->pool, enc, s + enc->minBytesPerChar,
- next - enc->minBytesPerChar);
- if (! parser->m_declEntity->systemId)
- return XML_ERROR_NO_MEMORY;
- parser->m_declEntity->base = parser->m_curBase;
- poolFinish(&dtd->pool);
- /* Don't suppress the default handler if we fell through from
- * the XML_ROLE_DOCTYPE_SYSTEM_ID case.
- */
- if (parser->m_entityDeclHandler && role == XML_ROLE_ENTITY_SYSTEM_ID)
- handleDefault = XML_FALSE;
- }
- break;
- case XML_ROLE_ENTITY_COMPLETE:
- #if XML_GE == 0
- // This will store "&entity123;" in entity->textPtr
- // to end up as "&entity123;" in the handler.
- if (parser->m_declEntity != NULL) {
- const enum XML_Error result
- = storeSelfEntityValue(parser, parser->m_declEntity);
- if (result != XML_ERROR_NONE)
- return result;
- }
- #endif
- if (dtd->keepProcessing && parser->m_declEntity
- && parser->m_entityDeclHandler) {
- *eventEndPP = s;
- parser->m_entityDeclHandler(
- parser->m_handlerArg, parser->m_declEntity->name,
- parser->m_declEntity->is_param, 0, 0, parser->m_declEntity->base,
- parser->m_declEntity->systemId, parser->m_declEntity->publicId, 0);
- handleDefault = XML_FALSE;
- }
- break;
- case XML_ROLE_ENTITY_NOTATION_NAME:
- if (dtd->keepProcessing && parser->m_declEntity) {
- parser->m_declEntity->notation
- = poolStoreString(&dtd->pool, enc, s, next);
- if (! parser->m_declEntity->notation)
- return XML_ERROR_NO_MEMORY;
- poolFinish(&dtd->pool);
- if (parser->m_unparsedEntityDeclHandler) {
- *eventEndPP = s;
- parser->m_unparsedEntityDeclHandler(
- parser->m_handlerArg, parser->m_declEntity->name,
- parser->m_declEntity->base, parser->m_declEntity->systemId,
- parser->m_declEntity->publicId, parser->m_declEntity->notation);
- handleDefault = XML_FALSE;
- } else if (parser->m_entityDeclHandler) {
- *eventEndPP = s;
- parser->m_entityDeclHandler(
- parser->m_handlerArg, parser->m_declEntity->name, 0, 0, 0,
- parser->m_declEntity->base, parser->m_declEntity->systemId,
- parser->m_declEntity->publicId, parser->m_declEntity->notation);
- handleDefault = XML_FALSE;
- }
- }
- break;
- case XML_ROLE_GENERAL_ENTITY_NAME: {
- if (XmlPredefinedEntityName(enc, s, next)) {
- parser->m_declEntity = NULL;
- break;
- }
- if (dtd->keepProcessing) {
- const XML_Char *name = poolStoreString(&dtd->pool, enc, s, next);
- if (! name)
- return XML_ERROR_NO_MEMORY;
- parser->m_declEntity = (ENTITY *)lookup(parser, &dtd->generalEntities,
- name, sizeof(ENTITY));
- if (! parser->m_declEntity)
- return XML_ERROR_NO_MEMORY;
- if (parser->m_declEntity->name != name) {
- poolDiscard(&dtd->pool);
- parser->m_declEntity = NULL;
- } else {
- poolFinish(&dtd->pool);
- parser->m_declEntity->publicId = NULL;
- parser->m_declEntity->is_param = XML_FALSE;
- /* if we have a parent parser or are reading an internal parameter
- entity, then the entity declaration is not considered "internal"
- */
- parser->m_declEntity->is_internal
- = ! (parser->m_parentParser || parser->m_openInternalEntities);
- if (parser->m_entityDeclHandler)
- handleDefault = XML_FALSE;
- }
- } else {
- poolDiscard(&dtd->pool);
- parser->m_declEntity = NULL;
- }
- } break;
- case XML_ROLE_PARAM_ENTITY_NAME:
- #ifdef XML_DTD
- if (dtd->keepProcessing) {
- const XML_Char *name = poolStoreString(&dtd->pool, enc, s, next);
- if (! name)
- return XML_ERROR_NO_MEMORY;
- parser->m_declEntity = (ENTITY *)lookup(parser, &dtd->paramEntities,
- name, sizeof(ENTITY));
- if (! parser->m_declEntity)
- return XML_ERROR_NO_MEMORY;
- if (parser->m_declEntity->name != name) {
- poolDiscard(&dtd->pool);
- parser->m_declEntity = NULL;
- } else {
- poolFinish(&dtd->pool);
- parser->m_declEntity->publicId = NULL;
- parser->m_declEntity->is_param = XML_TRUE;
- /* if we have a parent parser or are reading an internal parameter
- entity, then the entity declaration is not considered "internal"
- */
- parser->m_declEntity->is_internal
- = ! (parser->m_parentParser || parser->m_openInternalEntities);
- if (parser->m_entityDeclHandler)
- handleDefault = XML_FALSE;
- }
- } else {
- poolDiscard(&dtd->pool);
- parser->m_declEntity = NULL;
- }
- #else /* not XML_DTD */
- parser->m_declEntity = NULL;
- #endif /* XML_DTD */
- break;
- case XML_ROLE_NOTATION_NAME:
- parser->m_declNotationPublicId = NULL;
- parser->m_declNotationName = NULL;
- if (parser->m_notationDeclHandler) {
- parser->m_declNotationName
- = poolStoreString(&parser->m_tempPool, enc, s, next);
- if (! parser->m_declNotationName)
- return XML_ERROR_NO_MEMORY;
- poolFinish(&parser->m_tempPool);
- handleDefault = XML_FALSE;
- }
- break;
- case XML_ROLE_NOTATION_PUBLIC_ID:
- if (! XmlIsPublicId(enc, s, next, eventPP))
- return XML_ERROR_PUBLICID;
- if (parser
- ->m_declNotationName) { /* means m_notationDeclHandler != NULL */
- XML_Char *tem = poolStoreString(&parser->m_tempPool, enc,
- s + enc->minBytesPerChar,
- next - enc->minBytesPerChar);
- if (! tem)
- return XML_ERROR_NO_MEMORY;
- normalizePublicId(tem);
- parser->m_declNotationPublicId = tem;
- poolFinish(&parser->m_tempPool);
- handleDefault = XML_FALSE;
- }
- break;
- case XML_ROLE_NOTATION_SYSTEM_ID:
- if (parser->m_declNotationName && parser->m_notationDeclHandler) {
- const XML_Char *systemId = poolStoreString(&parser->m_tempPool, enc,
- s + enc->minBytesPerChar,
- next - enc->minBytesPerChar);
- if (! systemId)
- return XML_ERROR_NO_MEMORY;
- *eventEndPP = s;
- parser->m_notationDeclHandler(
- parser->m_handlerArg, parser->m_declNotationName, parser->m_curBase,
- systemId, parser->m_declNotationPublicId);
- handleDefault = XML_FALSE;
- }
- poolClear(&parser->m_tempPool);
- break;
- case XML_ROLE_NOTATION_NO_SYSTEM_ID:
- if (parser->m_declNotationPublicId && parser->m_notationDeclHandler) {
- *eventEndPP = s;
- parser->m_notationDeclHandler(
- parser->m_handlerArg, parser->m_declNotationName, parser->m_curBase,
- 0, parser->m_declNotationPublicId);
- handleDefault = XML_FALSE;
- }
- poolClear(&parser->m_tempPool);
- break;
- case XML_ROLE_ERROR:
- switch (tok) {
- case XML_TOK_PARAM_ENTITY_REF:
- /* PE references in internal subset are
- not allowed within declarations. */
- return XML_ERROR_PARAM_ENTITY_REF;
- case XML_TOK_XML_DECL:
- return XML_ERROR_MISPLACED_XML_PI;
- default:
- return XML_ERROR_SYNTAX;
- }
- #ifdef XML_DTD
- case XML_ROLE_IGNORE_SECT: {
- enum XML_Error result;
- if (parser->m_defaultHandler)
- reportDefault(parser, enc, s, next);
- handleDefault = XML_FALSE;
- result = doIgnoreSection(parser, enc, &next, end, nextPtr, haveMore);
- if (result != XML_ERROR_NONE)
- return result;
- else if (! next) {
- parser->m_processor = ignoreSectionProcessor;
- return result;
- }
- } break;
- #endif /* XML_DTD */
- case XML_ROLE_GROUP_OPEN:
- if (parser->m_prologState.level >= parser->m_groupSize) {
- if (parser->m_groupSize) {
- {
- /* Detect and prevent integer overflow */
- if (parser->m_groupSize > (unsigned int)(-1) / 2u) {
- return XML_ERROR_NO_MEMORY;
- }
- char *const new_connector = (char *)REALLOC(
- parser, parser->m_groupConnector, parser->m_groupSize *= 2);
- if (new_connector == NULL) {
- parser->m_groupSize /= 2;
- return XML_ERROR_NO_MEMORY;
- }
- parser->m_groupConnector = new_connector;
- }
- if (dtd->scaffIndex) {
- /* Detect and prevent integer overflow.
- * The preprocessor guard addresses the "always false" warning
- * from -Wtype-limits on platforms where
- * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
- #if UINT_MAX >= SIZE_MAX
- if (parser->m_groupSize > (size_t)(-1) / sizeof(int)) {
- return XML_ERROR_NO_MEMORY;
- }
- #endif
- int *const new_scaff_index = (int *)REALLOC(
- parser, dtd->scaffIndex, parser->m_groupSize * sizeof(int));
- if (new_scaff_index == NULL)
- return XML_ERROR_NO_MEMORY;
- dtd->scaffIndex = new_scaff_index;
- }
- } else {
- parser->m_groupConnector
- = (char *)MALLOC(parser, parser->m_groupSize = 32);
- if (! parser->m_groupConnector) {
- parser->m_groupSize = 0;
- return XML_ERROR_NO_MEMORY;
- }
- }
- }
- parser->m_groupConnector[parser->m_prologState.level] = 0;
- if (dtd->in_eldecl) {
- int myindex = nextScaffoldPart(parser);
- if (myindex < 0)
- return XML_ERROR_NO_MEMORY;
- assert(dtd->scaffIndex != NULL);
- dtd->scaffIndex[dtd->scaffLevel] = myindex;
- dtd->scaffLevel++;
- dtd->scaffold[myindex].type = XML_CTYPE_SEQ;
- if (parser->m_elementDeclHandler)
- handleDefault = XML_FALSE;
- }
- break;
- case XML_ROLE_GROUP_SEQUENCE:
- if (parser->m_groupConnector[parser->m_prologState.level] == ASCII_PIPE)
- return XML_ERROR_SYNTAX;
- parser->m_groupConnector[parser->m_prologState.level] = ASCII_COMMA;
- if (dtd->in_eldecl && parser->m_elementDeclHandler)
- handleDefault = XML_FALSE;
- break;
- case XML_ROLE_GROUP_CHOICE:
- if (parser->m_groupConnector[parser->m_prologState.level] == ASCII_COMMA)
- return XML_ERROR_SYNTAX;
- if (dtd->in_eldecl
- && ! parser->m_groupConnector[parser->m_prologState.level]
- && (dtd->scaffold[dtd->scaffIndex[dtd->scaffLevel - 1]].type
- != XML_CTYPE_MIXED)) {
- dtd->scaffold[dtd->scaffIndex[dtd->scaffLevel - 1]].type
- = XML_CTYPE_CHOICE;
- if (parser->m_elementDeclHandler)
- handleDefault = XML_FALSE;
- }
- parser->m_groupConnector[parser->m_prologState.level] = ASCII_PIPE;
- break;
- case XML_ROLE_PARAM_ENTITY_REF:
- #ifdef XML_DTD
- case XML_ROLE_INNER_PARAM_ENTITY_REF:
- dtd->hasParamEntityRefs = XML_TRUE;
- if (! parser->m_paramEntityParsing)
- dtd->keepProcessing = dtd->standalone;
- else {
- const XML_Char *name;
- ENTITY *entity;
- name = poolStoreString(&dtd->pool, enc, s + enc->minBytesPerChar,
- next - enc->minBytesPerChar);
- if (! name)
- return XML_ERROR_NO_MEMORY;
- entity = (ENTITY *)lookup(parser, &dtd->paramEntities, name, 0);
- poolDiscard(&dtd->pool);
- /* first, determine if a check for an existing declaration is needed;
- if yes, check that the entity exists, and that it is internal,
- otherwise call the skipped entity handler
- */
- if (parser->m_prologState.documentEntity
- && (dtd->standalone ? ! parser->m_openInternalEntities
- : ! dtd->hasParamEntityRefs)) {
- if (! entity)
- return XML_ERROR_UNDEFINED_ENTITY;
- else if (! entity->is_internal) {
- /* It's hard to exhaustively search the code to be sure,
- * but there doesn't seem to be a way of executing the
- * following line. There are two cases:
- *
- * If 'standalone' is false, the DTD must have no
- * parameter entities or we wouldn't have passed the outer
- * 'if' statement. That means the only entity in the hash
- * table is the external subset name "#" which cannot be
- * given as a parameter entity name in XML syntax, so the
- * lookup must have returned NULL and we don't even reach
- * the test for an internal entity.
- *
- * If 'standalone' is true, it does not seem to be
- * possible to create entities taking this code path that
- * are not internal entities, so fail the test above.
- *
- * Because this analysis is very uncertain, the code is
- * being left in place and merely removed from the
- * coverage test statistics.
- */
- return XML_ERROR_ENTITY_DECLARED_IN_PE; /* LCOV_EXCL_LINE */
- }
- } else if (! entity) {
- dtd->keepProcessing = dtd->standalone;
- /* cannot report skipped entities in declarations */
- if ((role == XML_ROLE_PARAM_ENTITY_REF)
- && parser->m_skippedEntityHandler) {
- parser->m_skippedEntityHandler(parser->m_handlerArg, name, 1);
- handleDefault = XML_FALSE;
- }
- break;
- }
- if (entity->open)
- return XML_ERROR_RECURSIVE_ENTITY_REF;
- if (entity->textPtr) {
- enum XML_Error result;
- XML_Bool betweenDecl
- = (role == XML_ROLE_PARAM_ENTITY_REF ? XML_TRUE : XML_FALSE);
- result = processInternalEntity(parser, entity, betweenDecl);
- if (result != XML_ERROR_NONE)
- return result;
- handleDefault = XML_FALSE;
- break;
- }
- if (parser->m_externalEntityRefHandler) {
- dtd->paramEntityRead = XML_FALSE;
- entity->open = XML_TRUE;
- entityTrackingOnOpen(parser, entity, __LINE__);
- if (! parser->m_externalEntityRefHandler(
- parser->m_externalEntityRefHandlerArg, 0, entity->base,
- entity->systemId, entity->publicId)) {
- entityTrackingOnClose(parser, entity, __LINE__);
- entity->open = XML_FALSE;
- return XML_ERROR_EXTERNAL_ENTITY_HANDLING;
- }
- entityTrackingOnClose(parser, entity, __LINE__);
- entity->open = XML_FALSE;
- handleDefault = XML_FALSE;
- if (! dtd->paramEntityRead) {
- dtd->keepProcessing = dtd->standalone;
- break;
- }
- } else {
- dtd->keepProcessing = dtd->standalone;
- break;
- }
- }
- #endif /* XML_DTD */
- if (! dtd->standalone && parser->m_notStandaloneHandler
- && ! parser->m_notStandaloneHandler(parser->m_handlerArg))
- return XML_ERROR_NOT_STANDALONE;
- break;
- /* Element declaration stuff */
- case XML_ROLE_ELEMENT_NAME:
- if (parser->m_elementDeclHandler) {
- parser->m_declElementType = getElementType(parser, enc, s, next);
- if (! parser->m_declElementType)
- return XML_ERROR_NO_MEMORY;
- dtd->scaffLevel = 0;
- dtd->scaffCount = 0;
- dtd->in_eldecl = XML_TRUE;
- handleDefault = XML_FALSE;
- }
- break;
- case XML_ROLE_CONTENT_ANY:
- case XML_ROLE_CONTENT_EMPTY:
- if (dtd->in_eldecl) {
- if (parser->m_elementDeclHandler) {
- XML_Content *content
- = (XML_Content *)MALLOC(parser, sizeof(XML_Content));
- if (! content)
- return XML_ERROR_NO_MEMORY;
- content->quant = XML_CQUANT_NONE;
- content->name = NULL;
- content->numchildren = 0;
- content->children = NULL;
- content->type = ((role == XML_ROLE_CONTENT_ANY) ? XML_CTYPE_ANY
- : XML_CTYPE_EMPTY);
- *eventEndPP = s;
- parser->m_elementDeclHandler(
- parser->m_handlerArg, parser->m_declElementType->name, content);
- handleDefault = XML_FALSE;
- }
- dtd->in_eldecl = XML_FALSE;
- }
- break;
- case XML_ROLE_CONTENT_PCDATA:
- if (dtd->in_eldecl) {
- dtd->scaffold[dtd->scaffIndex[dtd->scaffLevel - 1]].type
- = XML_CTYPE_MIXED;
- if (parser->m_elementDeclHandler)
- handleDefault = XML_FALSE;
- }
- break;
- case XML_ROLE_CONTENT_ELEMENT:
- quant = XML_CQUANT_NONE;
- goto elementContent;
- case XML_ROLE_CONTENT_ELEMENT_OPT:
- quant = XML_CQUANT_OPT;
- goto elementContent;
- case XML_ROLE_CONTENT_ELEMENT_REP:
- quant = XML_CQUANT_REP;
- goto elementContent;
- case XML_ROLE_CONTENT_ELEMENT_PLUS:
- quant = XML_CQUANT_PLUS;
- elementContent:
- if (dtd->in_eldecl) {
- ELEMENT_TYPE *el;
- const XML_Char *name;
- size_t nameLen;
- const char *nxt
- = (quant == XML_CQUANT_NONE ? next : next - enc->minBytesPerChar);
- int myindex = nextScaffoldPart(parser);
- if (myindex < 0)
- return XML_ERROR_NO_MEMORY;
- dtd->scaffold[myindex].type = XML_CTYPE_NAME;
- dtd->scaffold[myindex].quant = quant;
- el = getElementType(parser, enc, s, nxt);
- if (! el)
- return XML_ERROR_NO_MEMORY;
- name = el->name;
- dtd->scaffold[myindex].name = name;
- nameLen = 0;
- for (; name[nameLen++];)
- ;
- /* Detect and prevent integer overflow */
- if (nameLen > UINT_MAX - dtd->contentStringLen) {
- return XML_ERROR_NO_MEMORY;
- }
- dtd->contentStringLen += (unsigned)nameLen;
- if (parser->m_elementDeclHandler)
- handleDefault = XML_FALSE;
- }
- break;
- case XML_ROLE_GROUP_CLOSE:
- quant = XML_CQUANT_NONE;
- goto closeGroup;
- case XML_ROLE_GROUP_CLOSE_OPT:
- quant = XML_CQUANT_OPT;
- goto closeGroup;
- case XML_ROLE_GROUP_CLOSE_REP:
- quant = XML_CQUANT_REP;
- goto closeGroup;
- case XML_ROLE_GROUP_CLOSE_PLUS:
- quant = XML_CQUANT_PLUS;
- closeGroup:
- if (dtd->in_eldecl) {
- if (parser->m_elementDeclHandler)
- handleDefault = XML_FALSE;
- dtd->scaffLevel--;
- dtd->scaffold[dtd->scaffIndex[dtd->scaffLevel]].quant = quant;
- if (dtd->scaffLevel == 0) {
- if (! handleDefault) {
- XML_Content *model = build_model(parser);
- if (! model)
- return XML_ERROR_NO_MEMORY;
- *eventEndPP = s;
- parser->m_elementDeclHandler(
- parser->m_handlerArg, parser->m_declElementType->name, model);
- }
- dtd->in_eldecl = XML_FALSE;
- dtd->contentStringLen = 0;
- }
- }
- break;
- /* End element declaration stuff */
- case XML_ROLE_PI:
- if (! reportProcessingInstruction(parser, enc, s, next))
- return XML_ERROR_NO_MEMORY;
- handleDefault = XML_FALSE;
- break;
- case XML_ROLE_COMMENT:
- if (! reportComment(parser, enc, s, next))
- return XML_ERROR_NO_MEMORY;
- handleDefault = XML_FALSE;
- break;
- case XML_ROLE_NONE:
- switch (tok) {
- case XML_TOK_BOM:
- handleDefault = XML_FALSE;
- break;
- }
- break;
- case XML_ROLE_DOCTYPE_NONE:
- if (parser->m_startDoctypeDeclHandler)
- handleDefault = XML_FALSE;
- break;
- case XML_ROLE_ENTITY_NONE:
- if (dtd->keepProcessing && parser->m_entityDeclHandler)
- handleDefault = XML_FALSE;
- break;
- case XML_ROLE_NOTATION_NONE:
- if (parser->m_notationDeclHandler)
- handleDefault = XML_FALSE;
- break;
- case XML_ROLE_ATTLIST_NONE:
- if (dtd->keepProcessing && parser->m_attlistDeclHandler)
- handleDefault = XML_FALSE;
- break;
- case XML_ROLE_ELEMENT_NONE:
- if (parser->m_elementDeclHandler)
- handleDefault = XML_FALSE;
- break;
- } /* end of big switch */
- if (handleDefault && parser->m_defaultHandler)
- reportDefault(parser, enc, s, next);
- switch (parser->m_parsingStatus.parsing) {
- case XML_SUSPENDED:
- *nextPtr = next;
- return XML_ERROR_NONE;
- case XML_FINISHED:
- return XML_ERROR_ABORTED;
- default:
- s = next;
- tok = XmlPrologTok(enc, s, end, &next);
- }
- }
- /* not reached */
- }
- static enum XML_Error PTRCALL
- epilogProcessor(XML_Parser parser, const char *s, const char *end,
- const char **nextPtr) {
- parser->m_processor = epilogProcessor;
- parser->m_eventPtr = s;
- for (;;) {
- const char *next = NULL;
- int tok = XmlPrologTok(parser->m_encoding, s, end, &next);
- #if XML_GE == 1
- if (! accountingDiffTolerated(parser, tok, s, next, __LINE__,
- XML_ACCOUNT_DIRECT)) {
- accountingOnAbort(parser);
- return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
- }
- #endif
- parser->m_eventEndPtr = next;
- switch (tok) {
- /* report partial linebreak - it might be the last token */
- case -XML_TOK_PROLOG_S:
- if (parser->m_defaultHandler) {
- reportDefault(parser, parser->m_encoding, s, next);
- if (parser->m_parsingStatus.parsing == XML_FINISHED)
- return XML_ERROR_ABORTED;
- }
- *nextPtr = next;
- return XML_ERROR_NONE;
- case XML_TOK_NONE:
- *nextPtr = s;
- return XML_ERROR_NONE;
- case XML_TOK_PROLOG_S:
- if (parser->m_defaultHandler)
- reportDefault(parser, parser->m_encoding, s, next);
- break;
- case XML_TOK_PI:
- if (! reportProcessingInstruction(parser, parser->m_encoding, s, next))
- return XML_ERROR_NO_MEMORY;
- break;
- case XML_TOK_COMMENT:
- if (! reportComment(parser, parser->m_encoding, s, next))
- return XML_ERROR_NO_MEMORY;
- break;
- case XML_TOK_INVALID:
- parser->m_eventPtr = next;
- return XML_ERROR_INVALID_TOKEN;
- case XML_TOK_PARTIAL:
- if (! parser->m_parsingStatus.finalBuffer) {
- *nextPtr = s;
- return XML_ERROR_NONE;
- }
- return XML_ERROR_UNCLOSED_TOKEN;
- case XML_TOK_PARTIAL_CHAR:
- if (! parser->m_parsingStatus.finalBuffer) {
- *nextPtr = s;
- return XML_ERROR_NONE;
- }
- return XML_ERROR_PARTIAL_CHAR;
- default:
- return XML_ERROR_JUNK_AFTER_DOC_ELEMENT;
- }
- parser->m_eventPtr = s = next;
- switch (parser->m_parsingStatus.parsing) {
- case XML_SUSPENDED:
- *nextPtr = next;
- return XML_ERROR_NONE;
- case XML_FINISHED:
- return XML_ERROR_ABORTED;
- default:;
- }
- }
- }
- static enum XML_Error
- processInternalEntity(XML_Parser parser, ENTITY *entity, XML_Bool betweenDecl) {
- const char *textStart, *textEnd;
- const char *next;
- enum XML_Error result;
- OPEN_INTERNAL_ENTITY *openEntity;
- if (parser->m_freeInternalEntities) {
- openEntity = parser->m_freeInternalEntities;
- parser->m_freeInternalEntities = openEntity->next;
- } else {
- openEntity
- = (OPEN_INTERNAL_ENTITY *)MALLOC(parser, sizeof(OPEN_INTERNAL_ENTITY));
- if (! openEntity)
- return XML_ERROR_NO_MEMORY;
- }
- entity->open = XML_TRUE;
- #if XML_GE == 1
- entityTrackingOnOpen(parser, entity, __LINE__);
- #endif
- entity->processed = 0;
- openEntity->next = parser->m_openInternalEntities;
- parser->m_openInternalEntities = openEntity;
- openEntity->entity = entity;
- openEntity->startTagLevel = parser->m_tagLevel;
- openEntity->betweenDecl = betweenDecl;
- openEntity->internalEventPtr = NULL;
- openEntity->internalEventEndPtr = NULL;
- textStart = (const char *)entity->textPtr;
- textEnd = (const char *)(entity->textPtr + entity->textLen);
- /* Set a safe default value in case 'next' does not get set */
- next = textStart;
- if (entity->is_param) {
- int tok
- = XmlPrologTok(parser->m_internalEncoding, textStart, textEnd, &next);
- result = doProlog(parser, parser->m_internalEncoding, textStart, textEnd,
- tok, next, &next, XML_FALSE, XML_FALSE,
- XML_ACCOUNT_ENTITY_EXPANSION);
- } else {
- result = doContent(parser, parser->m_tagLevel, parser->m_internalEncoding,
- textStart, textEnd, &next, XML_FALSE,
- XML_ACCOUNT_ENTITY_EXPANSION);
- }
- if (result == XML_ERROR_NONE) {
- if (textEnd != next && parser->m_parsingStatus.parsing == XML_SUSPENDED) {
- entity->processed = (int)(next - textStart);
- parser->m_processor = internalEntityProcessor;
- } else if (parser->m_openInternalEntities->entity == entity) {
- #if XML_GE == 1
- entityTrackingOnClose(parser, entity, __LINE__);
- #endif /* XML_GE == 1 */
- entity->open = XML_FALSE;
- parser->m_openInternalEntities = openEntity->next;
- /* put openEntity back in list of free instances */
- openEntity->next = parser->m_freeInternalEntities;
- parser->m_freeInternalEntities = openEntity;
- }
- }
- return result;
- }
- static enum XML_Error PTRCALL
- internalEntityProcessor(XML_Parser parser, const char *s, const char *end,
- const char **nextPtr) {
- ENTITY *entity;
- const char *textStart, *textEnd;
- const char *next;
- enum XML_Error result;
- OPEN_INTERNAL_ENTITY *openEntity = parser->m_openInternalEntities;
- if (! openEntity)
- return XML_ERROR_UNEXPECTED_STATE;
- entity = openEntity->entity;
- textStart = ((const char *)entity->textPtr) + entity->processed;
- textEnd = (const char *)(entity->textPtr + entity->textLen);
- /* Set a safe default value in case 'next' does not get set */
- next = textStart;
- if (entity->is_param) {
- int tok
- = XmlPrologTok(parser->m_internalEncoding, textStart, textEnd, &next);
- result = doProlog(parser, parser->m_internalEncoding, textStart, textEnd,
- tok, next, &next, XML_FALSE, XML_TRUE,
- XML_ACCOUNT_ENTITY_EXPANSION);
- } else {
- result = doContent(parser, openEntity->startTagLevel,
- parser->m_internalEncoding, textStart, textEnd, &next,
- XML_FALSE, XML_ACCOUNT_ENTITY_EXPANSION);
- }
- if (result != XML_ERROR_NONE)
- return result;
- if (textEnd != next && parser->m_parsingStatus.parsing == XML_SUSPENDED) {
- entity->processed = (int)(next - (const char *)entity->textPtr);
- return result;
- }
- #if XML_GE == 1
- entityTrackingOnClose(parser, entity, __LINE__);
- #endif
- entity->open = XML_FALSE;
- parser->m_openInternalEntities = openEntity->next;
- /* put openEntity back in list of free instances */
- openEntity->next = parser->m_freeInternalEntities;
- parser->m_freeInternalEntities = openEntity;
- // If there are more open entities we want to stop right here and have the
- // upcoming call to XML_ResumeParser continue with entity content, or it would
- // be ignored altogether.
- if (parser->m_openInternalEntities != NULL
- && parser->m_parsingStatus.parsing == XML_SUSPENDED) {
- return XML_ERROR_NONE;
- }
- if (entity->is_param) {
- int tok;
- parser->m_processor = prologProcessor;
- tok = XmlPrologTok(parser->m_encoding, s, end, &next);
- return doProlog(parser, parser->m_encoding, s, end, tok, next, nextPtr,
- (XML_Bool)! parser->m_parsingStatus.finalBuffer, XML_TRUE,
- XML_ACCOUNT_DIRECT);
- } else {
- parser->m_processor = contentProcessor;
- /* see externalEntityContentProcessor vs contentProcessor */
- result = doContent(parser, parser->m_parentParser ? 1 : 0,
- parser->m_encoding, s, end, nextPtr,
- (XML_Bool)! parser->m_parsingStatus.finalBuffer,
- XML_ACCOUNT_DIRECT);
- if (result == XML_ERROR_NONE) {
- if (! storeRawNames(parser))
- return XML_ERROR_NO_MEMORY;
- }
- return result;
- }
- }
- static enum XML_Error PTRCALL
- errorProcessor(XML_Parser parser, const char *s, const char *end,
- const char **nextPtr) {
- UNUSED_P(s);
- UNUSED_P(end);
- UNUSED_P(nextPtr);
- return parser->m_errorCode;
- }
- static enum XML_Error
- storeAttributeValue(XML_Parser parser, const ENCODING *enc, XML_Bool isCdata,
- const char *ptr, const char *end, STRING_POOL *pool,
- enum XML_Account account) {
- enum XML_Error result
- = appendAttributeValue(parser, enc, isCdata, ptr, end, pool, account);
- if (result)
- return result;
- if (! isCdata && poolLength(pool) && poolLastChar(pool) == 0x20)
- poolChop(pool);
- if (! poolAppendChar(pool, XML_T('\0')))
- return XML_ERROR_NO_MEMORY;
- return XML_ERROR_NONE;
- }
/* Tokenizes the attribute value text in [ptr, end) with
 * XmlAttributeValueTok() and appends the resulting characters to pool.
 * No terminator is appended here; storeAttributeValue() adds it.
 *
 * Per token:
 *   - character references are decoded with XmlCharRefNumber() and
 *     re-encoded with XmlEncode();
 *   - data characters are appended via poolAppend();
 *   - trailing CR, attribute-value whitespace and newline tokens become a
 *     single 0x20;
 *   - predefined entity references append their single character;
 *   - other general entity references are looked up in
 *     dtd->generalEntities and, if they have internal text, expanded by a
 *     recursive call using parser->m_internalEncoding.
 * When isCdata is false, a space is skipped if the pool is empty or already
 * ends in 0x20.
 *
 * parser->m_eventPtr is only updated on error when enc is the parser's own
 * encoding (enc == parser->m_encoding).
 *
 * Returns XML_ERROR_NONE once the tokenizer reports XML_TOK_NONE, otherwise
 * the error code of the first failure.
 */
- static enum XML_Error
- appendAttributeValue(XML_Parser parser, const ENCODING *enc, XML_Bool isCdata,
- const char *ptr, const char *end, STRING_POOL *pool,
- enum XML_Account account) {
- DTD *const dtd = parser->m_dtd; /* save one level of indirection */
- #ifndef XML_DTD
- UNUSED_P(account);
- #endif
- for (;;) {
- const char *next
- = ptr; /* XmlAttributeValueTok doesn't always set the last arg */
- int tok = XmlAttributeValueTok(enc, ptr, end, &next);
- #if XML_GE == 1
/* Account for the bytes of this token; give up with an amplification
   error if the accounting check rejects them. */
- if (! accountingDiffTolerated(parser, tok, ptr, next, __LINE__, account)) {
- accountingOnAbort(parser);
- return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
- }
- #endif
- switch (tok) {
- case XML_TOK_NONE:
- return XML_ERROR_NONE;
- case XML_TOK_INVALID:
- if (enc == parser->m_encoding)
- parser->m_eventPtr = next;
- return XML_ERROR_INVALID_TOKEN;
- case XML_TOK_PARTIAL:
- if (enc == parser->m_encoding)
- parser->m_eventPtr = ptr;
- return XML_ERROR_INVALID_TOKEN;
- case XML_TOK_CHAR_REF: {
- XML_Char buf[XML_ENCODE_MAX];
- int i;
- int n = XmlCharRefNumber(enc, ptr);
- if (n < 0) {
- if (enc == parser->m_encoding)
- parser->m_eventPtr = ptr;
- return XML_ERROR_BAD_CHAR_REF;
- }
/* For non-CDATA values, drop a referenced space that would start the
   value or directly follow another space. */
- if (! isCdata && n == 0x20 /* space */
- && (poolLength(pool) == 0 || poolLastChar(pool) == 0x20))
- break;
- n = XmlEncode(n, (ICHAR *)buf);
- /* The XmlEncode() functions can never return 0 here. That
- * error return happens if the code point passed in is either
- * negative or greater than or equal to 0x110000. The
- * XmlCharRefNumber() functions will all return a number
- * strictly less than 0x110000 or a negative value if an error
- * occurred. The negative value is intercepted above, so
- * XmlEncode() is never passed a value it might return an
- * error for.
- */
- for (i = 0; i < n; i++) {
- if (! poolAppendChar(pool, buf[i]))
- return XML_ERROR_NO_MEMORY;
- }
- } break;
- case XML_TOK_DATA_CHARS:
- if (! poolAppend(pool, enc, ptr, next))
- return XML_ERROR_NO_MEMORY;
- break;
- case XML_TOK_TRAILING_CR:
/* Advance past exactly one minimum-width character (the CR). */
- next = ptr + enc->minBytesPerChar;
- /* fall through */
- case XML_TOK_ATTRIBUTE_VALUE_S:
- case XML_TOK_DATA_NEWLINE:
/* Whitespace becomes one 0x20, collapsed for non-CDATA values. */
- if (! isCdata && (poolLength(pool) == 0 || poolLastChar(pool) == 0x20))
- break;
- if (! poolAppendChar(pool, 0x20))
- return XML_ERROR_NO_MEMORY;
- break;
- case XML_TOK_ENTITY_REF: {
- const XML_Char *name;
- ENTITY *entity;
- char checkEntityDecl;
/* The name lies between the leading and trailing delimiter characters
   of the token, hence the minBytesPerChar offsets on both ends. */
- XML_Char ch = (XML_Char)XmlPredefinedEntityName(
- enc, ptr + enc->minBytesPerChar, next - enc->minBytesPerChar);
- if (ch) {
- #if XML_GE == 1
- /* NOTE: We are replacing 4-6 characters original input for 1 character
- * so there is no amplification and hence recording without
- * protection. */
- accountingDiffTolerated(parser, tok, (char *)&ch,
- ((char *)&ch) + sizeof(XML_Char), __LINE__,
- XML_ACCOUNT_ENTITY_EXPANSION);
- #endif /* XML_GE == 1 */
- if (! poolAppendChar(pool, ch))
- return XML_ERROR_NO_MEMORY;
- break;
- }
/* The name is only needed for the lookup, so it is stored in the
   temporary pool and discarded right afterwards. */
- name = poolStoreString(&parser->m_temp2Pool, enc,
- ptr + enc->minBytesPerChar,
- next - enc->minBytesPerChar);
- if (! name)
- return XML_ERROR_NO_MEMORY;
- entity = (ENTITY *)lookup(parser, &dtd->generalEntities, name, 0);
- poolDiscard(&parser->m_temp2Pool);
- /* First, determine if a check for an existing declaration is needed;
- if yes, check that the entity exists, and that it is internal.
- */
- if (pool == &dtd->pool) /* are we called from prolog? */
- checkEntityDecl =
- #ifdef XML_DTD
- parser->m_prologState.documentEntity &&
- #endif /* XML_DTD */
- (dtd->standalone ? ! parser->m_openInternalEntities
- : ! dtd->hasParamEntityRefs);
- else /* if (pool == &parser->m_tempPool): we are called from content */
- checkEntityDecl = ! dtd->hasParamEntityRefs || dtd->standalone;
- if (checkEntityDecl) {
- if (! entity)
- return XML_ERROR_UNDEFINED_ENTITY;
- else if (! entity->is_internal)
- return XML_ERROR_ENTITY_DECLARED_IN_PE;
- } else if (! entity) {
- /* Cannot report skipped entity here - see comments on
- parser->m_skippedEntityHandler.
- if (parser->m_skippedEntityHandler)
- parser->m_skippedEntityHandler(parser->m_handlerArg, name, 0);
- */
- /* Cannot call the default handler because this would be
- out of sync with the call to the startElementHandler.
- if ((pool == &parser->m_tempPool) && parser->m_defaultHandler)
- reportDefault(parser, enc, ptr, next);
- */
- break;
- }
- if (entity->open) {
- if (enc == parser->m_encoding) {
- /* It does not appear that this line can be executed.
- *
- * The "if (entity->open)" check catches recursive entity
- * definitions. In order to be called with an open
- * entity, it must have gone through this code before and
- * been through the recursive call to
- * appendAttributeValue() some lines below. That call
- * sets the local encoding ("enc") to the parser's
- * internal encoding (internal_utf8 or internal_utf16),
- * which can never be the same as the principle encoding.
- * It doesn't appear there is another code path that gets
- * here with entity->open being TRUE.
- *
- * Since it is not certain that this logic is watertight,
- * we keep the line and merely exclude it from coverage
- * tests.
- */
- parser->m_eventPtr = ptr; /* LCOV_EXCL_LINE */
- }
- return XML_ERROR_RECURSIVE_ENTITY_REF;
- }
- if (entity->notation) {
- if (enc == parser->m_encoding)
- parser->m_eventPtr = ptr;
- return XML_ERROR_BINARY_ENTITY_REF;
- }
- if (! entity->textPtr) {
- if (enc == parser->m_encoding)
- parser->m_eventPtr = ptr;
- return XML_ERROR_ATTRIBUTE_EXTERNAL_ENTITY_REF;
- } else {
- enum XML_Error result;
- const XML_Char *textEnd = entity->textPtr + entity->textLen;
/* Keep the entity marked open for the duration of the recursive
   expansion so that a self-reference hits the entity->open check. */
- entity->open = XML_TRUE;
- #if XML_GE == 1
- entityTrackingOnOpen(parser, entity, __LINE__);
- #endif
- result = appendAttributeValue(parser, parser->m_internalEncoding,
- isCdata, (const char *)entity->textPtr,
- (const char *)textEnd, pool,
- XML_ACCOUNT_ENTITY_EXPANSION);
- #if XML_GE == 1
- entityTrackingOnClose(parser, entity, __LINE__);
- #endif
- entity->open = XML_FALSE;
- if (result)
- return result;
- }
- } break;
- default:
- /* The only token returned by XmlAttributeValueTok() that does
- * not have an explicit case here is XML_TOK_PARTIAL_CHAR.
- * Getting that would require an entity name to contain an
- * incomplete XML character (e.g. \xE2\x82); however previous
- * tokenisers will have already recognised and rejected such
- * names before XmlAttributeValueTok() gets a look-in. This
- * default case should be retained as a safety net, but the code
- * excluded from coverage tests.
- *
- * LCOV_EXCL_START
- */
- if (enc == parser->m_encoding)
- parser->m_eventPtr = ptr;
- return XML_ERROR_UNEXPECTED_STATE;
- /* LCOV_EXCL_STOP */
- }
/* Token handled; continue with the remainder of the value. */
- ptr = next;
- }
- /* not reached */
- }
- #if XML_GE == 1
/* Tokenizes the entity value text in [entityTextPtr, entityTextEnd) with
 * XmlEntityValueTok() and appends the result to dtd->entityValuePool.
 *
 * Per token:
 *   - general entity references and data characters are appended as they
 *     appear in the input (via poolAppend(), i.e. references are not
 *     expanded here);
 *   - trailing CR and newline tokens are stored as a single 0xA;
 *   - character references are decoded and re-encoded with XmlEncode();
 *   - parameter entity references are, when XML_DTD is defined and either
 *     parser->m_isParamEntity is set or enc is not the parser's encoding,
 *     resolved: external ones through m_externalEntityRefHandler, internal
 *     ones by a recursive call on the entity text.  Otherwise they yield
 *     XML_ERROR_PARAM_ENTITY_REF.
 *
 * Under XML_DTD, m_prologState.inEntityValue is set to 1 for the duration
 * of the call and restored at the endEntityValue label.
 *
 * Returns XML_ERROR_NONE on XML_TOK_NONE, otherwise an error code.
 */
- static enum XML_Error
- storeEntityValue(XML_Parser parser, const ENCODING *enc,
- const char *entityTextPtr, const char *entityTextEnd,
- enum XML_Account account) {
- DTD *const dtd = parser->m_dtd; /* save one level of indirection */
- STRING_POOL *pool = &(dtd->entityValuePool);
- enum XML_Error result = XML_ERROR_NONE;
- # ifdef XML_DTD
- int oldInEntityValue = parser->m_prologState.inEntityValue;
- parser->m_prologState.inEntityValue = 1;
- # else
- UNUSED_P(account);
- # endif /* XML_DTD */
- /* never return Null for the value argument in EntityDeclHandler,
- since this would indicate an external entity; therefore we
- have to make sure that entityValuePool.start is not null */
/* NOTE(review): the early return below does not pass through
   endEntityValue, so under XML_DTD inEntityValue is left at 1 on this
   path - confirm this is intended. */
- if (! pool->blocks) {
- if (! poolGrow(pool))
- return XML_ERROR_NO_MEMORY;
- }
- for (;;) {
- const char *next
- = entityTextPtr; /* XmlEntityValueTok doesn't always set the last arg */
- int tok = XmlEntityValueTok(enc, entityTextPtr, entityTextEnd, &next);
/* Account for the bytes of this token before acting on it. */
- if (! accountingDiffTolerated(parser, tok, entityTextPtr, next, __LINE__,
- account)) {
- accountingOnAbort(parser);
- result = XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
- goto endEntityValue;
- }
- switch (tok) {
- case XML_TOK_PARAM_ENTITY_REF:
- # ifdef XML_DTD
- if (parser->m_isParamEntity || enc != parser->m_encoding) {
- const XML_Char *name;
- ENTITY *entity;
/* The name is only needed for the lookup; it is discarded from the
   temporary pool right after. */
- name = poolStoreString(&parser->m_tempPool, enc,
- entityTextPtr + enc->minBytesPerChar,
- next - enc->minBytesPerChar);
- if (! name) {
- result = XML_ERROR_NO_MEMORY;
- goto endEntityValue;
- }
- entity = (ENTITY *)lookup(parser, &dtd->paramEntities, name, 0);
- poolDiscard(&parser->m_tempPool);
- if (! entity) {
- /* not a well-formedness error - see XML 1.0: WFC Entity Declared */
- /* cannot report skipped entity here - see comments on
- parser->m_skippedEntityHandler
- if (parser->m_skippedEntityHandler)
- parser->m_skippedEntityHandler(parser->m_handlerArg, name, 0);
- */
- dtd->keepProcessing = dtd->standalone;
- goto endEntityValue;
- }
/* Reject a reference to an entity that is currently being expanded
   or that is the entity currently being declared. */
- if (entity->open || (entity == parser->m_declEntity)) {
- if (enc == parser->m_encoding)
- parser->m_eventPtr = entityTextPtr;
- result = XML_ERROR_RECURSIVE_ENTITY_REF;
- goto endEntityValue;
- }
- if (entity->systemId) {
/* External parameter entity: delegate to the application handler,
   if one is set. */
- if (parser->m_externalEntityRefHandler) {
- dtd->paramEntityRead = XML_FALSE;
- entity->open = XML_TRUE;
- entityTrackingOnOpen(parser, entity, __LINE__);
- if (! parser->m_externalEntityRefHandler(
- parser->m_externalEntityRefHandlerArg, 0, entity->base,
- entity->systemId, entity->publicId)) {
- entityTrackingOnClose(parser, entity, __LINE__);
- entity->open = XML_FALSE;
- result = XML_ERROR_EXTERNAL_ENTITY_HANDLING;
- goto endEntityValue;
- }
- entityTrackingOnClose(parser, entity, __LINE__);
- entity->open = XML_FALSE;
- if (! dtd->paramEntityRead)
- dtd->keepProcessing = dtd->standalone;
- } else
- dtd->keepProcessing = dtd->standalone;
- } else {
/* Internal parameter entity: expand its stored text recursively,
   keeping it marked open meanwhile. */
- entity->open = XML_TRUE;
- entityTrackingOnOpen(parser, entity, __LINE__);
- result = storeEntityValue(
- parser, parser->m_internalEncoding, (const char *)entity->textPtr,
- (const char *)(entity->textPtr + entity->textLen),
- XML_ACCOUNT_ENTITY_EXPANSION);
- entityTrackingOnClose(parser, entity, __LINE__);
- entity->open = XML_FALSE;
- if (result)
- goto endEntityValue;
- }
- break;
- }
- # endif /* XML_DTD */
- /* In the internal subset, PE references are not legal
- within markup declarations, e.g entity values in this case. */
- parser->m_eventPtr = entityTextPtr;
- result = XML_ERROR_PARAM_ENTITY_REF;
- goto endEntityValue;
- case XML_TOK_NONE:
- result = XML_ERROR_NONE;
- goto endEntityValue;
- case XML_TOK_ENTITY_REF:
- case XML_TOK_DATA_CHARS:
/* Both token kinds are copied through as they appear in the input. */
- if (! poolAppend(pool, enc, entityTextPtr, next)) {
- result = XML_ERROR_NO_MEMORY;
- goto endEntityValue;
- }
- break;
- case XML_TOK_TRAILING_CR:
/* Advance past exactly one minimum-width character (the CR). */
- next = entityTextPtr + enc->minBytesPerChar;
- /* fall through */
- case XML_TOK_DATA_NEWLINE:
/* Grow the pool only when it is full, then store a single 0xA. */
- if (pool->end == pool->ptr && ! poolGrow(pool)) {
- result = XML_ERROR_NO_MEMORY;
- goto endEntityValue;
- }
- *(pool->ptr)++ = 0xA;
- break;
- case XML_TOK_CHAR_REF: {
- XML_Char buf[XML_ENCODE_MAX];
- int i;
- int n = XmlCharRefNumber(enc, entityTextPtr);
- if (n < 0) {
- if (enc == parser->m_encoding)
- parser->m_eventPtr = entityTextPtr;
- result = XML_ERROR_BAD_CHAR_REF;
- goto endEntityValue;
- }
- n = XmlEncode(n, (ICHAR *)buf);
- /* The XmlEncode() functions can never return 0 here. That
- * error return happens if the code point passed in is either
- * negative or greater than or equal to 0x110000. The
- * XmlCharRefNumber() functions will all return a number
- * strictly less than 0x110000 or a negative value if an error
- * occurred. The negative value is intercepted above, so
- * XmlEncode() is never passed a value it might return an
- * error for.
- */
- for (i = 0; i < n; i++) {
- if (pool->end == pool->ptr && ! poolGrow(pool)) {
- result = XML_ERROR_NO_MEMORY;
- goto endEntityValue;
- }
- *(pool->ptr)++ = buf[i];
- }
- } break;
- case XML_TOK_PARTIAL:
- if (enc == parser->m_encoding)
- parser->m_eventPtr = entityTextPtr;
- result = XML_ERROR_INVALID_TOKEN;
- goto endEntityValue;
- case XML_TOK_INVALID:
- if (enc == parser->m_encoding)
- parser->m_eventPtr = next;
- result = XML_ERROR_INVALID_TOKEN;
- goto endEntityValue;
- default:
- /* This default case should be unnecessary -- all the tokens
- * that XmlEntityValueTok() can return have their own explicit
- * cases -- but should be retained for safety. We do however
- * exclude it from the coverage statistics.
- *
- * LCOV_EXCL_START
- */
- if (enc == parser->m_encoding)
- parser->m_eventPtr = entityTextPtr;
- result = XML_ERROR_UNEXPECTED_STATE;
- goto endEntityValue;
- /* LCOV_EXCL_STOP */
- }
/* Token handled; continue with the remainder of the value. */
- entityTextPtr = next;
- }
/* Common exit: restore the saved inEntityValue flag (XML_DTD only). */
- endEntityValue:
- # ifdef XML_DTD
- parser->m_prologState.inEntityValue = oldInEntityValue;
- # endif /* XML_DTD */
- return result;
- }
- #else /* XML_GE == 0 */
- static enum XML_Error
- storeSelfEntityValue(XML_Parser parser, ENTITY *entity) {
- // This will store "&entity123;" in entity->textPtr
- // to end up as "&entity123;" in the handler.
- const char *const entity_start = "&";
- const char *const entity_end = ";";
- STRING_POOL *const pool = &(parser->m_dtd->entityValuePool);
- if (! poolAppendString(pool, entity_start)
- || ! poolAppendString(pool, entity->name)
- || ! poolAppendString(pool, entity_end)) {
- poolDiscard(pool);
- return XML_ERROR_NO_MEMORY;
- }
- entity->textPtr = poolStart(pool);
- entity->textLen = (int)(poolLength(pool));
- poolFinish(pool);
- return XML_ERROR_NONE;
- }
- #endif /* XML_GE == 0 */
- static void FASTCALL
- normalizeLines(XML_Char *s) {
- XML_Char *p;
- for (;; s++) {
- if (*s == XML_T('\0'))
- return;
- if (*s == 0xD)
- break;
- }
- p = s;
- do {
- if (*s == 0xD) {
- *p++ = 0xA;
- if (*++s == 0xA)
- s++;
- } else
- *p++ = *s++;
- } while (*s);
- *p = XML_T('\0');
- }
- static int
- reportProcessingInstruction(XML_Parser parser, const ENCODING *enc,
- const char *start, const char *end) {
- const XML_Char *target;
- XML_Char *data;
- const char *tem;
- if (! parser->m_processingInstructionHandler) {
- if (parser->m_defaultHandler)
- reportDefault(parser, enc, start, end);
- return 1;
- }
- start += enc->minBytesPerChar * 2;
- tem = start + XmlNameLength(enc, start);
- target = poolStoreString(&parser->m_tempPool, enc, start, tem);
- if (! target)
- return 0;
- poolFinish(&parser->m_tempPool);
- data = poolStoreString(&parser->m_tempPool, enc, XmlSkipS(enc, tem),
- end - enc->minBytesPerChar * 2);
- if (! data)
- return 0;
- normalizeLines(data);
- parser->m_processingInstructionHandler(parser->m_handlerArg, target, data);
- poolClear(&parser->m_tempPool);
- return 1;
- }
- static int
- reportComment(XML_Parser parser, const ENCODING *enc, const char *start,
- const char *end) {
- XML_Char *data;
- if (! parser->m_commentHandler) {
- if (parser->m_defaultHandler)
- reportDefault(parser, enc, start, end);
- return 1;
- }
- data = poolStoreString(&parser->m_tempPool, enc,
- start + enc->minBytesPerChar * 4,
- end - enc->minBytesPerChar * 3);
- if (! data)
- return 0;
- normalizeLines(data);
- parser->m_commentHandler(parser->m_handlerArg, data);
- poolClear(&parser->m_tempPool);
- return 1;
- }
/* Passes the input text [s, end) in encoding enc to parser->m_defaultHandler.
 *
 * If MUST_CONVERT(enc, s) holds, the text is converted piecewise with
 * XmlConvert() into parser->m_dataBuf and the handler is called once per
 * converted piece; the event pointers are advanced around each call.
 * Otherwise the handler receives the input directly, reinterpreted as
 * XML_Char.
 *
 * parser->m_defaultHandler is called without a NULL check here; the callers
 * visible in this file (reportProcessingInstruction, reportComment) test it
 * before calling.
 */
- static void
- reportDefault(XML_Parser parser, const ENCODING *enc, const char *s,
- const char *end) {
- if (MUST_CONVERT(enc, s)) {
- enum XML_Convert_Result convert_res;
- const char **eventPP;
- const char **eventEndPP;
/* Select which pair of event pointers to keep up to date. */
- if (enc == parser->m_encoding) {
- eventPP = &parser->m_eventPtr;
- eventEndPP = &parser->m_eventEndPtr;
- } else {
- /* To get here, two things must be true; the parser must be
- * using a character encoding that is not the same as the
- * encoding passed in, and the encoding passed in must need
- * conversion to the internal format (UTF-8 unless XML_UNICODE
- * is defined). The only occasions on which the encoding passed
- * in is not the same as the parser's encoding are when it is
- * the internal encoding (e.g. a previously defined parameter
- * entity, already converted to internal format). This by
- * definition doesn't need conversion, so the whole branch never
- * gets executed.
- *
- * For safety's sake we don't delete these lines and merely
- * exclude them from coverage statistics.
- *
- * LCOV_EXCL_START
- */
- eventPP = &(parser->m_openInternalEntities->internalEventPtr);
- eventEndPP = &(parser->m_openInternalEntities->internalEventEndPtr);
- /* LCOV_EXCL_STOP */
- }
/* Convert and report one buffer-full at a time.  The end-of-event pointer
   is set before the handler call and the start-of-event pointer after it,
   so during the call they bracket the piece being reported. */
- do {
- ICHAR *dataPtr = (ICHAR *)parser->m_dataBuf;
- convert_res
- = XmlConvert(enc, &s, end, &dataPtr, (ICHAR *)parser->m_dataBufEnd);
- *eventEndPP = s;
- parser->m_defaultHandler(parser->m_handlerArg, parser->m_dataBuf,
- (int)(dataPtr - (ICHAR *)parser->m_dataBuf));
- *eventPP = s;
- } while ((convert_res != XML_CONVERT_COMPLETED)
- && (convert_res != XML_CONVERT_INPUT_INCOMPLETE));
- } else
/* No conversion needed: the length is counted in XML_Char units. */
- parser->m_defaultHandler(
- parser->m_handlerArg, (const XML_Char *)s,
- (int)((const XML_Char *)end - (const XML_Char *)s));
- }
- static int
- defineAttribute(ELEMENT_TYPE *type, ATTRIBUTE_ID *attId, XML_Bool isCdata,
- XML_Bool isId, const XML_Char *value, XML_Parser parser) {
- DEFAULT_ATTRIBUTE *att;
- if (value || isId) {
- /* The handling of default attributes gets messed up if we have
- a default which duplicates a non-default. */
- int i;
- for (i = 0; i < type->nDefaultAtts; i++)
- if (attId == type->defaultAtts[i].id)
- return 1;
- if (isId && ! type->idAtt && ! attId->xmlns)
- type->idAtt = attId;
- }
- if (type->nDefaultAtts == type->allocDefaultAtts) {
- if (type->allocDefaultAtts == 0) {
- type->allocDefaultAtts = 8;
- type->defaultAtts = (DEFAULT_ATTRIBUTE *)MALLOC(
- parser, type->allocDefaultAtts * sizeof(DEFAULT_ATTRIBUTE));
- if (! type->defaultAtts) {
- type->allocDefaultAtts = 0;
- return 0;
- }
- } else {
- DEFAULT_ATTRIBUTE *temp;
- /* Detect and prevent integer overflow */
- if (type->allocDefaultAtts > INT_MAX / 2) {
- return 0;
- }
- int count = type->allocDefaultAtts * 2;
- /* Detect and prevent integer overflow.
- * The preprocessor guard addresses the "always false" warning
- * from -Wtype-limits on platforms where
- * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
- #if UINT_MAX >= SIZE_MAX
- if ((unsigned)count > (size_t)(-1) / sizeof(DEFAULT_ATTRIBUTE)) {
- return 0;
- }
- #endif
- temp = (DEFAULT_ATTRIBUTE *)REALLOC(parser, type->defaultAtts,
- (count * sizeof(DEFAULT_ATTRIBUTE)));
- if (temp == NULL)
- return 0;
- type->allocDefaultAtts = count;
- type->defaultAtts = temp;
- }
- }
- att = type->defaultAtts + type->nDefaultAtts;
- att->id = attId;
- att->value = value;
- att->isCdata = isCdata;
- if (! isCdata)
- attId->maybeTokenized = XML_TRUE;
- type->nDefaultAtts += 1;
- return 1;
- }
- static int
- setElementTypePrefix(XML_Parser parser, ELEMENT_TYPE *elementType) {
- DTD *const dtd = parser->m_dtd; /* save one level of indirection */
- const XML_Char *name;
- for (name = elementType->name; *name; name++) {
- if (*name == XML_T(ASCII_COLON)) {
- PREFIX *prefix;
- const XML_Char *s;
- for (s = elementType->name; s != name; s++) {
- if (! poolAppendChar(&dtd->pool, *s))
- return 0;
- }
- if (! poolAppendChar(&dtd->pool, XML_T('\0')))
- return 0;
- prefix = (PREFIX *)lookup(parser, &dtd->prefixes, poolStart(&dtd->pool),
- sizeof(PREFIX));
- if (! prefix)
- return 0;
- if (prefix->name == poolStart(&dtd->pool))
- poolFinish(&dtd->pool);
- else
- poolDiscard(&dtd->pool);
- elementType->prefix = prefix;
- break;
- }
- }
- return 1;
- }
- static ATTRIBUTE_ID *
- getAttributeId(XML_Parser parser, const ENCODING *enc, const char *start,
- const char *end) {
- DTD *const dtd = parser->m_dtd; /* save one level of indirection */
- ATTRIBUTE_ID *id;
- const XML_Char *name;
- if (! poolAppendChar(&dtd->pool, XML_T('\0')))
- return NULL;
- name = poolStoreString(&dtd->pool, enc, start, end);
- if (! name)
- return NULL;
- /* skip quotation mark - its storage will be reused (like in name[-1]) */
- ++name;
- id = (ATTRIBUTE_ID *)lookup(parser, &dtd->attributeIds, name,
- sizeof(ATTRIBUTE_ID));
- if (! id)
- return NULL;
- if (id->name != name)
- poolDiscard(&dtd->pool);
- else {
- poolFinish(&dtd->pool);
- if (! parser->m_ns)
- ;
- else if (name[0] == XML_T(ASCII_x) && name[1] == XML_T(ASCII_m)
- && name[2] == XML_T(ASCII_l) && name[3] == XML_T(ASCII_n)
- && name[4] == XML_T(ASCII_s)
- && (name[5] == XML_T('\0') || name[5] == XML_T(ASCII_COLON))) {
- if (name[5] == XML_T('\0'))
- id->prefix = &dtd->defaultPrefix;
- else
- id->prefix = (PREFIX *)lookup(parser, &dtd->prefixes, name + 6,
- sizeof(PREFIX));
- id->xmlns = XML_TRUE;
- } else {
- int i;
- for (i = 0; name[i]; i++) {
- /* attributes without prefix are *not* in the default namespace */
- if (name[i] == XML_T(ASCII_COLON)) {
- int j;
- for (j = 0; j < i; j++) {
- if (! poolAppendChar(&dtd->pool, name[j]))
- return NULL;
- }
- if (! poolAppendChar(&dtd->pool, XML_T('\0')))
- return NULL;
- id->prefix = (PREFIX *)lookup(parser, &dtd->prefixes,
- poolStart(&dtd->pool), sizeof(PREFIX));
- if (! id->prefix)
- return NULL;
- if (id->prefix->name == poolStart(&dtd->pool))
- poolFinish(&dtd->pool);
- else
- poolDiscard(&dtd->pool);
- break;
- }
- }
- }
- }
- return id;
- }
- #define CONTEXT_SEP XML_T(ASCII_FF)
/* Builds a context string in parser->m_tempPool and returns its start
 * (parser->m_tempPool.start), or NULL if appending to the pool fails.
 *
 * The string consists of the following items, separated by CONTEXT_SEP and
 * terminated by a NUL:
 *   - "=<uri>" for the default prefix, if it has a binding;
 *   - "<prefix>=<uri>" for every entry of dtd->prefixes that has a binding;
 *   - "<name>" for every entry of dtd->generalEntities whose open flag is
 *     set.
 * When parser->m_namespaceSeparator is non-zero, one character less than
 * binding->uriLen is copied from each URI.
 *
 * The pool is not finished or cleared here.
 */
- static const XML_Char *
- getContext(XML_Parser parser) {
- DTD *const dtd = parser->m_dtd; /* save one level of indirection */
- HASH_TABLE_ITER iter;
- XML_Bool needSep = XML_FALSE;
/* Default namespace binding first: an empty prefix name followed by '='. */
- if (dtd->defaultPrefix.binding) {
- int i;
- int len;
- if (! poolAppendChar(&parser->m_tempPool, XML_T(ASCII_EQUALS)))
- return NULL;
- len = dtd->defaultPrefix.binding->uriLen;
- if (parser->m_namespaceSeparator)
- len--;
- for (i = 0; i < len; i++) {
- if (! poolAppendChar(&parser->m_tempPool,
- dtd->defaultPrefix.binding->uri[i])) {
- /* Because of memory caching, I don't believe this line can be
- * executed.
- *
- * This is part of a loop copying the default prefix binding
- * URI into the parser's temporary string pool. Previously,
- * that URI was copied into the same string pool, with a
- * terminating NUL character, as part of setContext(). When
- * the pool was cleared, that leaves a block definitely big
- * enough to hold the URI on the free block list of the pool.
- * The URI copy in getContext() therefore cannot run out of
- * memory.
- *
- * If the pool is used between the setContext() and
- * getContext() calls, the worst it can do is leave a bigger
- * block on the front of the free list. Given that this is
- * all somewhat inobvious and program logic can be changed, we
- * don't delete the line but we do exclude it from the test
- * coverage statistics.
- */
- return NULL; /* LCOV_EXCL_LINE */
- }
- }
- needSep = XML_TRUE;
- }
/* Then every bound prefix as "<prefix>=<uri>". */
- hashTableIterInit(&iter, &(dtd->prefixes));
- for (;;) {
- int i;
- int len;
- const XML_Char *s;
- PREFIX *prefix = (PREFIX *)hashTableIterNext(&iter);
- if (! prefix)
- break;
- if (! prefix->binding) {
- /* This test appears to be (justifiable) paranoia. There does
- * not seem to be a way of injecting a prefix without a binding
- * that doesn't get errored long before this function is called.
- * The test should remain for safety's sake, so we instead
- * exclude the following line from the coverage statistics.
- */
- continue; /* LCOV_EXCL_LINE */
- }
- if (needSep && ! poolAppendChar(&parser->m_tempPool, CONTEXT_SEP))
- return NULL;
- for (s = prefix->name; *s; s++)
- if (! poolAppendChar(&parser->m_tempPool, *s))
- return NULL;
- if (! poolAppendChar(&parser->m_tempPool, XML_T(ASCII_EQUALS)))
- return NULL;
- len = prefix->binding->uriLen;
- if (parser->m_namespaceSeparator)
- len--;
- for (i = 0; i < len; i++)
- if (! poolAppendChar(&parser->m_tempPool, prefix->binding->uri[i]))
- return NULL;
- needSep = XML_TRUE;
- }
/* Finally the names of all general entities that are currently open. */
- hashTableIterInit(&iter, &(dtd->generalEntities));
- for (;;) {
- const XML_Char *s;
- ENTITY *e = (ENTITY *)hashTableIterNext(&iter);
- if (! e)
- break;
- if (! e->open)
- continue;
- if (needSep && ! poolAppendChar(&parser->m_tempPool, CONTEXT_SEP))
- return NULL;
- for (s = e->name; *s; s++)
- if (! poolAppendChar(&parser->m_tempPool, *s))
- return 0;
- needSep = XML_TRUE;
- }
- if (! poolAppendChar(&parser->m_tempPool, XML_T('\0')))
- return NULL;
- return parser->m_tempPool.start;
- }
/* Applies a context string (items separated by CONTEXT_SEP, NUL-terminated;
 * the same layout getContext() produces) to the parser.
 *
 *   - An item without '=' is taken as a general entity name: if such an
 *     entity exists in dtd->generalEntities, its open flag is set.
 *   - An item "<prefix>=<uri>" binds the prefix (the default prefix when the
 *     part before '=' is empty) to the URI via addBinding(), recording the
 *     binding in parser->m_inheritedBindings.  A newly created prefix gets
 *     its name copied into dtd->pool.
 *
 * parser->m_tempPool is used as scratch space for names and URIs.
 *
 * Returns XML_FALSE if context is NULL, on allocation failure, or if
 * addBinding() reports an error; XML_TRUE otherwise.
 */
- static XML_Bool
- setContext(XML_Parser parser, const XML_Char *context) {
- if (context == NULL) {
- return XML_FALSE;
- }
- DTD *const dtd = parser->m_dtd; /* save one level of indirection */
/* s scans ahead within the current item; context marks the start of the
   item still to be processed and ends the loop once it reaches the NUL. */
- const XML_Char *s = context;
- while (*context != XML_T('\0')) {
- if (*s == CONTEXT_SEP || *s == XML_T('\0')) {
/* End of an item without '=': the accumulated text is an entity name. */
- ENTITY *e;
- if (! poolAppendChar(&parser->m_tempPool, XML_T('\0')))
- return XML_FALSE;
- e = (ENTITY *)lookup(parser, &dtd->generalEntities,
- poolStart(&parser->m_tempPool), 0);
- if (e)
- e->open = XML_TRUE;
- if (*s != XML_T('\0'))
- s++;
- context = s;
- poolDiscard(&parser->m_tempPool);
- } else if (*s == XML_T(ASCII_EQUALS)) {
/* '=' reached: the accumulated text (possibly empty) is a prefix name. */
- PREFIX *prefix;
- if (poolLength(&parser->m_tempPool) == 0)
- prefix = &dtd->defaultPrefix;
- else {
- if (! poolAppendChar(&parser->m_tempPool, XML_T('\0')))
- return XML_FALSE;
- prefix
- = (PREFIX *)lookup(parser, &dtd->prefixes,
- poolStart(&parser->m_tempPool), sizeof(PREFIX));
- if (! prefix)
- return XML_FALSE;
/* A new table entry still points into the scratch pool; give it a
   copy of the name in dtd->pool before the scratch text is discarded. */
- if (prefix->name == poolStart(&parser->m_tempPool)) {
- prefix->name = poolCopyString(&dtd->pool, prefix->name);
- if (! prefix->name)
- return XML_FALSE;
- }
- poolDiscard(&parser->m_tempPool);
- }
/* Collect the URI: everything up to the next separator or the NUL. */
- for (context = s + 1; *context != CONTEXT_SEP && *context != XML_T('\0');
- context++)
- if (! poolAppendChar(&parser->m_tempPool, *context))
- return XML_FALSE;
- if (! poolAppendChar(&parser->m_tempPool, XML_T('\0')))
- return XML_FALSE;
- if (addBinding(parser, prefix, NULL, poolStart(&parser->m_tempPool),
- &parser->m_inheritedBindings)
- != XML_ERROR_NONE)
- return XML_FALSE;
- poolDiscard(&parser->m_tempPool);
- if (*context != XML_T('\0'))
- ++context;
- s = context;
- } else {
/* Ordinary character: accumulate it as part of the current name. */
- if (! poolAppendChar(&parser->m_tempPool, *s))
- return XML_FALSE;
- s++;
- }
- }
- return XML_TRUE;
- }
- static void FASTCALL
- normalizePublicId(XML_Char *publicId) {
- XML_Char *p = publicId;
- XML_Char *s;
- for (s = publicId; *s; s++) {
- switch (*s) {
- case 0x20:
- case 0xD:
- case 0xA:
- if (p != publicId && p[-1] != 0x20)
- *p++ = 0x20;
- break;
- default:
- *p++ = *s;
- }
- }
- if (p != publicId && p[-1] == 0x20)
- --p;
- *p = XML_T('\0');
- }
- static DTD *
- dtdCreate(const XML_Memory_Handling_Suite *ms) {
- DTD *p = ms->malloc_fcn(sizeof(DTD));
- if (p == NULL)
- return p;
- poolInit(&(p->pool), ms);
- poolInit(&(p->entityValuePool), ms);
- hashTableInit(&(p->generalEntities), ms);
- hashTableInit(&(p->elementTypes), ms);
- hashTableInit(&(p->attributeIds), ms);
- hashTableInit(&(p->prefixes), ms);
- #ifdef XML_DTD
- p->paramEntityRead = XML_FALSE;
- hashTableInit(&(p->paramEntities), ms);
- #endif /* XML_DTD */
- p->defaultPrefix.name = NULL;
- p->defaultPrefix.binding = NULL;
- p->in_eldecl = XML_FALSE;
- p->scaffIndex = NULL;
- p->scaffold = NULL;
- p->scaffLevel = 0;
- p->scaffSize = 0;
- p->scaffCount = 0;
- p->contentStringLen = 0;
- p->keepProcessing = XML_TRUE;
- p->hasParamEntityRefs = XML_FALSE;
- p->standalone = XML_FALSE;
- return p;
- }
- static void
- dtdReset(DTD *p, const XML_Memory_Handling_Suite *ms) {
- HASH_TABLE_ITER iter;
- hashTableIterInit(&iter, &(p->elementTypes));
- for (;;) {
- ELEMENT_TYPE *e = (ELEMENT_TYPE *)hashTableIterNext(&iter);
- if (! e)
- break;
- if (e->allocDefaultAtts != 0)
- ms->free_fcn(e->defaultAtts);
- }
- hashTableClear(&(p->generalEntities));
- #ifdef XML_DTD
- p->paramEntityRead = XML_FALSE;
- hashTableClear(&(p->paramEntities));
- #endif /* XML_DTD */
- hashTableClear(&(p->elementTypes));
- hashTableClear(&(p->attributeIds));
- hashTableClear(&(p->prefixes));
- poolClear(&(p->pool));
- poolClear(&(p->entityValuePool));
- p->defaultPrefix.name = NULL;
- p->defaultPrefix.binding = NULL;
- p->in_eldecl = XML_FALSE;
- ms->free_fcn(p->scaffIndex);
- p->scaffIndex = NULL;
- ms->free_fcn(p->scaffold);
- p->scaffold = NULL;
- p->scaffLevel = 0;
- p->scaffSize = 0;
- p->scaffCount = 0;
- p->contentStringLen = 0;
- p->keepProcessing = XML_TRUE;
- p->hasParamEntityRefs = XML_FALSE;
- p->standalone = XML_FALSE;
- }
- static void
- dtdDestroy(DTD *p, XML_Bool isDocEntity, const XML_Memory_Handling_Suite *ms) {
- HASH_TABLE_ITER iter;
- hashTableIterInit(&iter, &(p->elementTypes));
- for (;;) {
- ELEMENT_TYPE *e = (ELEMENT_TYPE *)hashTableIterNext(&iter);
- if (! e)
- break;
- if (e->allocDefaultAtts != 0)
- ms->free_fcn(e->defaultAtts);
- }
- hashTableDestroy(&(p->generalEntities));
- #ifdef XML_DTD
- hashTableDestroy(&(p->paramEntities));
- #endif /* XML_DTD */
- hashTableDestroy(&(p->elementTypes));
- hashTableDestroy(&(p->attributeIds));
- hashTableDestroy(&(p->prefixes));
- poolDestroy(&(p->pool));
- poolDestroy(&(p->entityValuePool));
- if (isDocEntity) {
- ms->free_fcn(p->scaffIndex);
- ms->free_fcn(p->scaffold);
- }
- ms->free_fcn(p);
- }
- /* Do a deep copy of the DTD. Return 0 for out of memory, non-zero otherwise.
- The new DTD has already been initialized.
- */
/* Details:
 *   - Copied in this order: prefix table, attribute-id table, element-type
 *     table (including default attributes), general entity table and, under
 *     XML_DTD, parameter entity table; then the scalar flags.
 *   - All names and default values are duplicated into newDtd->pool with
 *     poolCopyString(); cross references (prefixes, attribute ids) are
 *     re-resolved by name in the new tables.
 *   - The scaffold and scaffIndex pointers are copied as-is, i.e. shared
 *     with oldDtd rather than duplicated.
 *   - oldParser is only passed on to lookup() and copyEntityTable(); ms is
 *     used to allocate the defaultAtts arrays.
 */
- static int
- dtdCopy(XML_Parser oldParser, DTD *newDtd, const DTD *oldDtd,
- const XML_Memory_Handling_Suite *ms) {
- HASH_TABLE_ITER iter;
- /* Copy the prefix table. */
- hashTableIterInit(&iter, &(oldDtd->prefixes));
- for (;;) {
- const XML_Char *name;
- const PREFIX *oldP = (PREFIX *)hashTableIterNext(&iter);
- if (! oldP)
- break;
- name = poolCopyString(&(newDtd->pool), oldP->name);
- if (! name)
- return 0;
- if (! lookup(oldParser, &(newDtd->prefixes), name, sizeof(PREFIX)))
- return 0;
- }
- hashTableIterInit(&iter, &(oldDtd->attributeIds));
- /* Copy the attribute id table. */
- for (;;) {
- ATTRIBUTE_ID *newA;
- const XML_Char *name;
- const ATTRIBUTE_ID *oldA = (ATTRIBUTE_ID *)hashTableIterNext(&iter);
- if (! oldA)
- break;
- /* Remember to allocate the scratch byte before the name. */
- if (! poolAppendChar(&(newDtd->pool), XML_T('\0')))
- return 0;
- name = poolCopyString(&(newDtd->pool), oldA->name);
- if (! name)
- return 0;
/* Step over the scratch character so that name points at the name. */
- ++name;
- newA = (ATTRIBUTE_ID *)lookup(oldParser, &(newDtd->attributeIds), name,
- sizeof(ATTRIBUTE_ID));
- if (! newA)
- return 0;
- newA->maybeTokenized = oldA->maybeTokenized;
- if (oldA->prefix) {
- newA->xmlns = oldA->xmlns;
/* The default prefix lives inside the DTD struct itself, so it is mapped
   by address; every other prefix is found by name in the new table.
   NOTE(review): the result of this lookup (final argument 0) is stored
   without a NULL check. */
- if (oldA->prefix == &oldDtd->defaultPrefix)
- newA->prefix = &newDtd->defaultPrefix;
- else
- newA->prefix = (PREFIX *)lookup(oldParser, &(newDtd->prefixes),
- oldA->prefix->name, 0);
- }
- }
- /* Copy the element type table. */
- hashTableIterInit(&iter, &(oldDtd->elementTypes));
- for (;;) {
- int i;
- ELEMENT_TYPE *newE;
- const XML_Char *name;
- const ELEMENT_TYPE *oldE = (ELEMENT_TYPE *)hashTableIterNext(&iter);
- if (! oldE)
- break;
- name = poolCopyString(&(newDtd->pool), oldE->name);
- if (! name)
- return 0;
- newE = (ELEMENT_TYPE *)lookup(oldParser, &(newDtd->elementTypes), name,
- sizeof(ELEMENT_TYPE));
- if (! newE)
- return 0;
- if (oldE->nDefaultAtts) {
- /* Detect and prevent integer overflow.
- * The preprocessor guard addresses the "always false" warning
- * from -Wtype-limits on platforms where
- * sizeof(int) < sizeof(size_t), e.g. on x86_64. */
- #if UINT_MAX >= SIZE_MAX
- if ((size_t)oldE->nDefaultAtts
- > ((size_t)(-1) / sizeof(DEFAULT_ATTRIBUTE))) {
- return 0;
- }
- #endif
/* The new array is sized to the number of attributes in use, not to
   the old allocation size. */
- newE->defaultAtts
- = ms->malloc_fcn(oldE->nDefaultAtts * sizeof(DEFAULT_ATTRIBUTE));
- if (! newE->defaultAtts) {
- return 0;
- }
- }
- if (oldE->idAtt)
- newE->idAtt = (ATTRIBUTE_ID *)lookup(oldParser, &(newDtd->attributeIds),
- oldE->idAtt->name, 0);
- newE->allocDefaultAtts = newE->nDefaultAtts = oldE->nDefaultAtts;
- if (oldE->prefix)
- newE->prefix = (PREFIX *)lookup(oldParser, &(newDtd->prefixes),
- oldE->prefix->name, 0);
/* Copy each default attribute: id re-resolved by name, value duplicated
   into the new pool (or NULL when there is none). */
- for (i = 0; i < newE->nDefaultAtts; i++) {
- newE->defaultAtts[i].id = (ATTRIBUTE_ID *)lookup(
- oldParser, &(newDtd->attributeIds), oldE->defaultAtts[i].id->name, 0);
- newE->defaultAtts[i].isCdata = oldE->defaultAtts[i].isCdata;
- if (oldE->defaultAtts[i].value) {
- newE->defaultAtts[i].value
- = poolCopyString(&(newDtd->pool), oldE->defaultAtts[i].value);
- if (! newE->defaultAtts[i].value)
- return 0;
- } else
- newE->defaultAtts[i].value = NULL;
- }
- }
- /* Copy the entity tables. */
- if (! copyEntityTable(oldParser, &(newDtd->generalEntities), &(newDtd->pool),
- &(oldDtd->generalEntities)))
- return 0;
- #ifdef XML_DTD
- if (! copyEntityTable(oldParser, &(newDtd->paramEntities), &(newDtd->pool),
- &(oldDtd->paramEntities)))
- return 0;
- newDtd->paramEntityRead = oldDtd->paramEntityRead;
- #endif /* XML_DTD */
- newDtd->keepProcessing = oldDtd->keepProcessing;
- newDtd->hasParamEntityRefs = oldDtd->hasParamEntityRefs;
- newDtd->standalone = oldDtd->standalone;
- /* Don't want deep copying for scaffolding */
- newDtd->in_eldecl = oldDtd->in_eldecl;
- newDtd->scaffold = oldDtd->scaffold;
- newDtd->contentStringLen = oldDtd->contentStringLen;
- newDtd->scaffSize = oldDtd->scaffSize;
- newDtd->scaffLevel = oldDtd->scaffLevel;
- newDtd->scaffIndex = oldDtd->scaffIndex;
- return 1;
- } /* End dtdCopy */
- static int
- copyEntityTable(XML_Parser oldParser, HASH_TABLE *newTable,
- STRING_POOL *newPool, const HASH_TABLE *oldTable) {
- HASH_TABLE_ITER iter;
- const XML_Char *cachedOldBase = NULL;
- const XML_Char *cachedNewBase = NULL;
- hashTableIterInit(&iter, oldTable);
- for (;;) {
- ENTITY *newE;
- const XML_Char *name;
- const ENTITY *oldE = (ENTITY *)hashTableIterNext(&iter);
- if (! oldE)
- break;
- name = poolCopyString(newPool, oldE->name);
- if (! name)
- return 0;
- newE = (ENTITY *)lookup(oldParser, newTable, name, sizeof(ENTITY));
- if (! newE)
- return 0;
- if (oldE->systemId) {
- const XML_Char *tem = poolCopyString(newPool, oldE->systemId);
- if (! tem)
- return 0;
- newE->systemId = tem;
- if (oldE->base) {
- if (oldE->base == cachedOldBase)
- newE->base = cachedNewBase;
- else {
- cachedOldBase = oldE->base;
- tem = poolCopyString(newPool, cachedOldBase);
- if (! tem)
- return 0;
- cachedNewBase = newE->base = tem;
- }
- }
- if (oldE->publicId) {
- tem = poolCopyString(newPool, oldE->publicId);
- if (! tem)
- return 0;
- newE->publicId = tem;
- }
- } else {
- const XML_Char *tem
- = poolCopyStringN(newPool, oldE->textPtr, oldE->textLen);
- if (! tem)
- return 0;
- newE->textPtr = tem;
- newE->textLen = oldE->textLen;
- }
- if (oldE->notation) {
- const XML_Char *tem = poolCopyString(newPool, oldE->notation);
- if (! tem)
- return 0;
- newE->notation = tem;
- }
- newE->is_param = oldE->is_param;
- newE->is_internal = oldE->is_internal;
- }
- return 1;
- }
- #define INIT_POWER 6
- static XML_Bool FASTCALL
- keyeq(KEY s1, KEY s2) {
- for (; *s1 == *s2; s1++, s2++)
- if (*s1 == 0)
- return XML_TRUE;
- return XML_FALSE;
- }
- static size_t
- keylen(KEY s) {
- size_t len = 0;
- for (; *s; s++, len++)
- ;
- return len;
- }
- static void
- copy_salt_to_sipkey(XML_Parser parser, struct sipkey *key) {
- key->k[0] = 0;
- key->k[1] = get_hash_secret_salt(parser);
- }
- static unsigned long FASTCALL
- hash(XML_Parser parser, KEY s) {
- struct siphash state;
- struct sipkey key;
- (void)sip24_valid;
- copy_salt_to_sipkey(parser, &key);
- sip24_init(&state, &key);
- sip24_update(&state, s, keylen(s) * sizeof(XML_Char));
- return (unsigned long)sip24_final(&state);
- }
- static NAMED *
- lookup(XML_Parser parser, HASH_TABLE *table, KEY name, size_t createSize) {
- size_t i;
- if (table->size == 0) {
- size_t tsize;
- if (! createSize)
- return NULL;
- table->power = INIT_POWER;
- /* table->size is a power of 2 */
- table->size = (size_t)1 << INIT_POWER;
- tsize = table->size * sizeof(NAMED *);
- table->v = table->mem->malloc_fcn(tsize);
- if (! table->v) {
- table->size = 0;
- return NULL;
- }
- memset(table->v, 0, tsize);
- i = hash(parser, name) & ((unsigned long)table->size - 1);
- } else {
- unsigned long h = hash(parser, name);
- unsigned long mask = (unsigned long)table->size - 1;
- unsigned char step = 0;
- i = h & mask;
- while (table->v[i]) {
- if (keyeq(name, table->v[i]->name))
- return table->v[i];
- if (! step)
- step = PROBE_STEP(h, mask, table->power);
- i < step ? (i += table->size - step) : (i -= step);
- }
- if (! createSize)
- return NULL;
- /* check for overflow (table is half full) */
- if (table->used >> (table->power - 1)) {
- unsigned char newPower = table->power + 1;
- /* Detect and prevent invalid shift */
- if (newPower >= sizeof(unsigned long) * 8 /* bits per byte */) {
- return NULL;
- }
- size_t newSize = (size_t)1 << newPower;
- unsigned long newMask = (unsigned long)newSize - 1;
- /* Detect and prevent integer overflow */
- if (newSize > (size_t)(-1) / sizeof(NAMED *)) {
- return NULL;
- }
- size_t tsize = newSize * sizeof(NAMED *);
- NAMED **newV = table->mem->malloc_fcn(tsize);
- if (! newV)
- return NULL;
- memset(newV, 0, tsize);
- for (i = 0; i < table->size; i++)
- if (table->v[i]) {
- unsigned long newHash = hash(parser, table->v[i]->name);
- size_t j = newHash & newMask;
- step = 0;
- while (newV[j]) {
- if (! step)
- step = PROBE_STEP(newHash, newMask, newPower);
- j < step ? (j += newSize - step) : (j -= step);
- }
- newV[j] = table->v[i];
- }
- table->mem->free_fcn(table->v);
- table->v = newV;
- table->power = newPower;
- table->size = newSize;
- i = h & newMask;
- step = 0;
- while (table->v[i]) {
- if (! step)
- step = PROBE_STEP(h, newMask, newPower);
- i < step ? (i += newSize - step) : (i -= step);
- }
- }
- }
- table->v[i] = table->mem->malloc_fcn(createSize);
- if (! table->v[i])
- return NULL;
- memset(table->v[i], 0, createSize);
- table->v[i]->name = name;
- (table->used)++;
- return table->v[i];
- }
- static void FASTCALL
- hashTableClear(HASH_TABLE *table) {
- size_t i;
- for (i = 0; i < table->size; i++) {
- table->mem->free_fcn(table->v[i]);
- table->v[i] = NULL;
- }
- table->used = 0;
- }
- static void FASTCALL
- hashTableDestroy(HASH_TABLE *table) {
- size_t i;
- for (i = 0; i < table->size; i++)
- table->mem->free_fcn(table->v[i]);
- table->mem->free_fcn(table->v);
- }
- static void FASTCALL
- hashTableInit(HASH_TABLE *p, const XML_Memory_Handling_Suite *ms) {
- p->power = 0;
- p->size = 0;
- p->used = 0;
- p->v = NULL;
- p->mem = ms;
- }
- static void FASTCALL
- hashTableIterInit(HASH_TABLE_ITER *iter, const HASH_TABLE *table) {
- iter->p = table->v;
- iter->end = iter->p ? iter->p + table->size : NULL;
- }
- static NAMED *FASTCALL
- hashTableIterNext(HASH_TABLE_ITER *iter) {
- while (iter->p != iter->end) {
- NAMED *tem = *(iter->p)++;
- if (tem)
- return tem;
- }
- return NULL;
- }
- static void FASTCALL
- poolInit(STRING_POOL *pool, const XML_Memory_Handling_Suite *ms) {
- pool->blocks = NULL;
- pool->freeBlocks = NULL;
- pool->start = NULL;
- pool->ptr = NULL;
- pool->end = NULL;
- pool->mem = ms;
- }
- static void FASTCALL
- poolClear(STRING_POOL *pool) {
- if (! pool->freeBlocks)
- pool->freeBlocks = pool->blocks;
- else {
- BLOCK *p = pool->blocks;
- while (p) {
- BLOCK *tem = p->next;
- p->next = pool->freeBlocks;
- pool->freeBlocks = p;
- p = tem;
- }
- }
- pool->blocks = NULL;
- pool->start = NULL;
- pool->ptr = NULL;
- pool->end = NULL;
- }
- static void FASTCALL
- poolDestroy(STRING_POOL *pool) {
- BLOCK *p = pool->blocks;
- while (p) {
- BLOCK *tem = p->next;
- pool->mem->free_fcn(p);
- p = tem;
- }
- p = pool->freeBlocks;
- while (p) {
- BLOCK *tem = p->next;
- pool->mem->free_fcn(p);
- p = tem;
- }
- }
- static XML_Char *
- poolAppend(STRING_POOL *pool, const ENCODING *enc, const char *ptr,
- const char *end) {
- if (! pool->ptr && ! poolGrow(pool))
- return NULL;
- for (;;) {
- const enum XML_Convert_Result convert_res = XmlConvert(
- enc, &ptr, end, (ICHAR **)&(pool->ptr), (const ICHAR *)pool->end);
- if ((convert_res == XML_CONVERT_COMPLETED)
- || (convert_res == XML_CONVERT_INPUT_INCOMPLETE))
- break;
- if (! poolGrow(pool))
- return NULL;
- }
- return pool->start;
- }
- static const XML_Char *FASTCALL
- poolCopyString(STRING_POOL *pool, const XML_Char *s) {
- do {
- if (! poolAppendChar(pool, *s))
- return NULL;
- } while (*s++);
- s = pool->start;
- poolFinish(pool);
- return s;
- }
- static const XML_Char *
- poolCopyStringN(STRING_POOL *pool, const XML_Char *s, int n) {
- if (! pool->ptr && ! poolGrow(pool)) {
- /* The following line is unreachable given the current usage of
- * poolCopyStringN(). Currently it is called from exactly one
- * place to copy the text of a simple general entity. By that
- * point, the name of the entity is already stored in the pool, so
- * pool->ptr cannot be NULL.
- *
- * If poolCopyStringN() is used elsewhere as it well might be,
- * this line may well become executable again. Regardless, this
- * sort of check shouldn't be removed lightly, so we just exclude
- * it from the coverage statistics.
- */
- return NULL; /* LCOV_EXCL_LINE */
- }
- for (; n > 0; --n, s++) {
- if (! poolAppendChar(pool, *s))
- return NULL;
- }
- s = pool->start;
- poolFinish(pool);
- return s;
- }
- static const XML_Char *FASTCALL
- poolAppendString(STRING_POOL *pool, const XML_Char *s) {
- while (*s) {
- if (! poolAppendChar(pool, *s))
- return NULL;
- s++;
- }
- return pool->start;
- }
- static XML_Char *
- poolStoreString(STRING_POOL *pool, const ENCODING *enc, const char *ptr,
- const char *end) {
- if (! poolAppend(pool, enc, ptr, end))
- return NULL;
- if (pool->ptr == pool->end && ! poolGrow(pool))
- return NULL;
- *(pool->ptr)++ = 0;
- return pool->start;
- }
- static size_t
- poolBytesToAllocateFor(int blockSize) {
- /* Unprotected math would be:
- ** return offsetof(BLOCK, s) + blockSize * sizeof(XML_Char);
- **
- ** Detect overflow, avoiding _signed_ overflow undefined behavior
- ** For a + b * c we check b * c in isolation first, so that addition of a
- ** on top has no chance of making us accept a small non-negative number
- */
- const size_t stretch = sizeof(XML_Char); /* can be 4 bytes */
- if (blockSize <= 0)
- return 0;
- if (blockSize > (int)(INT_MAX / stretch))
- return 0;
- {
- const int stretchedBlockSize = blockSize * (int)stretch;
- const int bytesToAllocate
- = (int)(offsetof(BLOCK, s) + (unsigned)stretchedBlockSize);
- if (bytesToAllocate < 0)
- return 0;
- return (size_t)bytesToAllocate;
- }
- }
- static XML_Bool FASTCALL
- poolGrow(STRING_POOL *pool) {
- if (pool->freeBlocks) {
- if (pool->start == 0) {
- pool->blocks = pool->freeBlocks;
- pool->freeBlocks = pool->freeBlocks->next;
- pool->blocks->next = NULL;
- pool->start = pool->blocks->s;
- pool->end = pool->start + pool->blocks->size;
- pool->ptr = pool->start;
- return XML_TRUE;
- }
- if (pool->end - pool->start < pool->freeBlocks->size) {
- BLOCK *tem = pool->freeBlocks->next;
- pool->freeBlocks->next = pool->blocks;
- pool->blocks = pool->freeBlocks;
- pool->freeBlocks = tem;
- memcpy(pool->blocks->s, pool->start,
- (pool->end - pool->start) * sizeof(XML_Char));
- pool->ptr = pool->blocks->s + (pool->ptr - pool->start);
- pool->start = pool->blocks->s;
- pool->end = pool->start + pool->blocks->size;
- return XML_TRUE;
- }
- }
- if (pool->blocks && pool->start == pool->blocks->s) {
- BLOCK *temp;
- int blockSize = (int)((unsigned)(pool->end - pool->start) * 2U);
- size_t bytesToAllocate;
- /* NOTE: Needs to be calculated prior to calling `realloc`
- to avoid dangling pointers: */
- const ptrdiff_t offsetInsideBlock = pool->ptr - pool->start;
- if (blockSize < 0) {
- /* This condition traps a situation where either more than
- * INT_MAX/2 bytes have already been allocated. This isn't
- * readily testable, since it is unlikely that an average
- * machine will have that much memory, so we exclude it from the
- * coverage statistics.
- */
- return XML_FALSE; /* LCOV_EXCL_LINE */
- }
- bytesToAllocate = poolBytesToAllocateFor(blockSize);
- if (bytesToAllocate == 0)
- return XML_FALSE;
- temp = (BLOCK *)pool->mem->realloc_fcn(pool->blocks,
- (unsigned)bytesToAllocate);
- if (temp == NULL)
- return XML_FALSE;
- pool->blocks = temp;
- pool->blocks->size = blockSize;
- pool->ptr = pool->blocks->s + offsetInsideBlock;
- pool->start = pool->blocks->s;
- pool->end = pool->start + blockSize;
- } else {
- BLOCK *tem;
- int blockSize = (int)(pool->end - pool->start);
- size_t bytesToAllocate;
- if (blockSize < 0) {
- /* This condition traps a situation where either more than
- * INT_MAX bytes have already been allocated (which is prevented
- * by various pieces of program logic, not least this one, never
- * mind the unlikelihood of actually having that much memory) or
- * the pool control fields have been corrupted (which could
- * conceivably happen in an extremely buggy user handler
- * function). Either way it isn't readily testable, so we
- * exclude it from the coverage statistics.
- */
- return XML_FALSE; /* LCOV_EXCL_LINE */
- }
- if (blockSize < INIT_BLOCK_SIZE)
- blockSize = INIT_BLOCK_SIZE;
- else {
- /* Detect overflow, avoiding _signed_ overflow undefined behavior */
- if ((int)((unsigned)blockSize * 2U) < 0) {
- return XML_FALSE;
- }
- blockSize *= 2;
- }
- bytesToAllocate = poolBytesToAllocateFor(blockSize);
- if (bytesToAllocate == 0)
- return XML_FALSE;
- tem = pool->mem->malloc_fcn(bytesToAllocate);
- if (! tem)
- return XML_FALSE;
- tem->size = blockSize;
- tem->next = pool->blocks;
- pool->blocks = tem;
- if (pool->ptr != pool->start)
- memcpy(tem->s, pool->start, (pool->ptr - pool->start) * sizeof(XML_Char));
- pool->ptr = tem->s + (pool->ptr - pool->start);
- pool->start = tem->s;
- pool->end = tem->s + blockSize;
- }
- return XML_TRUE;
- }
- static int FASTCALL
- nextScaffoldPart(XML_Parser parser) {
- DTD *const dtd = parser->m_dtd; /* save one level of indirection */
- CONTENT_SCAFFOLD *me;
- int next;
- if (! dtd->scaffIndex) {
- /* Detect and prevent integer overflow.
- * The preprocessor guard addresses the "always false" warning
- * from -Wtype-limits on platforms where
- * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
- #if UINT_MAX >= SIZE_MAX
- if (parser->m_groupSize > ((size_t)(-1) / sizeof(int))) {
- return -1;
- }
- #endif
- dtd->scaffIndex = (int *)MALLOC(parser, parser->m_groupSize * sizeof(int));
- if (! dtd->scaffIndex)
- return -1;
- dtd->scaffIndex[0] = 0;
- }
- if (dtd->scaffCount >= dtd->scaffSize) {
- CONTENT_SCAFFOLD *temp;
- if (dtd->scaffold) {
- /* Detect and prevent integer overflow */
- if (dtd->scaffSize > UINT_MAX / 2u) {
- return -1;
- }
- /* Detect and prevent integer overflow.
- * The preprocessor guard addresses the "always false" warning
- * from -Wtype-limits on platforms where
- * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
- #if UINT_MAX >= SIZE_MAX
- if (dtd->scaffSize > (size_t)(-1) / 2u / sizeof(CONTENT_SCAFFOLD)) {
- return -1;
- }
- #endif
- temp = (CONTENT_SCAFFOLD *)REALLOC(
- parser, dtd->scaffold, dtd->scaffSize * 2 * sizeof(CONTENT_SCAFFOLD));
- if (temp == NULL)
- return -1;
- dtd->scaffSize *= 2;
- } else {
- temp = (CONTENT_SCAFFOLD *)MALLOC(parser, INIT_SCAFFOLD_ELEMENTS
- * sizeof(CONTENT_SCAFFOLD));
- if (temp == NULL)
- return -1;
- dtd->scaffSize = INIT_SCAFFOLD_ELEMENTS;
- }
- dtd->scaffold = temp;
- }
- next = dtd->scaffCount++;
- me = &dtd->scaffold[next];
- if (dtd->scaffLevel) {
- CONTENT_SCAFFOLD *parent
- = &dtd->scaffold[dtd->scaffIndex[dtd->scaffLevel - 1]];
- if (parent->lastchild) {
- dtd->scaffold[parent->lastchild].nextsib = next;
- }
- if (! parent->childcnt)
- parent->firstchild = next;
- parent->lastchild = next;
- parent->childcnt++;
- }
- me->firstchild = me->lastchild = me->childcnt = me->nextsib = 0;
- return next;
- }
- static XML_Content *
- build_model(XML_Parser parser) {
- /* Function build_model transforms the existing parser->m_dtd->scaffold
- * array of CONTENT_SCAFFOLD tree nodes into a new array of
- * XML_Content tree nodes followed by a gapless list of zero-terminated
- * strings. */
- DTD *const dtd = parser->m_dtd; /* save one level of indirection */
- XML_Content *ret;
- XML_Char *str; /* the current string writing location */
- /* Detect and prevent integer overflow.
- * The preprocessor guard addresses the "always false" warning
- * from -Wtype-limits on platforms where
- * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
- #if UINT_MAX >= SIZE_MAX
- if (dtd->scaffCount > (size_t)(-1) / sizeof(XML_Content)) {
- return NULL;
- }
- if (dtd->contentStringLen > (size_t)(-1) / sizeof(XML_Char)) {
- return NULL;
- }
- #endif
- if (dtd->scaffCount * sizeof(XML_Content)
- > (size_t)(-1) - dtd->contentStringLen * sizeof(XML_Char)) {
- return NULL;
- }
- const size_t allocsize = (dtd->scaffCount * sizeof(XML_Content)
- + (dtd->contentStringLen * sizeof(XML_Char)));
- ret = (XML_Content *)MALLOC(parser, allocsize);
- if (! ret)
- return NULL;
- /* What follows is an iterative implementation (of what was previously done
- * recursively in a dedicated function called "build_node". The old recursive
- * build_node could be forced into stack exhaustion from input as small as a
- * few megabyte, and so that was a security issue. Hence, a function call
- * stack is avoided now by resolving recursion.)
- *
- * The iterative approach works as follows:
- *
- * - We have two writing pointers, both walking up the result array; one does
- * the work, the other creates "jobs" for its colleague to do, and leads
- * the way:
- *
- * - The faster one, pointer jobDest, always leads and writes "what job
- * to do" by the other, once they reach that place in the
- * array: leader "jobDest" stores the source node array index (relative
- * to array dtd->scaffold) in field "numchildren".
- *
- * - The slower one, pointer dest, looks at the value stored in the
- * "numchildren" field (which actually holds a source node array index
- * at that time) and puts the real data from dtd->scaffold in.
- *
- * - Before the loop starts, jobDest writes source array index 0
- * (where the root node is located) so that dest will have something to do
- * when it starts operation.
- *
- * - Whenever nodes with children are encountered, jobDest appends
- * them as new jobs, in order. As a result, tree node siblings are
- * adjacent in the resulting array, for example:
- *
- * [0] root, has two children
- * [1] first child of 0, has three children
- * [3] first child of 1, does not have children
- * [4] second child of 1, does not have children
- * [5] third child of 1, does not have children
- * [2] second child of 0, does not have children
- *
- * Or (the same data) presented in flat array view:
- *
- * [0] root, has two children
- *
- * [1] first child of 0, has three children
- * [2] second child of 0, does not have children
- *
- * [3] first child of 1, does not have children
- * [4] second child of 1, does not have children
- * [5] third child of 1, does not have children
- *
- * - The algorithm repeats until all target array indices have been processed.
- */
- XML_Content *dest = ret; /* tree node writing location, moves upwards */
- XML_Content *const destLimit = &ret[dtd->scaffCount];
- XML_Content *jobDest = ret; /* next free writing location in target array */
- str = (XML_Char *)&ret[dtd->scaffCount];
- /* Add the starting job, the root node (index 0) of the source tree */
- (jobDest++)->numchildren = 0;
- for (; dest < destLimit; dest++) {
- /* Retrieve source tree array index from job storage */
- const int src_node = (int)dest->numchildren;
- /* Convert item */
- dest->type = dtd->scaffold[src_node].type;
- dest->quant = dtd->scaffold[src_node].quant;
- if (dest->type == XML_CTYPE_NAME) {
- const XML_Char *src;
- dest->name = str;
- src = dtd->scaffold[src_node].name;
- for (;;) {
- *str++ = *src;
- if (! *src)
- break;
- src++;
- }
- dest->numchildren = 0;
- dest->children = NULL;
- } else {
- unsigned int i;
- int cn;
- dest->name = NULL;
- dest->numchildren = dtd->scaffold[src_node].childcnt;
- dest->children = jobDest;
- /* Append scaffold indices of children to array */
- for (i = 0, cn = dtd->scaffold[src_node].firstchild;
- i < dest->numchildren; i++, cn = dtd->scaffold[cn].nextsib)
- (jobDest++)->numchildren = (unsigned int)cn;
- }
- }
- return ret;
- }
- static ELEMENT_TYPE *
- getElementType(XML_Parser parser, const ENCODING *enc, const char *ptr,
- const char *end) {
- DTD *const dtd = parser->m_dtd; /* save one level of indirection */
- const XML_Char *name = poolStoreString(&dtd->pool, enc, ptr, end);
- ELEMENT_TYPE *ret;
- if (! name)
- return NULL;
- ret = (ELEMENT_TYPE *)lookup(parser, &dtd->elementTypes, name,
- sizeof(ELEMENT_TYPE));
- if (! ret)
- return NULL;
- if (ret->name != name)
- poolDiscard(&dtd->pool);
- else {
- poolFinish(&dtd->pool);
- if (! setElementTypePrefix(parser, ret))
- return NULL;
- }
- return ret;
- }
- static XML_Char *
- copyString(const XML_Char *s, const XML_Memory_Handling_Suite *memsuite) {
- size_t charsRequired = 0;
- XML_Char *result;
- /* First determine how long the string is */
- while (s[charsRequired] != 0) {
- charsRequired++;
- }
- /* Include the terminator */
- charsRequired++;
- /* Now allocate space for the copy */
- result = memsuite->malloc_fcn(charsRequired * sizeof(XML_Char));
- if (result == NULL)
- return NULL;
- /* Copy the original into place */
- memcpy(result, s, charsRequired * sizeof(XML_Char));
- return result;
- }
- #if XML_GE == 1
- static float
- accountingGetCurrentAmplification(XML_Parser rootParser) {
- // 1.........1.........12 => 22
- const size_t lenOfShortestInclude = sizeof("<!ENTITY a SYSTEM 'b'>") - 1;
- const XmlBigCount countBytesOutput
- = rootParser->m_accounting.countBytesDirect
- + rootParser->m_accounting.countBytesIndirect;
- const float amplificationFactor
- = rootParser->m_accounting.countBytesDirect
- ? (countBytesOutput
- / (float)(rootParser->m_accounting.countBytesDirect))
- : ((lenOfShortestInclude
- + rootParser->m_accounting.countBytesIndirect)
- / (float)lenOfShortestInclude);
- assert(! rootParser->m_parentParser);
- return amplificationFactor;
- }
- static void
- accountingReportStats(XML_Parser originParser, const char *epilog) {
- const XML_Parser rootParser = getRootParserOf(originParser, NULL);
- assert(! rootParser->m_parentParser);
- if (rootParser->m_accounting.debugLevel == 0u) {
- return;
- }
- const float amplificationFactor
- = accountingGetCurrentAmplification(rootParser);
- fprintf(stderr,
- "expat: Accounting(%p): Direct " EXPAT_FMT_ULL(
- "10") ", indirect " EXPAT_FMT_ULL("10") ", amplification %8.2f%s",
- (void *)rootParser, rootParser->m_accounting.countBytesDirect,
- rootParser->m_accounting.countBytesIndirect,
- (double)amplificationFactor, epilog);
- }
- static void
- accountingOnAbort(XML_Parser originParser) {
- accountingReportStats(originParser, " ABORTING\n");
- }
- static void
- accountingReportDiff(XML_Parser rootParser,
- unsigned int levelsAwayFromRootParser, const char *before,
- const char *after, ptrdiff_t bytesMore, int source_line,
- enum XML_Account account) {
- assert(! rootParser->m_parentParser);
- fprintf(stderr,
- " (+" EXPAT_FMT_PTRDIFF_T("6") " bytes %s|%u, xmlparse.c:%d) %*s\"",
- bytesMore, (account == XML_ACCOUNT_DIRECT) ? "DIR" : "EXP",
- levelsAwayFromRootParser, source_line, 10, "");
- const char ellipis[] = "[..]";
- const size_t ellipsisLength = sizeof(ellipis) /* because compile-time */ - 1;
- const unsigned int contextLength = 10;
- /* Note: Performance is of no concern here */
- const char *walker = before;
- if ((rootParser->m_accounting.debugLevel >= 3u)
- || (after - before)
- <= (ptrdiff_t)(contextLength + ellipsisLength + contextLength)) {
- for (; walker < after; walker++) {
- fprintf(stderr, "%s", unsignedCharToPrintable(walker[0]));
- }
- } else {
- for (; walker < before + contextLength; walker++) {
- fprintf(stderr, "%s", unsignedCharToPrintable(walker[0]));
- }
- fprintf(stderr, ellipis);
- walker = after - contextLength;
- for (; walker < after; walker++) {
- fprintf(stderr, "%s", unsignedCharToPrintable(walker[0]));
- }
- }
- fprintf(stderr, "\"\n");
- }
- static XML_Bool
- accountingDiffTolerated(XML_Parser originParser, int tok, const char *before,
- const char *after, int source_line,
- enum XML_Account account) {
- /* Note: We need to check the token type *first* to be sure that
- * we can even access variable <after>, safely.
- * E.g. for XML_TOK_NONE <after> may hold an invalid pointer. */
- switch (tok) {
- case XML_TOK_INVALID:
- case XML_TOK_PARTIAL:
- case XML_TOK_PARTIAL_CHAR:
- case XML_TOK_NONE:
- return XML_TRUE;
- }
- if (account == XML_ACCOUNT_NONE)
- return XML_TRUE; /* because these bytes have been accounted for, already */
- unsigned int levelsAwayFromRootParser;
- const XML_Parser rootParser
- = getRootParserOf(originParser, &levelsAwayFromRootParser);
- assert(! rootParser->m_parentParser);
- const int isDirect
- = (account == XML_ACCOUNT_DIRECT) && (originParser == rootParser);
- const ptrdiff_t bytesMore = after - before;
- XmlBigCount *const additionTarget
- = isDirect ? &rootParser->m_accounting.countBytesDirect
- : &rootParser->m_accounting.countBytesIndirect;
- /* Detect and avoid integer overflow */
- if (*additionTarget > (XmlBigCount)(-1) - (XmlBigCount)bytesMore)
- return XML_FALSE;
- *additionTarget += bytesMore;
- const XmlBigCount countBytesOutput
- = rootParser->m_accounting.countBytesDirect
- + rootParser->m_accounting.countBytesIndirect;
- const float amplificationFactor
- = accountingGetCurrentAmplification(rootParser);
- const XML_Bool tolerated
- = (countBytesOutput < rootParser->m_accounting.activationThresholdBytes)
- || (amplificationFactor
- <= rootParser->m_accounting.maximumAmplificationFactor);
- if (rootParser->m_accounting.debugLevel >= 2u) {
- accountingReportStats(rootParser, "");
- accountingReportDiff(rootParser, levelsAwayFromRootParser, before, after,
- bytesMore, source_line, account);
- }
- return tolerated;
- }
- unsigned long long
- testingAccountingGetCountBytesDirect(XML_Parser parser) {
- if (! parser)
- return 0;
- return parser->m_accounting.countBytesDirect;
- }
- unsigned long long
- testingAccountingGetCountBytesIndirect(XML_Parser parser) {
- if (! parser)
- return 0;
- return parser->m_accounting.countBytesIndirect;
- }
- static void
- entityTrackingReportStats(XML_Parser rootParser, ENTITY *entity,
- const char *action, int sourceLine) {
- assert(! rootParser->m_parentParser);
- if (rootParser->m_entity_stats.debugLevel == 0u)
- return;
- # if defined(XML_UNICODE)
- const char *const entityName = "[..]";
- # else
- const char *const entityName = entity->name;
- # endif
- fprintf(
- stderr,
- "expat: Entities(%p): Count %9u, depth %2u/%2u %*s%s%s; %s length %d (xmlparse.c:%d)\n",
- (void *)rootParser, rootParser->m_entity_stats.countEverOpened,
- rootParser->m_entity_stats.currentDepth,
- rootParser->m_entity_stats.maximumDepthSeen,
- (rootParser->m_entity_stats.currentDepth - 1) * 2, "",
- entity->is_param ? "%" : "&", entityName, action, entity->textLen,
- sourceLine);
- }
- static void
- entityTrackingOnOpen(XML_Parser originParser, ENTITY *entity, int sourceLine) {
- const XML_Parser rootParser = getRootParserOf(originParser, NULL);
- assert(! rootParser->m_parentParser);
- rootParser->m_entity_stats.countEverOpened++;
- rootParser->m_entity_stats.currentDepth++;
- if (rootParser->m_entity_stats.currentDepth
- > rootParser->m_entity_stats.maximumDepthSeen) {
- rootParser->m_entity_stats.maximumDepthSeen++;
- }
- entityTrackingReportStats(rootParser, entity, "OPEN ", sourceLine);
- }
- static void
- entityTrackingOnClose(XML_Parser originParser, ENTITY *entity, int sourceLine) {
- const XML_Parser rootParser = getRootParserOf(originParser, NULL);
- assert(! rootParser->m_parentParser);
- entityTrackingReportStats(rootParser, entity, "CLOSE", sourceLine);
- rootParser->m_entity_stats.currentDepth--;
- }
- static XML_Parser
- getRootParserOf(XML_Parser parser, unsigned int *outLevelDiff) {
- XML_Parser rootParser = parser;
- unsigned int stepsTakenUpwards = 0;
- while (rootParser->m_parentParser) {
- rootParser = rootParser->m_parentParser;
- stepsTakenUpwards++;
- }
- assert(! rootParser->m_parentParser);
- if (outLevelDiff != NULL) {
- *outLevelDiff = stepsTakenUpwards;
- }
- return rootParser;
- }
- const char *
- unsignedCharToPrintable(unsigned char c) {
- switch (c) {
- case 0:
- return "\\0";
- case 1:
- return "\\x1";
- case 2:
- return "\\x2";
- case 3:
- return "\\x3";
- case 4:
- return "\\x4";
- case 5:
- return "\\x5";
- case 6:
- return "\\x6";
- case 7:
- return "\\x7";
- case 8:
- return "\\x8";
- case 9:
- return "\\t";
- case 10:
- return "\\n";
- case 11:
- return "\\xB";
- case 12:
- return "\\xC";
- case 13:
- return "\\r";
- case 14:
- return "\\xE";
- case 15:
- return "\\xF";
- case 16:
- return "\\x10";
- case 17:
- return "\\x11";
- case 18:
- return "\\x12";
- case 19:
- return "\\x13";
- case 20:
- return "\\x14";
- case 21:
- return "\\x15";
- case 22:
- return "\\x16";
- case 23:
- return "\\x17";
- case 24:
- return "\\x18";
- case 25:
- return "\\x19";
- case 26:
- return "\\x1A";
- case 27:
- return "\\x1B";
- case 28:
- return "\\x1C";
- case 29:
- return "\\x1D";
- case 30:
- return "\\x1E";
- case 31:
- return "\\x1F";
- case 32:
- return " ";
- case 33:
- return "!";
- case 34:
- return "\\\"";
- case 35:
- return "#";
- case 36:
- return "$";
- case 37:
- return "%";
- case 38:
- return "&";
- case 39:
- return "'";
- case 40:
- return "(";
- case 41:
- return ")";
- case 42:
- return "*";
- case 43:
- return "+";
- case 44:
- return ",";
- case 45:
- return "-";
- case 46:
- return ".";
- case 47:
- return "/";
- case 48:
- return "0";
- case 49:
- return "1";
- case 50:
- return "2";
- case 51:
- return "3";
- case 52:
- return "4";
- case 53:
- return "5";
- case 54:
- return "6";
- case 55:
- return "7";
- case 56:
- return "8";
- case 57:
- return "9";
- case 58:
- return ":";
- case 59:
- return ";";
- case 60:
- return "<";
- case 61:
- return "=";
- case 62:
- return ">";
- case 63:
- return "?";
- case 64:
- return "@";
- case 65:
- return "A";
- case 66:
- return "B";
- case 67:
- return "C";
- case 68:
- return "D";
- case 69:
- return "E";
- case 70:
- return "F";
- case 71:
- return "G";
- case 72:
- return "H";
- case 73:
- return "I";
- case 74:
- return "J";
- case 75:
- return "K";
- case 76:
- return "L";
- case 77:
- return "M";
- case 78:
- return "N";
- case 79:
- return "O";
- case 80:
- return "P";
- case 81:
- return "Q";
- case 82:
- return "R";
- case 83:
- return "S";
- case 84:
- return "T";
- case 85:
- return "U";
- case 86:
- return "V";
- case 87:
- return "W";
- case 88:
- return "X";
- case 89:
- return "Y";
- case 90:
- return "Z";
- case 91:
- return "[";
- case 92:
- return "\\\\";
- case 93:
- return "]";
- case 94:
- return "^";
- case 95:
- return "_";
- case 96:
- return "`";
- case 97:
- return "a";
- case 98:
- return "b";
- case 99:
- return "c";
- case 100:
- return "d";
- case 101:
- return "e";
- case 102:
- return "f";
- case 103:
- return "g";
- case 104:
- return "h";
- case 105:
- return "i";
- case 106:
- return "j";
- case 107:
- return "k";
- case 108:
- return "l";
- case 109:
- return "m";
- case 110:
- return "n";
- case 111:
- return "o";
- case 112:
- return "p";
- case 113:
- return "q";
- case 114:
- return "r";
- case 115:
- return "s";
- case 116:
- return "t";
- case 117:
- return "u";
- case 118:
- return "v";
- case 119:
- return "w";
- case 120:
- return "x";
- case 121:
- return "y";
- case 122:
- return "z";
- case 123:
- return "{";
- case 124:
- return "|";
- case 125:
- return "}";
- case 126:
- return "~";
- case 127:
- return "\\x7F";
- case 128:
- return "\\x80";
- case 129:
- return "\\x81";
- case 130:
- return "\\x82";
- case 131:
- return "\\x83";
- case 132:
- return "\\x84";
- case 133:
- return "\\x85";
- case 134:
- return "\\x86";
- case 135:
- return "\\x87";
- case 136:
- return "\\x88";
- case 137:
- return "\\x89";
- case 138:
- return "\\x8A";
- case 139:
- return "\\x8B";
- case 140:
- return "\\x8C";
- case 141:
- return "\\x8D";
- case 142:
- return "\\x8E";
- case 143:
- return "\\x8F";
- case 144:
- return "\\x90";
- case 145:
- return "\\x91";
- case 146:
- return "\\x92";
- case 147:
- return "\\x93";
- case 148:
- return "\\x94";
- case 149:
- return "\\x95";
- case 150:
- return "\\x96";
- case 151:
- return "\\x97";
- case 152:
- return "\\x98";
- case 153:
- return "\\x99";
- case 154:
- return "\\x9A";
- case 155:
- return "\\x9B";
- case 156:
- return "\\x9C";
- case 157:
- return "\\x9D";
- case 158:
- return "\\x9E";
- case 159:
- return "\\x9F";
- case 160:
- return "\\xA0";
- case 161:
- return "\\xA1";
- case 162:
- return "\\xA2";
- case 163:
- return "\\xA3";
- case 164:
- return "\\xA4";
- case 165:
- return "\\xA5";
- case 166:
- return "\\xA6";
- case 167:
- return "\\xA7";
- case 168:
- return "\\xA8";
- case 169:
- return "\\xA9";
- case 170:
- return "\\xAA";
- case 171:
- return "\\xAB";
- case 172:
- return "\\xAC";
- case 173:
- return "\\xAD";
- case 174:
- return "\\xAE";
- case 175:
- return "\\xAF";
- case 176:
- return "\\xB0";
- case 177:
- return "\\xB1";
- case 178:
- return "\\xB2";
- case 179:
- return "\\xB3";
- case 180:
- return "\\xB4";
- case 181:
- return "\\xB5";
- case 182:
- return "\\xB6";
- case 183:
- return "\\xB7";
- case 184:
- return "\\xB8";
- case 185:
- return "\\xB9";
- case 186:
- return "\\xBA";
- case 187:
- return "\\xBB";
- case 188:
- return "\\xBC";
- case 189:
- return "\\xBD";
- case 190:
- return "\\xBE";
- case 191:
- return "\\xBF";
- case 192:
- return "\\xC0";
- case 193:
- return "\\xC1";
- case 194:
- return "\\xC2";
- case 195:
- return "\\xC3";
- case 196:
- return "\\xC4";
- case 197:
- return "\\xC5";
- case 198:
- return "\\xC6";
- case 199:
- return "\\xC7";
- case 200:
- return "\\xC8";
- case 201:
- return "\\xC9";
- case 202:
- return "\\xCA";
- case 203:
- return "\\xCB";
- case 204:
- return "\\xCC";
- case 205:
- return "\\xCD";
- case 206:
- return "\\xCE";
- case 207:
- return "\\xCF";
- case 208:
- return "\\xD0";
- case 209:
- return "\\xD1";
- case 210:
- return "\\xD2";
- case 211:
- return "\\xD3";
- case 212:
- return "\\xD4";
- case 213:
- return "\\xD5";
- case 214:
- return "\\xD6";
- case 215:
- return "\\xD7";
- case 216:
- return "\\xD8";
- case 217:
- return "\\xD9";
- case 218:
- return "\\xDA";
- case 219:
- return "\\xDB";
- case 220:
- return "\\xDC";
- case 221:
- return "\\xDD";
- case 222:
- return "\\xDE";
- case 223:
- return "\\xDF";
- case 224:
- return "\\xE0";
- case 225:
- return "\\xE1";
- case 226:
- return "\\xE2";
- case 227:
- return "\\xE3";
- case 228:
- return "\\xE4";
- case 229:
- return "\\xE5";
- case 230:
- return "\\xE6";
- case 231:
- return "\\xE7";
- case 232:
- return "\\xE8";
- case 233:
- return "\\xE9";
- case 234:
- return "\\xEA";
- case 235:
- return "\\xEB";
- case 236:
- return "\\xEC";
- case 237:
- return "\\xED";
- case 238:
- return "\\xEE";
- case 239:
- return "\\xEF";
- case 240:
- return "\\xF0";
- case 241:
- return "\\xF1";
- case 242:
- return "\\xF2";
- case 243:
- return "\\xF3";
- case 244:
- return "\\xF4";
- case 245:
- return "\\xF5";
- case 246:
- return "\\xF6";
- case 247:
- return "\\xF7";
- case 248:
- return "\\xF8";
- case 249:
- return "\\xF9";
- case 250:
- return "\\xFA";
- case 251:
- return "\\xFB";
- case 252:
- return "\\xFC";
- case 253:
- return "\\xFD";
- case 254:
- return "\\xFE";
- case 255:
- return "\\xFF";
- default:
- assert(0); /* never gets here */
- return "dead code";
- }
- assert(0); /* never gets here */
- }
- #endif /* XML_GE == 1 */
/* Reads a debug level from the environment variable named variableName.

   The value must consist solely of decimal digits and fit into an
   unsigned long.  If the variable is unset, or its value is empty, has a
   leading sign or whitespace, has trailing characters, or is out of
   range, defaultDebugLevel is returned instead.

   The caller's errno is left unchanged.
*/
static unsigned long
getDebugLevel(const char *variableName, unsigned long defaultDebugLevel) {
  const char *const value = getenv(variableName);
  if (value == NULL) {
    return defaultDebugLevel;
  }

  /* strtoul skips leading whitespace and accepts a sign; a value such as
     "-1" would be negated in unsigned arithmetic and come back as
     ULONG_MAX without any error being reported.  Insisting on a leading
     digit rules that out (and rejects the empty string as well). */
  if ((value[0] < '0') || (value[0] > '9')) {
    return defaultDebugLevel;
  }

  /* errno is the only way to detect overflow in strtoul, so it has to be
     cleared before the call; keep the caller's value and put it back. */
  const int savedErrno = errno;
  errno = 0;
  char *afterValue = NULL;
  const unsigned long debugLevel = strtoul(value, &afterValue, 10);
  const int rejected
      = (errno != 0) || (afterValue == value) || (afterValue[0] != '\0');
  errno = savedErrno;

  return rejected ? defaultDebugLevel : debugLevel;
}
|