runtests.c 466 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772177317741775177617771778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227722782279228022812282228322842285228622872288228922902291229222932294229522962297229822992300230123022303230423052306230723082309231023112312231323142315231623172318231923202321232223232324232523262327232823292330233123322333233423352336233723382339234023412342234323442345234623472348234923502351235223532354235523562357235823592360236123622363236423652366236723682369237023712372237323742375237623772378237923802381238223832384238523862387238823892390239123922393239423952396239723982399240024012402240324042405240624072408240924102411241224132414241524162417241824192420242124222423242424252426242724282429243024312432243324342435243624372438243924402441244224432444244524462447244824492450245124522453245424552456245724582459246024612462246324642465246624672468246924702471247224732474247524762477247824792480248124822483248424852486248724882489249024912492249324942495249624972498249925002501250225032504250525062507250825092510251125122513251425152516251725182519252025212522252325242525252625272528252925302531253225332534253525362537253825392540254125422543254425452546254725482549255025512552255325542555255625572558255925602561256225632564256525662567256825692570257125722573257425752576257725782579258025812582258325842585258625872588258925902591259225932594259525962597259825992600260126022603260426052606260726082609261026112612261326142615261626172618261926202621262226232624262526262627262826292630263126322633263426352636263726382639264026412642264326442645264626472648264926502651265226532654265526562657265826592660266126622663266426652666266726682669267026712672267326742675267626772678267926802681268226832684268526862687268826892690269126922693269426952696269726982699270027012702270327042705270627072708270927102711271227132714271527162717271827192720272127222723272427252726272727282729273027312732273327342735273627372738273927402741274227432744274527462747274827492750275127522753275427552756275727582759276027612762276327642765276627672768276927702771277227732774277527762777277827792780278127822783278427852786278727882789279027912792279327942795279627972798279928002801280228032804280528062807280828092810281128122813281428152816281728182819282028212822282328242825282628272828282928302831283228332834283528362837283828392840284128422843284428452846284728482849285028512852285328542855285628572858285928602861286228632864286528662867286828692870287128722873287428752876287728782879288028812882288328842885288628872888288928902891289228932894289528962897289828992900290129022903290429052906290729082909291029112912291329142915291629172918291929202921292229232924292529262927292829292930293129322933293429352936293729382939294029412942294329442945294629472948294929502951295229532954295529562957295829592960296129622963296429652966296729682969297029712972297329742975297629772978297929802981298229832984298529862987298829892990299129922993299429952996299729982999300030013002300330043005300630073008300930103011301230133014301530163017301830193020302130223023302430253026302730283029303030313032303330343035303630373038303930403041304230433044304530463047304830493050305130523053305430553056305730583059306030613062306330643065306630673068306930703071307230733074307530763077307830793080308130823083308430853086308730883089309030913092309330943095309630973098309931003101310231033104310531063107310831093110311131123113311431153116311731183119312031213122312331243125312631273128312931303131313231333134313531363137313831393140314131423143314431453146314731483149315031513152315331543155315631573158315931603161316231633164316531663167316831693170317131723173317431753176317731783179318031813182318331843185318631873188318931903191319231933194319531963197319831993200320132023203320432053206320732083209321032113212321332143215321632173218321932203221322232233224322532263227322832293230323132323233323432353236323732383239324032413242324332443245324632473248324932503251325232533254325532563257325832593260326132623263326432653266326732683269327032713272327332743275327632773278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377737783779378037813782378337843785378637873788378937903791379237933794379537963797379837993800380138023803380438053806380738083809381038113812381338143815381638173818381938203821382238233824382538263827382838293830383138323833383438353836383738383839384038413842384338443845384638473848384938503851385238533854385538563857385838593860386138623863386438653866386738683869387038713872387338743875387638773878387938803881388238833884388538863887388838893890389138923893389438953896389738983899390039013902390339043905390639073908390939103911391239133914391539163917391839193920392139223923392439253926392739283929393039313932393339343935393639373938393939403941394239433944394539463947394839493950395139523953395439553956395739583959396039613962396339643965396639673968396939703971397239733974397539763977397839793980398139823983398439853986398739883989399039913992399339943995399639973998399940004001400240034004400540064007400840094010401140124013401440154016401740184019402040214022402340244025402640274028402940304031403240334034403540364037403840394040404140424043404440454046404740484049405040514052405340544055405640574058405940604061406240634064406540664067406840694070407140724073407440754076407740784079408040814082408340844085408640874088408940904091409240934094409540964097409840994100410141024103410441054106410741084109411041114112411341144115411641174118411941204121412241234124412541264127412841294130413141324133413441354136413741384139414041414142414341444145414641474148414941504151415241534154415541564157415841594160416141624163416441654166416741684169417041714172417341744175417641774178417941804181418241834184418541864187418841894190419141924193419441954196419741984199420042014202420342044205420642074208420942104211421242134214421542164217421842194220422142224223422442254226422742284229423042314232423342344235423642374238423942404241424242434244424542464247424842494250425142524253425442554256425742584259426042614262426342644265426642674268426942704271427242734274427542764277427842794280428142824283428442854286428742884289429042914292429342944295429642974298429943004301430243034304430543064307430843094310431143124313431443154316431743184319432043214322432343244325432643274328432943304331433243334334433543364337433843394340434143424343434443454346434743484349435043514352435343544355435643574358435943604361436243634364436543664367436843694370437143724373437443754376437743784379438043814382438343844385438643874388438943904391439243934394439543964397439843994400440144024403440444054406440744084409441044114412441344144415441644174418441944204421442244234424442544264427442844294430443144324433443444354436443744384439444044414442444344444445444644474448444944504451445244534454445544564457445844594460446144624463446444654466446744684469447044714472447344744475447644774478447944804481448244834484448544864487448844894490449144924493449444954496449744984499450045014502450345044505450645074508450945104511451245134514451545164517451845194520452145224523452445254526452745284529453045314532453345344535453645374538453945404541454245434544454545464547454845494550455145524553455445554556455745584559456045614562456345644565456645674568456945704571457245734574457545764577457845794580458145824583458445854586458745884589459045914592459345944595459645974598459946004601460246034604460546064607460846094610461146124613461446154616461746184619462046214622462346244625462646274628462946304631463246334634463546364637463846394640464146424643464446454646464746484649465046514652465346544655465646574658465946604661466246634664466546664667466846694670467146724673467446754676467746784679468046814682468346844685468646874688468946904691469246934694469546964697469846994700470147024703470447054706470747084709471047114712471347144715471647174718471947204721472247234724472547264727472847294730473147324733473447354736473747384739474047414742474347444745474647474748474947504751475247534754475547564757475847594760476147624763476447654766476747684769477047714772477347744775477647774778477947804781478247834784478547864787478847894790479147924793479447954796479747984799480048014802480348044805480648074808480948104811481248134814481548164817481848194820482148224823482448254826482748284829483048314832483348344835483648374838483948404841484248434844484548464847484848494850485148524853485448554856485748584859486048614862486348644865486648674868486948704871487248734874487548764877487848794880488148824883488448854886488748884889489048914892489348944895489648974898489949004901490249034904490549064907490849094910491149124913491449154916491749184919492049214922492349244925492649274928492949304931493249334934493549364937493849394940494149424943494449454946494749484949495049514952495349544955495649574958495949604961496249634964496549664967496849694970497149724973497449754976497749784979498049814982498349844985498649874988498949904991499249934994499549964997499849995000500150025003500450055006500750085009501050115012501350145015501650175018501950205021502250235024502550265027502850295030503150325033503450355036503750385039504050415042504350445045504650475048504950505051505250535054505550565057505850595060506150625063506450655066506750685069507050715072507350745075507650775078507950805081508250835084508550865087508850895090509150925093509450955096509750985099510051015102510351045105510651075108510951105111511251135114511551165117511851195120512151225123512451255126512751285129513051315132513351345135513651375138513951405141514251435144514551465147514851495150515151525153515451555156515751585159516051615162516351645165516651675168516951705171517251735174517551765177517851795180518151825183518451855186518751885189519051915192519351945195519651975198519952005201520252035204520552065207520852095210521152125213521452155216521752185219522052215222522352245225522652275228522952305231523252335234523552365237523852395240524152425243524452455246524752485249525052515252525352545255525652575258525952605261526252635264526552665267526852695270527152725273527452755276527752785279528052815282528352845285528652875288528952905291529252935294529552965297529852995300530153025303530453055306530753085309531053115312531353145315531653175318531953205321532253235324532553265327532853295330533153325333533453355336533753385339534053415342534353445345534653475348534953505351535253535354535553565357535853595360536153625363536453655366536753685369537053715372537353745375537653775378537953805381538253835384538553865387538853895390539153925393539453955396539753985399540054015402540354045405540654075408540954105411541254135414541554165417541854195420542154225423542454255426542754285429543054315432543354345435543654375438543954405441544254435444544554465447544854495450545154525453545454555456545754585459546054615462546354645465546654675468546954705471547254735474547554765477547854795480548154825483548454855486548754885489549054915492549354945495549654975498549955005501550255035504550555065507550855095510551155125513551455155516551755185519552055215522552355245525552655275528552955305531553255335534553555365537553855395540554155425543554455455546554755485549555055515552555355545555555655575558555955605561556255635564556555665567556855695570557155725573557455755576557755785579558055815582558355845585558655875588558955905591559255935594559555965597559855995600560156025603560456055606560756085609561056115612561356145615561656175618561956205621562256235624562556265627562856295630563156325633563456355636563756385639564056415642564356445645564656475648564956505651565256535654565556565657565856595660566156625663566456655666566756685669567056715672567356745675567656775678567956805681568256835684568556865687568856895690569156925693569456955696569756985699570057015702570357045705570657075708570957105711571257135714571557165717571857195720572157225723572457255726572757285729573057315732573357345735573657375738573957405741574257435744574557465747574857495750575157525753575457555756575757585759576057615762576357645765576657675768576957705771577257735774577557765777577857795780578157825783578457855786578757885789579057915792579357945795579657975798579958005801580258035804580558065807580858095810581158125813581458155816581758185819582058215822582358245825582658275828582958305831583258335834583558365837583858395840584158425843584458455846584758485849585058515852585358545855585658575858585958605861586258635864586558665867586858695870587158725873587458755876587758785879588058815882588358845885588658875888588958905891589258935894589558965897589858995900590159025903590459055906590759085909591059115912591359145915591659175918591959205921592259235924592559265927592859295930593159325933593459355936593759385939594059415942594359445945594659475948594959505951595259535954595559565957595859595960596159625963596459655966596759685969597059715972597359745975597659775978597959805981598259835984598559865987598859895990599159925993599459955996599759985999600060016002600360046005600660076008600960106011601260136014601560166017601860196020602160226023602460256026602760286029603060316032603360346035603660376038603960406041604260436044604560466047604860496050605160526053605460556056605760586059606060616062606360646065606660676068606960706071607260736074607560766077607860796080608160826083608460856086608760886089609060916092609360946095609660976098609961006101610261036104610561066107610861096110611161126113611461156116611761186119612061216122612361246125612661276128612961306131613261336134613561366137613861396140614161426143614461456146614761486149615061516152615361546155615661576158615961606161616261636164616561666167616861696170617161726173617461756176617761786179618061816182618361846185618661876188618961906191619261936194619561966197619861996200620162026203620462056206620762086209621062116212621362146215621662176218621962206221622262236224622562266227622862296230623162326233623462356236623762386239624062416242624362446245624662476248624962506251625262536254625562566257625862596260626162626263626462656266626762686269627062716272627362746275627662776278627962806281628262836284628562866287628862896290629162926293629462956296629762986299630063016302630363046305630663076308630963106311631263136314631563166317631863196320632163226323632463256326632763286329633063316332633363346335633663376338633963406341634263436344634563466347634863496350635163526353635463556356635763586359636063616362636363646365636663676368636963706371637263736374637563766377637863796380638163826383638463856386638763886389639063916392639363946395639663976398639964006401640264036404640564066407640864096410641164126413641464156416641764186419642064216422642364246425642664276428642964306431643264336434643564366437643864396440644164426443644464456446644764486449645064516452645364546455645664576458645964606461646264636464646564666467646864696470647164726473647464756476647764786479648064816482648364846485648664876488648964906491649264936494649564966497649864996500650165026503650465056506650765086509651065116512651365146515651665176518651965206521652265236524652565266527652865296530653165326533653465356536653765386539654065416542654365446545654665476548654965506551655265536554655565566557655865596560656165626563656465656566656765686569657065716572657365746575657665776578657965806581658265836584658565866587658865896590659165926593659465956596659765986599660066016602660366046605660666076608660966106611661266136614661566166617661866196620662166226623662466256626662766286629663066316632663366346635663666376638663966406641664266436644664566466647664866496650665166526653665466556656665766586659666066616662666366646665666666676668666966706671667266736674667566766677667866796680668166826683668466856686668766886689669066916692669366946695669666976698669967006701670267036704670567066707670867096710671167126713671467156716671767186719672067216722672367246725672667276728672967306731673267336734673567366737673867396740674167426743674467456746674767486749675067516752675367546755675667576758675967606761676267636764676567666767676867696770677167726773677467756776677767786779678067816782678367846785678667876788678967906791679267936794679567966797679867996800680168026803680468056806680768086809681068116812681368146815681668176818681968206821682268236824682568266827682868296830683168326833683468356836683768386839684068416842684368446845684668476848684968506851685268536854685568566857685868596860686168626863686468656866686768686869687068716872687368746875687668776878687968806881688268836884688568866887688868896890689168926893689468956896689768986899690069016902690369046905690669076908690969106911691269136914691569166917691869196920692169226923692469256926692769286929693069316932693369346935693669376938693969406941694269436944694569466947694869496950695169526953695469556956695769586959696069616962696369646965696669676968696969706971697269736974697569766977697869796980698169826983698469856986698769886989699069916992699369946995699669976998699970007001700270037004700570067007700870097010701170127013701470157016701770187019702070217022702370247025702670277028702970307031703270337034703570367037703870397040704170427043704470457046704770487049705070517052705370547055705670577058705970607061706270637064706570667067706870697070707170727073707470757076707770787079708070817082708370847085708670877088708970907091709270937094709570967097709870997100710171027103710471057106710771087109711071117112711371147115711671177118711971207121712271237124712571267127712871297130713171327133713471357136713771387139714071417142714371447145714671477148714971507151715271537154715571567157715871597160716171627163716471657166716771687169717071717172717371747175717671777178717971807181718271837184718571867187718871897190719171927193719471957196719771987199720072017202720372047205720672077208720972107211721272137214721572167217721872197220722172227223722472257226722772287229723072317232723372347235723672377238723972407241724272437244724572467247724872497250725172527253725472557256725772587259726072617262726372647265726672677268726972707271727272737274727572767277727872797280728172827283728472857286728772887289729072917292729372947295729672977298729973007301730273037304730573067307730873097310731173127313731473157316731773187319732073217322732373247325732673277328732973307331733273337334733573367337733873397340734173427343734473457346734773487349735073517352735373547355735673577358735973607361736273637364736573667367736873697370737173727373737473757376737773787379738073817382738373847385738673877388738973907391739273937394739573967397739873997400740174027403740474057406740774087409741074117412741374147415741674177418741974207421742274237424742574267427742874297430743174327433743474357436743774387439744074417442744374447445744674477448744974507451745274537454745574567457745874597460746174627463746474657466746774687469747074717472747374747475747674777478747974807481748274837484748574867487748874897490749174927493749474957496749774987499750075017502750375047505750675077508750975107511751275137514751575167517751875197520752175227523752475257526752775287529753075317532753375347535753675377538753975407541754275437544754575467547754875497550755175527553755475557556755775587559756075617562756375647565756675677568756975707571757275737574757575767577757875797580758175827583758475857586758775887589759075917592759375947595759675977598759976007601760276037604760576067607760876097610761176127613761476157616761776187619762076217622762376247625762676277628762976307631763276337634763576367637763876397640764176427643764476457646764776487649765076517652765376547655765676577658765976607661766276637664766576667667766876697670767176727673767476757676767776787679768076817682768376847685768676877688768976907691769276937694769576967697769876997700770177027703770477057706770777087709771077117712771377147715771677177718771977207721772277237724772577267727772877297730773177327733773477357736773777387739774077417742774377447745774677477748774977507751775277537754775577567757775877597760776177627763776477657766776777687769777077717772777377747775777677777778777977807781778277837784778577867787778877897790779177927793779477957796779777987799780078017802780378047805780678077808780978107811781278137814781578167817781878197820782178227823782478257826782778287829783078317832783378347835783678377838783978407841784278437844784578467847784878497850785178527853785478557856785778587859786078617862786378647865786678677868786978707871787278737874787578767877787878797880788178827883788478857886788778887889789078917892789378947895789678977898789979007901790279037904790579067907790879097910791179127913791479157916791779187919792079217922792379247925792679277928792979307931793279337934793579367937793879397940794179427943794479457946794779487949795079517952795379547955795679577958795979607961796279637964796579667967796879697970797179727973797479757976797779787979798079817982798379847985798679877988798979907991799279937994799579967997799879998000800180028003800480058006800780088009801080118012801380148015801680178018801980208021802280238024802580268027802880298030803180328033803480358036803780388039804080418042804380448045804680478048804980508051805280538054805580568057805880598060806180628063806480658066806780688069807080718072807380748075807680778078807980808081808280838084808580868087808880898090809180928093809480958096809780988099810081018102810381048105810681078108810981108111811281138114811581168117811881198120812181228123812481258126812781288129813081318132813381348135813681378138813981408141814281438144814581468147814881498150815181528153815481558156815781588159816081618162816381648165816681678168816981708171817281738174817581768177817881798180818181828183818481858186818781888189819081918192819381948195819681978198819982008201820282038204820582068207820882098210821182128213821482158216821782188219822082218222822382248225822682278228822982308231823282338234823582368237823882398240824182428243824482458246824782488249825082518252825382548255825682578258825982608261826282638264826582668267826882698270827182728273827482758276827782788279828082818282828382848285828682878288828982908291829282938294829582968297829882998300830183028303830483058306830783088309831083118312831383148315831683178318831983208321832283238324832583268327832883298330833183328333833483358336833783388339834083418342834383448345834683478348834983508351835283538354835583568357835883598360836183628363836483658366836783688369837083718372837383748375837683778378837983808381838283838384838583868387838883898390839183928393839483958396839783988399840084018402840384048405840684078408840984108411841284138414841584168417841884198420842184228423842484258426842784288429843084318432843384348435843684378438843984408441844284438444844584468447844884498450845184528453845484558456845784588459846084618462846384648465846684678468846984708471847284738474847584768477847884798480848184828483848484858486848784888489849084918492849384948495849684978498849985008501850285038504850585068507850885098510851185128513851485158516851785188519852085218522852385248525852685278528852985308531853285338534853585368537853885398540854185428543854485458546854785488549855085518552855385548555855685578558855985608561856285638564856585668567856885698570857185728573857485758576857785788579858085818582858385848585858685878588858985908591859285938594859585968597859885998600860186028603860486058606860786088609861086118612861386148615861686178618861986208621862286238624862586268627862886298630863186328633863486358636863786388639864086418642864386448645864686478648864986508651865286538654865586568657865886598660866186628663866486658666866786688669867086718672867386748675867686778678867986808681868286838684868586868687868886898690869186928693869486958696869786988699870087018702870387048705870687078708870987108711871287138714871587168717871887198720872187228723872487258726872787288729873087318732873387348735873687378738873987408741874287438744874587468747874887498750875187528753875487558756875787588759876087618762876387648765876687678768876987708771877287738774877587768777877887798780878187828783878487858786878787888789879087918792879387948795879687978798879988008801880288038804880588068807880888098810881188128813881488158816881788188819882088218822882388248825882688278828882988308831883288338834883588368837883888398840884188428843884488458846884788488849885088518852885388548855885688578858885988608861886288638864886588668867886888698870887188728873887488758876887788788879888088818882888388848885888688878888888988908891889288938894889588968897889888998900890189028903890489058906890789088909891089118912891389148915891689178918891989208921892289238924892589268927892889298930893189328933893489358936893789388939894089418942894389448945894689478948894989508951895289538954895589568957895889598960896189628963896489658966896789688969897089718972897389748975897689778978897989808981898289838984898589868987898889898990899189928993899489958996899789988999900090019002900390049005900690079008900990109011901290139014901590169017901890199020902190229023902490259026902790289029903090319032903390349035903690379038903990409041904290439044904590469047904890499050905190529053905490559056905790589059906090619062906390649065906690679068906990709071907290739074907590769077907890799080908190829083908490859086908790889089909090919092909390949095909690979098909991009101910291039104910591069107910891099110911191129113911491159116911791189119912091219122912391249125912691279128912991309131913291339134913591369137913891399140914191429143914491459146914791489149915091519152915391549155915691579158915991609161916291639164916591669167916891699170917191729173917491759176917791789179918091819182918391849185918691879188918991909191919291939194919591969197919891999200920192029203920492059206920792089209921092119212921392149215921692179218921992209221922292239224922592269227922892299230923192329233923492359236923792389239924092419242924392449245924692479248924992509251925292539254925592569257925892599260926192629263926492659266926792689269927092719272927392749275927692779278927992809281928292839284928592869287928892899290929192929293929492959296929792989299930093019302930393049305930693079308930993109311931293139314931593169317931893199320932193229323932493259326932793289329933093319332933393349335933693379338933993409341934293439344934593469347934893499350935193529353935493559356935793589359936093619362936393649365936693679368936993709371937293739374937593769377937893799380938193829383938493859386938793889389939093919392939393949395939693979398939994009401940294039404940594069407940894099410941194129413941494159416941794189419942094219422942394249425942694279428942994309431943294339434943594369437943894399440944194429443944494459446944794489449945094519452945394549455945694579458945994609461946294639464946594669467946894699470947194729473947494759476947794789479948094819482948394849485948694879488948994909491949294939494949594969497949894999500950195029503950495059506950795089509951095119512951395149515951695179518951995209521952295239524952595269527952895299530953195329533953495359536953795389539954095419542954395449545954695479548954995509551955295539554955595569557955895599560956195629563956495659566956795689569957095719572957395749575957695779578957995809581958295839584958595869587958895899590959195929593959495959596959795989599960096019602960396049605960696079608960996109611961296139614961596169617961896199620962196229623962496259626962796289629963096319632963396349635963696379638963996409641964296439644964596469647964896499650965196529653965496559656965796589659966096619662966396649665966696679668966996709671967296739674967596769677967896799680968196829683968496859686968796889689969096919692969396949695969696979698969997009701970297039704970597069707970897099710971197129713971497159716971797189719972097219722972397249725972697279728972997309731973297339734973597369737973897399740974197429743974497459746974797489749975097519752975397549755975697579758975997609761976297639764976597669767976897699770977197729773977497759776977797789779978097819782978397849785978697879788978997909791979297939794979597969797979897999800980198029803980498059806980798089809981098119812981398149815981698179818981998209821982298239824982598269827982898299830983198329833983498359836983798389839984098419842984398449845984698479848984998509851985298539854985598569857985898599860986198629863986498659866986798689869987098719872987398749875987698779878987998809881988298839884988598869887988898899890989198929893989498959896989798989899990099019902990399049905990699079908990999109911991299139914991599169917991899199920992199229923992499259926992799289929993099319932993399349935993699379938993999409941994299439944994599469947994899499950995199529953995499559956995799589959996099619962996399649965996699679968996999709971997299739974997599769977997899799980998199829983998499859986998799889989999099919992999399949995999699979998999910000100011000210003100041000510006100071000810009100101001110012100131001410015100161001710018100191002010021100221002310024100251002610027100281002910030100311003210033100341003510036100371003810039100401004110042100431004410045100461004710048100491005010051100521005310054100551005610057100581005910060100611006210063100641006510066100671006810069100701007110072100731007410075100761007710078100791008010081100821008310084100851008610087100881008910090100911009210093100941009510096100971009810099101001010110102101031010410105101061010710108101091011010111101121011310114101151011610117101181011910120101211012210123101241012510126101271012810129101301013110132101331013410135101361013710138101391014010141101421014310144101451014610147101481014910150101511015210153101541015510156101571015810159101601016110162101631016410165101661016710168101691017010171101721017310174101751017610177101781017910180101811018210183101841018510186101871018810189101901019110192101931019410195101961019710198101991020010201102021020310204102051020610207102081020910210102111021210213102141021510216102171021810219102201022110222102231022410225102261022710228102291023010231102321023310234102351023610237102381023910240102411024210243102441024510246102471024810249102501025110252102531025410255102561025710258102591026010261102621026310264102651026610267102681026910270102711027210273102741027510276102771027810279102801028110282102831028410285102861028710288102891029010291102921029310294102951029610297102981029910300103011030210303103041030510306103071030810309103101031110312103131031410315103161031710318103191032010321103221032310324103251032610327103281032910330103311033210333103341033510336103371033810339103401034110342103431034410345103461034710348103491035010351103521035310354103551035610357103581035910360103611036210363103641036510366103671036810369103701037110372103731037410375103761037710378103791038010381103821038310384103851038610387103881038910390103911039210393103941039510396103971039810399104001040110402104031040410405104061040710408104091041010411104121041310414104151041610417104181041910420104211042210423104241042510426104271042810429104301043110432104331043410435104361043710438104391044010441104421044310444104451044610447104481044910450104511045210453104541045510456104571045810459104601046110462104631046410465104661046710468104691047010471104721047310474104751047610477104781047910480104811048210483104841048510486104871048810489104901049110492104931049410495104961049710498104991050010501105021050310504105051050610507105081050910510105111051210513105141051510516105171051810519105201052110522105231052410525105261052710528105291053010531105321053310534105351053610537105381053910540105411054210543105441054510546105471054810549105501055110552105531055410555105561055710558105591056010561105621056310564105651056610567105681056910570105711057210573105741057510576105771057810579105801058110582105831058410585105861058710588105891059010591105921059310594105951059610597105981059910600106011060210603106041060510606106071060810609106101061110612106131061410615106161061710618106191062010621106221062310624106251062610627106281062910630106311063210633106341063510636106371063810639106401064110642106431064410645106461064710648106491065010651106521065310654106551065610657106581065910660106611066210663106641066510666106671066810669106701067110672106731067410675106761067710678106791068010681106821068310684106851068610687106881068910690106911069210693106941069510696106971069810699107001070110702107031070410705107061070710708107091071010711107121071310714107151071610717107181071910720107211072210723107241072510726107271072810729107301073110732107331073410735107361073710738107391074010741107421074310744107451074610747107481074910750107511075210753107541075510756107571075810759107601076110762107631076410765107661076710768107691077010771107721077310774107751077610777107781077910780107811078210783107841078510786107871078810789107901079110792107931079410795107961079710798107991080010801108021080310804108051080610807108081080910810108111081210813108141081510816108171081810819108201082110822108231082410825108261082710828108291083010831108321083310834108351083610837108381083910840108411084210843108441084510846108471084810849108501085110852108531085410855108561085710858108591086010861108621086310864108651086610867108681086910870108711087210873108741087510876108771087810879108801088110882108831088410885108861088710888108891089010891108921089310894108951089610897108981089910900109011090210903109041090510906109071090810909109101091110912109131091410915109161091710918109191092010921109221092310924109251092610927109281092910930109311093210933109341093510936109371093810939109401094110942109431094410945109461094710948109491095010951109521095310954109551095610957109581095910960109611096210963109641096510966109671096810969109701097110972109731097410975109761097710978109791098010981109821098310984109851098610987109881098910990109911099210993109941099510996109971099810999110001100111002110031100411005110061100711008110091101011011110121101311014110151101611017110181101911020110211102211023110241102511026110271102811029110301103111032110331103411035110361103711038110391104011041110421104311044110451104611047110481104911050110511105211053110541105511056110571105811059110601106111062110631106411065110661106711068110691107011071110721107311074110751107611077110781107911080110811108211083110841108511086110871108811089110901109111092110931109411095110961109711098110991110011101111021110311104111051110611107111081110911110111111111211113111141111511116111171111811119111201112111122111231112411125111261112711128111291113011131111321113311134111351113611137111381113911140111411114211143111441114511146111471114811149111501115111152111531115411155111561115711158111591116011161111621116311164111651116611167111681116911170111711117211173111741117511176111771117811179111801118111182111831118411185111861118711188111891119011191111921119311194111951119611197111981119911200112011120211203112041120511206112071120811209112101121111212112131121411215112161121711218112191122011221112221122311224112251122611227112281122911230112311123211233112341123511236112371123811239112401124111242112431124411245112461124711248112491125011251112521125311254112551125611257112581125911260112611126211263112641126511266112671126811269112701127111272112731127411275112761127711278112791128011281112821128311284112851128611287112881128911290112911129211293112941129511296112971129811299113001130111302113031130411305113061130711308113091131011311113121131311314113151131611317113181131911320113211132211323113241132511326113271132811329113301133111332113331133411335113361133711338113391134011341113421134311344113451134611347113481134911350113511135211353113541135511356113571135811359113601136111362113631136411365113661136711368113691137011371113721137311374113751137611377113781137911380113811138211383113841138511386113871138811389113901139111392113931139411395113961139711398113991140011401114021140311404114051140611407114081140911410114111141211413114141141511416114171141811419114201142111422114231142411425114261142711428114291143011431114321143311434114351143611437114381143911440114411144211443114441144511446114471144811449114501145111452114531145411455114561145711458114591146011461114621146311464114651146611467114681146911470114711147211473114741147511476114771147811479114801148111482114831148411485114861148711488114891149011491114921149311494114951149611497114981149911500115011150211503115041150511506115071150811509115101151111512115131151411515115161151711518115191152011521115221152311524115251152611527115281152911530115311153211533115341153511536115371153811539115401154111542115431154411545115461154711548115491155011551115521155311554115551155611557115581155911560115611156211563115641156511566115671156811569115701157111572115731157411575115761157711578115791158011581115821158311584115851158611587115881158911590115911159211593115941159511596115971159811599116001160111602116031160411605116061160711608116091161011611116121161311614116151161611617116181161911620116211162211623116241162511626116271162811629116301163111632116331163411635116361163711638116391164011641116421164311644116451164611647116481164911650116511165211653116541165511656116571165811659116601166111662116631166411665116661166711668116691167011671116721167311674116751167611677116781167911680116811168211683116841168511686116871168811689116901169111692116931169411695116961169711698116991170011701117021170311704117051170611707117081170911710117111171211713117141171511716117171171811719117201172111722117231172411725117261172711728117291173011731117321173311734117351173611737117381173911740117411174211743117441174511746117471174811749117501175111752117531175411755117561175711758117591176011761117621176311764117651176611767117681176911770117711177211773117741177511776117771177811779117801178111782117831178411785117861178711788117891179011791117921179311794117951179611797117981179911800118011180211803118041180511806118071180811809118101181111812118131181411815118161181711818118191182011821118221182311824118251182611827118281182911830118311183211833118341183511836118371183811839118401184111842118431184411845118461184711848118491185011851118521185311854118551185611857118581185911860118611186211863118641186511866118671186811869118701187111872118731187411875118761187711878118791188011881118821188311884118851188611887118881188911890118911189211893118941189511896118971189811899119001190111902119031190411905119061190711908119091191011911119121191311914119151191611917119181191911920119211192211923119241192511926119271192811929119301193111932119331193411935119361193711938119391194011941119421194311944119451194611947119481194911950119511195211953119541195511956119571195811959119601196111962119631196411965119661196711968119691197011971119721197311974119751197611977119781197911980119811198211983119841198511986119871198811989119901199111992119931199411995119961199711998119991200012001120021200312004120051200612007120081200912010120111201212013120141201512016120171201812019120201202112022
  1. /* Run the Expat test suite
  2. __ __ _
  3. ___\ \/ /_ __ __ _| |_
  4. / _ \\ /| '_ \ / _` | __|
  5. | __// \| |_) | (_| | |_
  6. \___/_/\_\ .__/ \__,_|\__|
  7. |_| XML parser
  8. Copyright (c) 2001-2006 Fred L. Drake, Jr. <[email protected]>
  9. Copyright (c) 2003 Greg Stein <[email protected]>
  10. Copyright (c) 2005-2007 Steven Solie <[email protected]>
  11. Copyright (c) 2005-2012 Karl Waclawek <[email protected]>
  12. Copyright (c) 2016-2022 Sebastian Pipping <[email protected]>
  13. Copyright (c) 2017-2018 Rhodri James <[email protected]>
  14. Copyright (c) 2017 Joe Orton <[email protected]>
  15. Copyright (c) 2017 José Gutiérrez de la Concha <[email protected]>
  16. Copyright (c) 2018 Marco Maggi <[email protected]>
  17. Copyright (c) 2019 David Loffredo <[email protected]>
  18. Copyright (c) 2020 Tim Gates <[email protected]>
  19. Copyright (c) 2021 Dong-hee Na <[email protected]>
  20. Licensed under the MIT license:
  21. Permission is hereby granted, free of charge, to any person obtaining
  22. a copy of this software and associated documentation files (the
  23. "Software"), to deal in the Software without restriction, including
  24. without limitation the rights to use, copy, modify, merge, publish,
  25. distribute, sublicense, and/or sell copies of the Software, and to permit
  26. persons to whom the Software is furnished to do so, subject to the
  27. following conditions:
  28. The above copyright notice and this permission notice shall be included
  29. in all copies or substantial portions of the Software.
  30. THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  31. EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  32. MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN
  33. NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,
  34. DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
  35. OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
  36. USE OR OTHER DEALINGS IN THE SOFTWARE.
  37. */
  38. #include <expat_config.h>
  39. #if defined(NDEBUG)
  40. # undef NDEBUG /* because test suite relies on assert(...) at the moment */
  41. #endif
  42. #include <assert.h>
  43. #include <stdlib.h>
  44. #include <stdio.h>
  45. #include <string.h>
  46. #include <stddef.h> /* ptrdiff_t */
  47. #include <ctype.h>
  48. #include <limits.h>
  49. #include <stdint.h> /* intptr_t uint64_t */
  50. #include <math.h> /* NAN, INFINITY, isnan */
  51. #if ! defined(__cplusplus)
  52. # include <stdbool.h>
  53. #endif
  54. #include "expat.h"
  55. #include "chardata.h"
  56. #include "structdata.h"
  57. #include "internal.h"
  58. #include "minicheck.h"
  59. #include "memcheck.h"
  60. #include "siphash.h"
  61. #include "ascii.h" /* for ASCII_xxx */
  62. #ifdef XML_LARGE_SIZE
  63. # define XML_FMT_INT_MOD "ll"
  64. #else
  65. # define XML_FMT_INT_MOD "l"
  66. #endif
  67. #ifdef XML_UNICODE_WCHAR_T
  68. # define XML_FMT_CHAR "lc"
  69. # define XML_FMT_STR "ls"
  70. # include <wchar.h>
  71. # define xcstrlen(s) wcslen(s)
  72. # define xcstrcmp(s, t) wcscmp((s), (t))
  73. # define xcstrncmp(s, t, n) wcsncmp((s), (t), (n))
  74. # define XCS(s) _XCS(s)
  75. # define _XCS(s) L##s
  76. #else
  77. # ifdef XML_UNICODE
  78. # error "No support for UTF-16 character without wchar_t in tests"
  79. # else
  80. # define XML_FMT_CHAR "c"
  81. # define XML_FMT_STR "s"
  82. # define xcstrlen(s) strlen(s)
  83. # define xcstrcmp(s, t) strcmp((s), (t))
  84. # define xcstrncmp(s, t, n) strncmp((s), (t), (n))
  85. # define XCS(s) s
  86. # endif /* XML_UNICODE */
  87. #endif /* XML_UNICODE_WCHAR_T */
  88. static XML_Parser g_parser = NULL;
  89. static void
  90. tcase_add_test__ifdef_xml_dtd(TCase *tc, tcase_test_function test) {
  91. #ifdef XML_DTD
  92. tcase_add_test(tc, test);
  93. #else
  94. UNUSED_P(tc);
  95. UNUSED_P(test);
  96. #endif
  97. }
  98. static void
  99. basic_setup(void) {
  100. g_parser = XML_ParserCreate(NULL);
  101. if (g_parser == NULL)
  102. fail("Parser not created.");
  103. }
  104. static void
  105. basic_teardown(void) {
  106. if (g_parser != NULL) {
  107. XML_ParserFree(g_parser);
  108. g_parser = NULL;
  109. }
  110. }
  111. /* Generate a failure using the parser state to create an error message;
  112. this should be used when the parser reports an error we weren't
  113. expecting.
  114. */
  115. static void
  116. _xml_failure(XML_Parser parser, const char *file, int line) {
  117. char buffer[1024];
  118. enum XML_Error err = XML_GetErrorCode(parser);
  119. sprintf(buffer,
  120. " %d: %" XML_FMT_STR " (line %" XML_FMT_INT_MOD
  121. "u, offset %" XML_FMT_INT_MOD "u)\n reported from %s, line %d\n",
  122. err, XML_ErrorString(err), XML_GetCurrentLineNumber(parser),
  123. XML_GetCurrentColumnNumber(parser), file, line);
  124. _fail_unless(0, file, line, buffer);
  125. }
  126. static enum XML_Status
  127. _XML_Parse_SINGLE_BYTES(XML_Parser parser, const char *s, int len,
  128. int isFinal) {
  129. enum XML_Status res = XML_STATUS_ERROR;
  130. int offset = 0;
  131. if (len == 0) {
  132. return XML_Parse(parser, s, len, isFinal);
  133. }
  134. for (; offset < len; offset++) {
  135. const int innerIsFinal = (offset == len - 1) && isFinal;
  136. const char c = s[offset]; /* to help out-of-bounds detection */
  137. res = XML_Parse(parser, &c, sizeof(char), innerIsFinal);
  138. if (res != XML_STATUS_OK) {
  139. return res;
  140. }
  141. }
  142. return res;
  143. }
  144. #define xml_failure(parser) _xml_failure((parser), __FILE__, __LINE__)
  145. static void
  146. _expect_failure(const char *text, enum XML_Error errorCode,
  147. const char *errorMessage, const char *file, int lineno) {
  148. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  149. == XML_STATUS_OK)
  150. /* Hackish use of _fail_unless() macro, but let's us report
  151. the right filename and line number. */
  152. _fail_unless(0, file, lineno, errorMessage);
  153. if (XML_GetErrorCode(g_parser) != errorCode)
  154. _xml_failure(g_parser, file, lineno);
  155. }
  156. #define expect_failure(text, errorCode, errorMessage) \
  157. _expect_failure((text), (errorCode), (errorMessage), __FILE__, __LINE__)
  158. /* Dummy handlers for when we need to set a handler to tickle a bug,
  159. but it doesn't need to do anything.
  160. */
  161. static unsigned long dummy_handler_flags = 0;
  162. #define DUMMY_START_DOCTYPE_HANDLER_FLAG (1UL << 0)
  163. #define DUMMY_END_DOCTYPE_HANDLER_FLAG (1UL << 1)
  164. #define DUMMY_ENTITY_DECL_HANDLER_FLAG (1UL << 2)
  165. #define DUMMY_NOTATION_DECL_HANDLER_FLAG (1UL << 3)
  166. #define DUMMY_ELEMENT_DECL_HANDLER_FLAG (1UL << 4)
  167. #define DUMMY_ATTLIST_DECL_HANDLER_FLAG (1UL << 5)
  168. #define DUMMY_COMMENT_HANDLER_FLAG (1UL << 6)
  169. #define DUMMY_PI_HANDLER_FLAG (1UL << 7)
  170. #define DUMMY_START_ELEMENT_HANDLER_FLAG (1UL << 8)
  171. #define DUMMY_START_CDATA_HANDLER_FLAG (1UL << 9)
  172. #define DUMMY_END_CDATA_HANDLER_FLAG (1UL << 10)
  173. #define DUMMY_UNPARSED_ENTITY_DECL_HANDLER_FLAG (1UL << 11)
  174. #define DUMMY_START_NS_DECL_HANDLER_FLAG (1UL << 12)
  175. #define DUMMY_END_NS_DECL_HANDLER_FLAG (1UL << 13)
  176. #define DUMMY_START_DOCTYPE_DECL_HANDLER_FLAG (1UL << 14)
  177. #define DUMMY_END_DOCTYPE_DECL_HANDLER_FLAG (1UL << 15)
  178. #define DUMMY_SKIP_HANDLER_FLAG (1UL << 16)
  179. #define DUMMY_DEFAULT_HANDLER_FLAG (1UL << 17)
  180. static void XMLCALL
  181. dummy_xdecl_handler(void *userData, const XML_Char *version,
  182. const XML_Char *encoding, int standalone) {
  183. UNUSED_P(userData);
  184. UNUSED_P(version);
  185. UNUSED_P(encoding);
  186. UNUSED_P(standalone);
  187. }
  188. static void XMLCALL
  189. dummy_start_doctype_handler(void *userData, const XML_Char *doctypeName,
  190. const XML_Char *sysid, const XML_Char *pubid,
  191. int has_internal_subset) {
  192. UNUSED_P(userData);
  193. UNUSED_P(doctypeName);
  194. UNUSED_P(sysid);
  195. UNUSED_P(pubid);
  196. UNUSED_P(has_internal_subset);
  197. dummy_handler_flags |= DUMMY_START_DOCTYPE_HANDLER_FLAG;
  198. }
  199. static void XMLCALL
  200. dummy_end_doctype_handler(void *userData) {
  201. UNUSED_P(userData);
  202. dummy_handler_flags |= DUMMY_END_DOCTYPE_HANDLER_FLAG;
  203. }
  204. static void XMLCALL
  205. dummy_entity_decl_handler(void *userData, const XML_Char *entityName,
  206. int is_parameter_entity, const XML_Char *value,
  207. int value_length, const XML_Char *base,
  208. const XML_Char *systemId, const XML_Char *publicId,
  209. const XML_Char *notationName) {
  210. UNUSED_P(userData);
  211. UNUSED_P(entityName);
  212. UNUSED_P(is_parameter_entity);
  213. UNUSED_P(value);
  214. UNUSED_P(value_length);
  215. UNUSED_P(base);
  216. UNUSED_P(systemId);
  217. UNUSED_P(publicId);
  218. UNUSED_P(notationName);
  219. dummy_handler_flags |= DUMMY_ENTITY_DECL_HANDLER_FLAG;
  220. }
  221. static void XMLCALL
  222. dummy_notation_decl_handler(void *userData, const XML_Char *notationName,
  223. const XML_Char *base, const XML_Char *systemId,
  224. const XML_Char *publicId) {
  225. UNUSED_P(userData);
  226. UNUSED_P(notationName);
  227. UNUSED_P(base);
  228. UNUSED_P(systemId);
  229. UNUSED_P(publicId);
  230. dummy_handler_flags |= DUMMY_NOTATION_DECL_HANDLER_FLAG;
  231. }
  232. static void XMLCALL
  233. dummy_element_decl_handler(void *userData, const XML_Char *name,
  234. XML_Content *model) {
  235. UNUSED_P(userData);
  236. UNUSED_P(name);
  237. /* The content model must be freed by the handler. Unfortunately
  238. * we cannot pass the parser as the userData because this is used
  239. * with other handlers that require other userData.
  240. */
  241. XML_FreeContentModel(g_parser, model);
  242. dummy_handler_flags |= DUMMY_ELEMENT_DECL_HANDLER_FLAG;
  243. }
  244. static void XMLCALL
  245. dummy_attlist_decl_handler(void *userData, const XML_Char *elname,
  246. const XML_Char *attname, const XML_Char *att_type,
  247. const XML_Char *dflt, int isrequired) {
  248. UNUSED_P(userData);
  249. UNUSED_P(elname);
  250. UNUSED_P(attname);
  251. UNUSED_P(att_type);
  252. UNUSED_P(dflt);
  253. UNUSED_P(isrequired);
  254. dummy_handler_flags |= DUMMY_ATTLIST_DECL_HANDLER_FLAG;
  255. }
  256. static void XMLCALL
  257. dummy_comment_handler(void *userData, const XML_Char *data) {
  258. UNUSED_P(userData);
  259. UNUSED_P(data);
  260. dummy_handler_flags |= DUMMY_COMMENT_HANDLER_FLAG;
  261. }
  262. static void XMLCALL
  263. dummy_pi_handler(void *userData, const XML_Char *target, const XML_Char *data) {
  264. UNUSED_P(userData);
  265. UNUSED_P(target);
  266. UNUSED_P(data);
  267. dummy_handler_flags |= DUMMY_PI_HANDLER_FLAG;
  268. }
  269. static void XMLCALL
  270. dummy_start_element(void *userData, const XML_Char *name,
  271. const XML_Char **atts) {
  272. UNUSED_P(userData);
  273. UNUSED_P(name);
  274. UNUSED_P(atts);
  275. dummy_handler_flags |= DUMMY_START_ELEMENT_HANDLER_FLAG;
  276. }
  277. static void XMLCALL
  278. dummy_end_element(void *userData, const XML_Char *name) {
  279. UNUSED_P(userData);
  280. UNUSED_P(name);
  281. }
  282. static void XMLCALL
  283. dummy_start_cdata_handler(void *userData) {
  284. UNUSED_P(userData);
  285. dummy_handler_flags |= DUMMY_START_CDATA_HANDLER_FLAG;
  286. }
  287. static void XMLCALL
  288. dummy_end_cdata_handler(void *userData) {
  289. UNUSED_P(userData);
  290. dummy_handler_flags |= DUMMY_END_CDATA_HANDLER_FLAG;
  291. }
  292. static void XMLCALL
  293. dummy_cdata_handler(void *userData, const XML_Char *s, int len) {
  294. UNUSED_P(userData);
  295. UNUSED_P(s);
  296. UNUSED_P(len);
  297. }
  298. static void XMLCALL
  299. dummy_start_namespace_decl_handler(void *userData, const XML_Char *prefix,
  300. const XML_Char *uri) {
  301. UNUSED_P(userData);
  302. UNUSED_P(prefix);
  303. UNUSED_P(uri);
  304. dummy_handler_flags |= DUMMY_START_NS_DECL_HANDLER_FLAG;
  305. }
  306. static void XMLCALL
  307. dummy_end_namespace_decl_handler(void *userData, const XML_Char *prefix) {
  308. UNUSED_P(userData);
  309. UNUSED_P(prefix);
  310. dummy_handler_flags |= DUMMY_END_NS_DECL_HANDLER_FLAG;
  311. }
  312. /* This handler is obsolete, but while the code exists we should
  313. * ensure that dealing with the handler is covered by tests.
  314. */
  315. static void XMLCALL
  316. dummy_unparsed_entity_decl_handler(void *userData, const XML_Char *entityName,
  317. const XML_Char *base,
  318. const XML_Char *systemId,
  319. const XML_Char *publicId,
  320. const XML_Char *notationName) {
  321. UNUSED_P(userData);
  322. UNUSED_P(entityName);
  323. UNUSED_P(base);
  324. UNUSED_P(systemId);
  325. UNUSED_P(publicId);
  326. UNUSED_P(notationName);
  327. dummy_handler_flags |= DUMMY_UNPARSED_ENTITY_DECL_HANDLER_FLAG;
  328. }
  329. static void XMLCALL
  330. dummy_default_handler(void *userData, const XML_Char *s, int len) {
  331. UNUSED_P(userData);
  332. UNUSED_P(s);
  333. UNUSED_P(len);
  334. }
  335. static void XMLCALL
  336. dummy_start_doctype_decl_handler(void *userData, const XML_Char *doctypeName,
  337. const XML_Char *sysid, const XML_Char *pubid,
  338. int has_internal_subset) {
  339. UNUSED_P(userData);
  340. UNUSED_P(doctypeName);
  341. UNUSED_P(sysid);
  342. UNUSED_P(pubid);
  343. UNUSED_P(has_internal_subset);
  344. dummy_handler_flags |= DUMMY_START_DOCTYPE_DECL_HANDLER_FLAG;
  345. }
  346. static void XMLCALL
  347. dummy_end_doctype_decl_handler(void *userData) {
  348. UNUSED_P(userData);
  349. dummy_handler_flags |= DUMMY_END_DOCTYPE_DECL_HANDLER_FLAG;
  350. }
  351. static void XMLCALL
  352. dummy_skip_handler(void *userData, const XML_Char *entityName,
  353. int is_parameter_entity) {
  354. UNUSED_P(userData);
  355. UNUSED_P(entityName);
  356. UNUSED_P(is_parameter_entity);
  357. dummy_handler_flags |= DUMMY_SKIP_HANDLER_FLAG;
  358. }
  359. /* Useful external entity handler */
  360. typedef struct ExtOption {
  361. const XML_Char *system_id;
  362. const char *parse_text;
  363. } ExtOption;
  364. static int XMLCALL
  365. external_entity_optioner(XML_Parser parser, const XML_Char *context,
  366. const XML_Char *base, const XML_Char *systemId,
  367. const XML_Char *publicId) {
  368. ExtOption *options = (ExtOption *)XML_GetUserData(parser);
  369. XML_Parser ext_parser;
  370. UNUSED_P(base);
  371. UNUSED_P(publicId);
  372. while (options->parse_text != NULL) {
  373. if (! xcstrcmp(systemId, options->system_id)) {
  374. enum XML_Status rc;
  375. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  376. if (ext_parser == NULL)
  377. return XML_STATUS_ERROR;
  378. rc = _XML_Parse_SINGLE_BYTES(ext_parser, options->parse_text,
  379. (int)strlen(options->parse_text), XML_TRUE);
  380. XML_ParserFree(ext_parser);
  381. return rc;
  382. }
  383. options++;
  384. }
  385. fail("No suitable option found");
  386. return XML_STATUS_ERROR;
  387. }
  388. /*
  389. * Parameter entity evaluation support.
  390. */
  391. #define ENTITY_MATCH_FAIL (-1)
  392. #define ENTITY_MATCH_NOT_FOUND (0)
  393. #define ENTITY_MATCH_SUCCESS (1)
  394. static const XML_Char *entity_name_to_match = NULL;
  395. static const XML_Char *entity_value_to_match = NULL;
  396. static int entity_match_flag = ENTITY_MATCH_NOT_FOUND;
  397. static void XMLCALL
  398. param_entity_match_handler(void *userData, const XML_Char *entityName,
  399. int is_parameter_entity, const XML_Char *value,
  400. int value_length, const XML_Char *base,
  401. const XML_Char *systemId, const XML_Char *publicId,
  402. const XML_Char *notationName) {
  403. UNUSED_P(userData);
  404. UNUSED_P(base);
  405. UNUSED_P(systemId);
  406. UNUSED_P(publicId);
  407. UNUSED_P(notationName);
  408. if (! is_parameter_entity || entity_name_to_match == NULL
  409. || entity_value_to_match == NULL) {
  410. return;
  411. }
  412. if (! xcstrcmp(entityName, entity_name_to_match)) {
  413. /* The cast here is safe because we control the horizontal and
  414. * the vertical, and we therefore know our strings are never
  415. * going to overflow an int.
  416. */
  417. if (value_length != (int)xcstrlen(entity_value_to_match)
  418. || xcstrncmp(value, entity_value_to_match, value_length)) {
  419. entity_match_flag = ENTITY_MATCH_FAIL;
  420. } else {
  421. entity_match_flag = ENTITY_MATCH_SUCCESS;
  422. }
  423. }
  424. /* Else leave the match flag alone */
  425. }
  426. /*
  427. * Character & encoding tests.
  428. */
  429. START_TEST(test_nul_byte) {
  430. char text[] = "<doc>\0</doc>";
  431. /* test that a NUL byte (in US-ASCII data) is an error */
  432. if (_XML_Parse_SINGLE_BYTES(g_parser, text, sizeof(text) - 1, XML_TRUE)
  433. == XML_STATUS_OK)
  434. fail("Parser did not report error on NUL-byte.");
  435. if (XML_GetErrorCode(g_parser) != XML_ERROR_INVALID_TOKEN)
  436. xml_failure(g_parser);
  437. }
  438. END_TEST
  439. START_TEST(test_u0000_char) {
  440. /* test that a NUL byte (in US-ASCII data) is an error */
  441. expect_failure("<doc>&#0;</doc>", XML_ERROR_BAD_CHAR_REF,
  442. "Parser did not report error on NUL-byte.");
  443. }
  444. END_TEST
  445. START_TEST(test_siphash_self) {
  446. if (! sip24_valid())
  447. fail("SipHash self-test failed");
  448. }
  449. END_TEST
  450. START_TEST(test_siphash_spec) {
  451. /* https://131002.net/siphash/siphash.pdf (page 19, "Test values") */
  452. const char message[] = "\x00\x01\x02\x03\x04\x05\x06\x07\x08\x09"
  453. "\x0a\x0b\x0c\x0d\x0e";
  454. const size_t len = sizeof(message) - 1;
  455. const uint64_t expected = _SIP_ULL(0xa129ca61U, 0x49be45e5U);
  456. struct siphash state;
  457. struct sipkey key;
  458. sip_tokey(&key, "\x00\x01\x02\x03\x04\x05\x06\x07\x08\x09"
  459. "\x0a\x0b\x0c\x0d\x0e\x0f");
  460. sip24_init(&state, &key);
  461. /* Cover spread across calls */
  462. sip24_update(&state, message, 4);
  463. sip24_update(&state, message + 4, len - 4);
  464. /* Cover null length */
  465. sip24_update(&state, message, 0);
  466. if (sip24_final(&state) != expected)
  467. fail("sip24_final failed spec test\n");
  468. /* Cover wrapper */
  469. if (siphash24(message, len, &key) != expected)
  470. fail("siphash24 failed spec test\n");
  471. }
  472. END_TEST
  473. START_TEST(test_bom_utf8) {
  474. /* This test is really just making sure we don't core on a UTF-8 BOM. */
  475. const char *text = "\357\273\277<e/>";
  476. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  477. == XML_STATUS_ERROR)
  478. xml_failure(g_parser);
  479. }
  480. END_TEST
  481. START_TEST(test_bom_utf16_be) {
  482. char text[] = "\376\377\0<\0e\0/\0>";
  483. if (_XML_Parse_SINGLE_BYTES(g_parser, text, sizeof(text) - 1, XML_TRUE)
  484. == XML_STATUS_ERROR)
  485. xml_failure(g_parser);
  486. }
  487. END_TEST
  488. START_TEST(test_bom_utf16_le) {
  489. char text[] = "\377\376<\0e\0/\0>\0";
  490. if (_XML_Parse_SINGLE_BYTES(g_parser, text, sizeof(text) - 1, XML_TRUE)
  491. == XML_STATUS_ERROR)
  492. xml_failure(g_parser);
  493. }
  494. END_TEST
  495. /* Parse whole buffer at once to exercise a different code path */
  496. START_TEST(test_nobom_utf16_le) {
  497. char text[] = " \0<\0e\0/\0>\0";
  498. if (XML_Parse(g_parser, text, sizeof(text) - 1, XML_TRUE) == XML_STATUS_ERROR)
  499. xml_failure(g_parser);
  500. }
  501. END_TEST
  502. static void XMLCALL
  503. accumulate_characters(void *userData, const XML_Char *s, int len) {
  504. CharData_AppendXMLChars((CharData *)userData, s, len);
  505. }
  506. static void XMLCALL
  507. accumulate_attribute(void *userData, const XML_Char *name,
  508. const XML_Char **atts) {
  509. CharData *storage = (CharData *)userData;
  510. UNUSED_P(name);
  511. /* Check there are attributes to deal with */
  512. if (atts == NULL)
  513. return;
  514. while (storage->count < 0 && atts[0] != NULL) {
  515. /* "accumulate" the value of the first attribute we see */
  516. CharData_AppendXMLChars(storage, atts[1], -1);
  517. atts += 2;
  518. }
  519. }
  520. static void
  521. _run_character_check(const char *text, const XML_Char *expected,
  522. const char *file, int line) {
  523. CharData storage;
  524. CharData_Init(&storage);
  525. XML_SetUserData(g_parser, &storage);
  526. XML_SetCharacterDataHandler(g_parser, accumulate_characters);
  527. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  528. == XML_STATUS_ERROR)
  529. _xml_failure(g_parser, file, line);
  530. CharData_CheckXMLChars(&storage, expected);
  531. }
  532. #define run_character_check(text, expected) \
  533. _run_character_check(text, expected, __FILE__, __LINE__)
  534. static void
  535. _run_attribute_check(const char *text, const XML_Char *expected,
  536. const char *file, int line) {
  537. CharData storage;
  538. CharData_Init(&storage);
  539. XML_SetUserData(g_parser, &storage);
  540. XML_SetStartElementHandler(g_parser, accumulate_attribute);
  541. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  542. == XML_STATUS_ERROR)
  543. _xml_failure(g_parser, file, line);
  544. CharData_CheckXMLChars(&storage, expected);
  545. }
  546. #define run_attribute_check(text, expected) \
  547. _run_attribute_check(text, expected, __FILE__, __LINE__)
  548. typedef struct ExtTest {
  549. const char *parse_text;
  550. const XML_Char *encoding;
  551. CharData *storage;
  552. } ExtTest;
  553. static void XMLCALL
  554. ext_accumulate_characters(void *userData, const XML_Char *s, int len) {
  555. ExtTest *test_data = (ExtTest *)userData;
  556. accumulate_characters(test_data->storage, s, len);
  557. }
  558. static void
  559. _run_ext_character_check(const char *text, ExtTest *test_data,
  560. const XML_Char *expected, const char *file, int line) {
  561. CharData *const storage = (CharData *)malloc(sizeof(CharData));
  562. CharData_Init(storage);
  563. test_data->storage = storage;
  564. XML_SetUserData(g_parser, test_data);
  565. XML_SetCharacterDataHandler(g_parser, ext_accumulate_characters);
  566. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  567. == XML_STATUS_ERROR)
  568. _xml_failure(g_parser, file, line);
  569. CharData_CheckXMLChars(storage, expected);
  570. free(storage);
  571. }
  572. #define run_ext_character_check(text, test_data, expected) \
  573. _run_ext_character_check(text, test_data, expected, __FILE__, __LINE__)
  574. /* Regression test for SF bug #491986. */
  575. START_TEST(test_danish_latin1) {
  576. const char *text = "<?xml version='1.0' encoding='iso-8859-1'?>\n"
  577. "<e>J\xF8rgen \xE6\xF8\xE5\xC6\xD8\xC5</e>";
  578. #ifdef XML_UNICODE
  579. const XML_Char *expected
  580. = XCS("J\x00f8rgen \x00e6\x00f8\x00e5\x00c6\x00d8\x00c5");
  581. #else
  582. const XML_Char *expected
  583. = XCS("J\xC3\xB8rgen \xC3\xA6\xC3\xB8\xC3\xA5\xC3\x86\xC3\x98\xC3\x85");
  584. #endif
  585. run_character_check(text, expected);
  586. }
  587. END_TEST
  588. /* Regression test for SF bug #514281. */
  589. START_TEST(test_french_charref_hexidecimal) {
  590. const char *text = "<?xml version='1.0' encoding='iso-8859-1'?>\n"
  591. "<doc>&#xE9;&#xE8;&#xE0;&#xE7;&#xEA;&#xC8;</doc>";
  592. #ifdef XML_UNICODE
  593. const XML_Char *expected = XCS("\x00e9\x00e8\x00e0\x00e7\x00ea\x00c8");
  594. #else
  595. const XML_Char *expected
  596. = XCS("\xC3\xA9\xC3\xA8\xC3\xA0\xC3\xA7\xC3\xAA\xC3\x88");
  597. #endif
  598. run_character_check(text, expected);
  599. }
  600. END_TEST
  601. START_TEST(test_french_charref_decimal) {
  602. const char *text = "<?xml version='1.0' encoding='iso-8859-1'?>\n"
  603. "<doc>&#233;&#232;&#224;&#231;&#234;&#200;</doc>";
  604. #ifdef XML_UNICODE
  605. const XML_Char *expected = XCS("\x00e9\x00e8\x00e0\x00e7\x00ea\x00c8");
  606. #else
  607. const XML_Char *expected
  608. = XCS("\xC3\xA9\xC3\xA8\xC3\xA0\xC3\xA7\xC3\xAA\xC3\x88");
  609. #endif
  610. run_character_check(text, expected);
  611. }
  612. END_TEST
  613. START_TEST(test_french_latin1) {
  614. const char *text = "<?xml version='1.0' encoding='iso-8859-1'?>\n"
  615. "<doc>\xE9\xE8\xE0\xE7\xEa\xC8</doc>";
  616. #ifdef XML_UNICODE
  617. const XML_Char *expected = XCS("\x00e9\x00e8\x00e0\x00e7\x00ea\x00c8");
  618. #else
  619. const XML_Char *expected
  620. = XCS("\xC3\xA9\xC3\xA8\xC3\xA0\xC3\xA7\xC3\xAA\xC3\x88");
  621. #endif
  622. run_character_check(text, expected);
  623. }
  624. END_TEST
  625. START_TEST(test_french_utf8) {
  626. const char *text = "<?xml version='1.0' encoding='utf-8'?>\n"
  627. "<doc>\xC3\xA9</doc>";
  628. #ifdef XML_UNICODE
  629. const XML_Char *expected = XCS("\x00e9");
  630. #else
  631. const XML_Char *expected = XCS("\xC3\xA9");
  632. #endif
  633. run_character_check(text, expected);
  634. }
  635. END_TEST
  636. /* Regression test for SF bug #600479.
  637. XXX There should be a test that exercises all legal XML Unicode
  638. characters as PCDATA and attribute value content, and XML Name
  639. characters as part of element and attribute names.
  640. */
  641. START_TEST(test_utf8_false_rejection) {
  642. const char *text = "<doc>\xEF\xBA\xBF</doc>";
  643. #ifdef XML_UNICODE
  644. const XML_Char *expected = XCS("\xfebf");
  645. #else
  646. const XML_Char *expected = XCS("\xEF\xBA\xBF");
  647. #endif
  648. run_character_check(text, expected);
  649. }
  650. END_TEST
  651. /* Regression test for SF bug #477667.
  652. This test assures that any 8-bit character followed by a 7-bit
  653. character will not be mistakenly interpreted as a valid UTF-8
  654. sequence.
  655. */
  656. START_TEST(test_illegal_utf8) {
  657. char text[100];
  658. int i;
  659. for (i = 128; i <= 255; ++i) {
  660. sprintf(text, "<e>%ccd</e>", i);
  661. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  662. == XML_STATUS_OK) {
  663. sprintf(text, "expected token error for '%c' (ordinal %d) in UTF-8 text",
  664. i, i);
  665. fail(text);
  666. } else if (XML_GetErrorCode(g_parser) != XML_ERROR_INVALID_TOKEN)
  667. xml_failure(g_parser);
  668. /* Reset the parser since we use the same parser repeatedly. */
  669. XML_ParserReset(g_parser, NULL);
  670. }
  671. }
  672. END_TEST
  673. /* Examples, not masks: */
  674. #define UTF8_LEAD_1 "\x7f" /* 0b01111111 */
  675. #define UTF8_LEAD_2 "\xdf" /* 0b11011111 */
  676. #define UTF8_LEAD_3 "\xef" /* 0b11101111 */
  677. #define UTF8_LEAD_4 "\xf7" /* 0b11110111 */
  678. #define UTF8_FOLLOW "\xbf" /* 0b10111111 */
  679. START_TEST(test_utf8_auto_align) {
  680. struct TestCase {
  681. ptrdiff_t expectedMovementInChars;
  682. const char *input;
  683. };
  684. struct TestCase cases[] = {
  685. {00, ""},
  686. {00, UTF8_LEAD_1},
  687. {-1, UTF8_LEAD_2},
  688. {00, UTF8_LEAD_2 UTF8_FOLLOW},
  689. {-1, UTF8_LEAD_3},
  690. {-2, UTF8_LEAD_3 UTF8_FOLLOW},
  691. {00, UTF8_LEAD_3 UTF8_FOLLOW UTF8_FOLLOW},
  692. {-1, UTF8_LEAD_4},
  693. {-2, UTF8_LEAD_4 UTF8_FOLLOW},
  694. {-3, UTF8_LEAD_4 UTF8_FOLLOW UTF8_FOLLOW},
  695. {00, UTF8_LEAD_4 UTF8_FOLLOW UTF8_FOLLOW UTF8_FOLLOW},
  696. };
  697. size_t i = 0;
  698. bool success = true;
  699. for (; i < sizeof(cases) / sizeof(*cases); i++) {
  700. const char *fromLim = cases[i].input + strlen(cases[i].input);
  701. const char *const fromLimInitially = fromLim;
  702. ptrdiff_t actualMovementInChars;
  703. _INTERNAL_trim_to_complete_utf8_characters(cases[i].input, &fromLim);
  704. actualMovementInChars = (fromLim - fromLimInitially);
  705. if (actualMovementInChars != cases[i].expectedMovementInChars) {
  706. size_t j = 0;
  707. success = false;
  708. printf("[-] UTF-8 case %2u: Expected movement by %2d chars"
  709. ", actually moved by %2d chars: \"",
  710. (unsigned)(i + 1), (int)cases[i].expectedMovementInChars,
  711. (int)actualMovementInChars);
  712. for (; j < strlen(cases[i].input); j++) {
  713. printf("\\x%02x", (unsigned char)cases[i].input[j]);
  714. }
  715. printf("\"\n");
  716. }
  717. }
  718. if (! success) {
  719. fail("UTF-8 auto-alignment is not bullet-proof\n");
  720. }
  721. }
  722. END_TEST
  723. START_TEST(test_utf16) {
  724. /* <?xml version="1.0" encoding="UTF-16"?>
  725. * <doc a='123'>some {A} text</doc>
  726. *
  727. * where {A} is U+FF21, FULLWIDTH LATIN CAPITAL LETTER A
  728. */
  729. char text[]
  730. = "\000<\000?\000x\000m\000\154\000 \000v\000e\000r\000s\000i\000o"
  731. "\000n\000=\000'\0001\000.\000\060\000'\000 \000e\000n\000c\000o"
  732. "\000d\000i\000n\000g\000=\000'\000U\000T\000F\000-\0001\000\066"
  733. "\000'\000?\000>\000\n"
  734. "\000<\000d\000o\000c\000 \000a\000=\000'\0001\0002\0003\000'\000>"
  735. "\000s\000o\000m\000e\000 \xff\x21\000 \000t\000e\000x\000t\000"
  736. "<\000/\000d\000o\000c\000>";
  737. #ifdef XML_UNICODE
  738. const XML_Char *expected = XCS("some \xff21 text");
  739. #else
  740. const XML_Char *expected = XCS("some \357\274\241 text");
  741. #endif
  742. CharData storage;
  743. CharData_Init(&storage);
  744. XML_SetUserData(g_parser, &storage);
  745. XML_SetCharacterDataHandler(g_parser, accumulate_characters);
  746. if (_XML_Parse_SINGLE_BYTES(g_parser, text, sizeof(text) - 1, XML_TRUE)
  747. == XML_STATUS_ERROR)
  748. xml_failure(g_parser);
  749. CharData_CheckXMLChars(&storage, expected);
  750. }
  751. END_TEST
  752. START_TEST(test_utf16_le_epilog_newline) {
  753. unsigned int first_chunk_bytes = 17;
  754. char text[] = "\xFF\xFE" /* BOM */
  755. "<\000e\000/\000>\000" /* document element */
  756. "\r\000\n\000\r\000\n\000"; /* epilog */
  757. if (first_chunk_bytes >= sizeof(text) - 1)
  758. fail("bad value of first_chunk_bytes");
  759. if (_XML_Parse_SINGLE_BYTES(g_parser, text, first_chunk_bytes, XML_FALSE)
  760. == XML_STATUS_ERROR)
  761. xml_failure(g_parser);
  762. else {
  763. enum XML_Status rc;
  764. rc = _XML_Parse_SINGLE_BYTES(g_parser, text + first_chunk_bytes,
  765. sizeof(text) - first_chunk_bytes - 1,
  766. XML_TRUE);
  767. if (rc == XML_STATUS_ERROR)
  768. xml_failure(g_parser);
  769. }
  770. }
  771. END_TEST
  772. /* Test that an outright lie in the encoding is faulted */
  773. START_TEST(test_not_utf16) {
  774. const char *text = "<?xml version='1.0' encoding='utf-16'?>"
  775. "<doc>Hi</doc>";
  776. /* Use a handler to provoke the appropriate code paths */
  777. XML_SetXmlDeclHandler(g_parser, dummy_xdecl_handler);
  778. expect_failure(text, XML_ERROR_INCORRECT_ENCODING,
  779. "UTF-16 declared in UTF-8 not faulted");
  780. }
  781. END_TEST
  782. /* Test that an unknown encoding is rejected */
  783. START_TEST(test_bad_encoding) {
  784. const char *text = "<doc>Hi</doc>";
  785. if (! XML_SetEncoding(g_parser, XCS("unknown-encoding")))
  786. fail("XML_SetEncoding failed");
  787. expect_failure(text, XML_ERROR_UNKNOWN_ENCODING,
  788. "Unknown encoding not faulted");
  789. }
  790. END_TEST
  791. /* Regression test for SF bug #481609, #774028. */
  792. START_TEST(test_latin1_umlauts) {
  793. const char *text
  794. = "<?xml version='1.0' encoding='iso-8859-1'?>\n"
  795. "<e a='\xE4 \xF6 \xFC &#228; &#246; &#252; &#x00E4; &#x0F6; &#xFC; >'\n"
  796. " >\xE4 \xF6 \xFC &#228; &#246; &#252; &#x00E4; &#x0F6; &#xFC; ></e>";
  797. #ifdef XML_UNICODE
  798. /* Expected results in UTF-16 */
  799. const XML_Char *expected = XCS("\x00e4 \x00f6 \x00fc ")
  800. XCS("\x00e4 \x00f6 \x00fc ") XCS("\x00e4 \x00f6 \x00fc >");
  801. #else
  802. /* Expected results in UTF-8 */
  803. const XML_Char *expected = XCS("\xC3\xA4 \xC3\xB6 \xC3\xBC ")
  804. XCS("\xC3\xA4 \xC3\xB6 \xC3\xBC ") XCS("\xC3\xA4 \xC3\xB6 \xC3\xBC >");
  805. #endif
  806. run_character_check(text, expected);
  807. XML_ParserReset(g_parser, NULL);
  808. run_attribute_check(text, expected);
  809. /* Repeat with a default handler */
  810. XML_ParserReset(g_parser, NULL);
  811. XML_SetDefaultHandler(g_parser, dummy_default_handler);
  812. run_character_check(text, expected);
  813. XML_ParserReset(g_parser, NULL);
  814. XML_SetDefaultHandler(g_parser, dummy_default_handler);
  815. run_attribute_check(text, expected);
  816. }
  817. END_TEST
  818. /* Test that an element name with a 4-byte UTF-8 character is rejected */
  819. START_TEST(test_long_utf8_character) {
  820. const char *text
  821. = "<?xml version='1.0' encoding='utf-8'?>\n"
  822. /* 0xf0 0x90 0x80 0x80 = U+10000, the first Linear B character */
  823. "<do\xf0\x90\x80\x80/>";
  824. expect_failure(text, XML_ERROR_INVALID_TOKEN,
  825. "4-byte UTF-8 character in element name not faulted");
  826. }
  827. END_TEST
  828. /* Test that a long latin-1 attribute (too long to convert in one go)
  829. * is correctly converted
  830. */
  831. START_TEST(test_long_latin1_attribute) {
  832. const char *text
  833. = "<?xml version='1.0' encoding='iso-8859-1'?>\n"
  834. "<doc att='"
  835. /* 64 characters per line */
  836. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  837. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  838. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  839. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  840. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  841. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  842. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  843. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  844. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  845. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  846. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  847. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  848. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  849. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  850. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  851. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  852. /* Last character splits across a buffer boundary */
  853. "\xe4'>\n</doc>";
  854. const XML_Char *expected =
  855. /* 64 characters per line */
  856. /* clang-format off */
  857. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  858. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  859. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  860. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  861. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  862. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  863. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  864. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  865. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  866. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  867. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  868. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  869. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  870. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  871. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  872. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO")
  873. /* clang-format on */
  874. #ifdef XML_UNICODE
  875. XCS("\x00e4");
  876. #else
  877. XCS("\xc3\xa4");
  878. #endif
  879. run_attribute_check(text, expected);
  880. }
  881. END_TEST
  882. /* Test that a long ASCII attribute (too long to convert in one go)
  883. * is correctly converted
  884. */
  885. START_TEST(test_long_ascii_attribute) {
  886. const char *text
  887. = "<?xml version='1.0' encoding='us-ascii'?>\n"
  888. "<doc att='"
  889. /* 64 characters per line */
  890. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  891. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  892. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  893. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  894. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  895. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  896. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  897. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  898. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  899. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  900. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  901. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  902. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  903. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  904. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  905. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  906. "01234'>\n</doc>";
  907. const XML_Char *expected =
  908. /* 64 characters per line */
  909. /* clang-format off */
  910. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  911. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  912. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  913. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  914. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  915. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  916. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  917. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  918. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  919. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  920. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  921. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  922. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  923. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  924. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  925. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  926. XCS("01234");
  927. /* clang-format on */
  928. run_attribute_check(text, expected);
  929. }
  930. END_TEST
  931. /* Regression test #1 for SF bug #653180. */
  932. START_TEST(test_line_number_after_parse) {
  933. const char *text = "<tag>\n"
  934. "\n"
  935. "\n</tag>";
  936. XML_Size lineno;
  937. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_FALSE)
  938. == XML_STATUS_ERROR)
  939. xml_failure(g_parser);
  940. lineno = XML_GetCurrentLineNumber(g_parser);
  941. if (lineno != 4) {
  942. char buffer[100];
  943. sprintf(buffer, "expected 4 lines, saw %" XML_FMT_INT_MOD "u", lineno);
  944. fail(buffer);
  945. }
  946. }
  947. END_TEST
  948. /* Regression test #2 for SF bug #653180. */
  949. START_TEST(test_column_number_after_parse) {
  950. const char *text = "<tag></tag>";
  951. XML_Size colno;
  952. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_FALSE)
  953. == XML_STATUS_ERROR)
  954. xml_failure(g_parser);
  955. colno = XML_GetCurrentColumnNumber(g_parser);
  956. if (colno != 11) {
  957. char buffer[100];
  958. sprintf(buffer, "expected 11 columns, saw %" XML_FMT_INT_MOD "u", colno);
  959. fail(buffer);
  960. }
  961. }
  962. END_TEST
  963. #define STRUCT_START_TAG 0
  964. #define STRUCT_END_TAG 1
  965. static void XMLCALL
  966. start_element_event_handler2(void *userData, const XML_Char *name,
  967. const XML_Char **attr) {
  968. StructData *storage = (StructData *)userData;
  969. UNUSED_P(attr);
  970. StructData_AddItem(storage, name, XML_GetCurrentColumnNumber(g_parser),
  971. XML_GetCurrentLineNumber(g_parser), STRUCT_START_TAG);
  972. }
  973. static void XMLCALL
  974. end_element_event_handler2(void *userData, const XML_Char *name) {
  975. StructData *storage = (StructData *)userData;
  976. StructData_AddItem(storage, name, XML_GetCurrentColumnNumber(g_parser),
  977. XML_GetCurrentLineNumber(g_parser), STRUCT_END_TAG);
  978. }
  979. /* Regression test #3 for SF bug #653180. */
  980. START_TEST(test_line_and_column_numbers_inside_handlers) {
  981. const char *text = "<a>\n" /* Unix end-of-line */
  982. " <b>\r\n" /* Windows end-of-line */
  983. " <c/>\r" /* Mac OS end-of-line */
  984. " </b>\n"
  985. " <d>\n"
  986. " <f/>\n"
  987. " </d>\n"
  988. "</a>";
  989. const StructDataEntry expected[]
  990. = {{XCS("a"), 0, 1, STRUCT_START_TAG}, {XCS("b"), 2, 2, STRUCT_START_TAG},
  991. {XCS("c"), 4, 3, STRUCT_START_TAG}, {XCS("c"), 8, 3, STRUCT_END_TAG},
  992. {XCS("b"), 2, 4, STRUCT_END_TAG}, {XCS("d"), 2, 5, STRUCT_START_TAG},
  993. {XCS("f"), 4, 6, STRUCT_START_TAG}, {XCS("f"), 8, 6, STRUCT_END_TAG},
  994. {XCS("d"), 2, 7, STRUCT_END_TAG}, {XCS("a"), 0, 8, STRUCT_END_TAG}};
  995. const int expected_count = sizeof(expected) / sizeof(StructDataEntry);
  996. StructData storage;
  997. StructData_Init(&storage);
  998. XML_SetUserData(g_parser, &storage);
  999. XML_SetStartElementHandler(g_parser, start_element_event_handler2);
  1000. XML_SetEndElementHandler(g_parser, end_element_event_handler2);
  1001. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  1002. == XML_STATUS_ERROR)
  1003. xml_failure(g_parser);
  1004. StructData_CheckItems(&storage, expected, expected_count);
  1005. StructData_Dispose(&storage);
  1006. }
  1007. END_TEST
  1008. /* Regression test #4 for SF bug #653180. */
  1009. START_TEST(test_line_number_after_error) {
  1010. const char *text = "<a>\n"
  1011. " <b>\n"
  1012. " </a>"; /* missing </b> */
  1013. XML_Size lineno;
  1014. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_FALSE)
  1015. != XML_STATUS_ERROR)
  1016. fail("Expected a parse error");
  1017. lineno = XML_GetCurrentLineNumber(g_parser);
  1018. if (lineno != 3) {
  1019. char buffer[100];
  1020. sprintf(buffer, "expected 3 lines, saw %" XML_FMT_INT_MOD "u", lineno);
  1021. fail(buffer);
  1022. }
  1023. }
  1024. END_TEST
  1025. /* Regression test #5 for SF bug #653180. */
  1026. START_TEST(test_column_number_after_error) {
  1027. const char *text = "<a>\n"
  1028. " <b>\n"
  1029. " </a>"; /* missing </b> */
  1030. XML_Size colno;
  1031. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_FALSE)
  1032. != XML_STATUS_ERROR)
  1033. fail("Expected a parse error");
  1034. colno = XML_GetCurrentColumnNumber(g_parser);
  1035. if (colno != 4) {
  1036. char buffer[100];
  1037. sprintf(buffer, "expected 4 columns, saw %" XML_FMT_INT_MOD "u", colno);
  1038. fail(buffer);
  1039. }
  1040. }
  1041. END_TEST
  1042. /* Regression test for SF bug #478332. */
  1043. START_TEST(test_really_long_lines) {
  1044. /* This parses an input line longer than INIT_DATA_BUF_SIZE
  1045. characters long (defined to be 1024 in xmlparse.c). We take a
  1046. really cheesy approach to building the input buffer, because
  1047. this avoids writing bugs in buffer-filling code.
  1048. */
  1049. const char *text
  1050. = "<e>"
  1051. /* 64 chars */
  1052. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1053. /* until we have at least 1024 characters on the line: */
  1054. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1055. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1056. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1057. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1058. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1059. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1060. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1061. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1062. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1063. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1064. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1065. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1066. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1067. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1068. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1069. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1070. "</e>";
  1071. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  1072. == XML_STATUS_ERROR)
  1073. xml_failure(g_parser);
  1074. }
  1075. END_TEST
  1076. /* Test cdata processing across a buffer boundary */
  1077. START_TEST(test_really_long_encoded_lines) {
  1078. /* As above, except that we want to provoke an output buffer
  1079. * overflow with a non-trivial encoding. For this we need to pass
  1080. * the whole cdata in one go, not byte-by-byte.
  1081. */
  1082. void *buffer;
  1083. const char *text
  1084. = "<?xml version='1.0' encoding='iso-8859-1'?>"
  1085. "<e>"
  1086. /* 64 chars */
  1087. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1088. /* until we have at least 1024 characters on the line: */
  1089. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1090. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1091. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1092. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1093. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1094. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1095. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1096. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1097. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1098. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1099. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1100. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1101. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1102. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1103. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1104. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
  1105. "</e>";
  1106. int parse_len = (int)strlen(text);
  1107. /* Need a cdata handler to provoke the code path we want to test */
  1108. XML_SetCharacterDataHandler(g_parser, dummy_cdata_handler);
  1109. buffer = XML_GetBuffer(g_parser, parse_len);
  1110. if (buffer == NULL)
  1111. fail("Could not allocate parse buffer");
  1112. assert(buffer != NULL);
  1113. memcpy(buffer, text, parse_len);
  1114. if (XML_ParseBuffer(g_parser, parse_len, XML_TRUE) == XML_STATUS_ERROR)
  1115. xml_failure(g_parser);
  1116. }
  1117. END_TEST
  1118. /*
  1119. * Element event tests.
  1120. */
  1121. static void XMLCALL
  1122. start_element_event_handler(void *userData, const XML_Char *name,
  1123. const XML_Char **atts) {
  1124. UNUSED_P(atts);
  1125. CharData_AppendXMLChars((CharData *)userData, name, -1);
  1126. }
  1127. static void XMLCALL
  1128. end_element_event_handler(void *userData, const XML_Char *name) {
  1129. CharData *storage = (CharData *)userData;
  1130. CharData_AppendXMLChars(storage, XCS("/"), 1);
  1131. CharData_AppendXMLChars(storage, name, -1);
  1132. }
  1133. START_TEST(test_end_element_events) {
  1134. const char *text = "<a><b><c/></b><d><f/></d></a>";
  1135. const XML_Char *expected = XCS("/c/b/f/d/a");
  1136. CharData storage;
  1137. CharData_Init(&storage);
  1138. XML_SetUserData(g_parser, &storage);
  1139. XML_SetEndElementHandler(g_parser, end_element_event_handler);
  1140. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  1141. == XML_STATUS_ERROR)
  1142. xml_failure(g_parser);
  1143. CharData_CheckXMLChars(&storage, expected);
  1144. }
  1145. END_TEST
  1146. /*
  1147. * Attribute tests.
  1148. */
  1149. /* Helpers used by the following test; this checks any "attr" and "refs"
  1150. attributes to make sure whitespace has been normalized.
  1151. Return true if whitespace has been normalized in a string, using
  1152. the rules for attribute value normalization. The 'is_cdata' flag
  1153. is needed since CDATA attributes don't need to have multiple
  1154. whitespace characters collapsed to a single space, while other
  1155. attribute data types do. (Section 3.3.3 of the recommendation.)
  1156. */
  1157. static int
  1158. is_whitespace_normalized(const XML_Char *s, int is_cdata) {
  1159. int blanks = 0;
  1160. int at_start = 1;
  1161. while (*s) {
  1162. if (*s == XCS(' '))
  1163. ++blanks;
  1164. else if (*s == XCS('\t') || *s == XCS('\n') || *s == XCS('\r'))
  1165. return 0;
  1166. else {
  1167. if (at_start) {
  1168. at_start = 0;
  1169. if (blanks && ! is_cdata)
  1170. /* illegal leading blanks */
  1171. return 0;
  1172. } else if (blanks > 1 && ! is_cdata)
  1173. return 0;
  1174. blanks = 0;
  1175. }
  1176. ++s;
  1177. }
  1178. if (blanks && ! is_cdata)
  1179. return 0;
  1180. return 1;
  1181. }
  1182. /* Check the attribute whitespace checker: */
  1183. static void
  1184. testhelper_is_whitespace_normalized(void) {
  1185. assert(is_whitespace_normalized(XCS("abc"), 0));
  1186. assert(is_whitespace_normalized(XCS("abc"), 1));
  1187. assert(is_whitespace_normalized(XCS("abc def ghi"), 0));
  1188. assert(is_whitespace_normalized(XCS("abc def ghi"), 1));
  1189. assert(! is_whitespace_normalized(XCS(" abc def ghi"), 0));
  1190. assert(is_whitespace_normalized(XCS(" abc def ghi"), 1));
  1191. assert(! is_whitespace_normalized(XCS("abc def ghi"), 0));
  1192. assert(is_whitespace_normalized(XCS("abc def ghi"), 1));
  1193. assert(! is_whitespace_normalized(XCS("abc def ghi "), 0));
  1194. assert(is_whitespace_normalized(XCS("abc def ghi "), 1));
  1195. assert(! is_whitespace_normalized(XCS(" "), 0));
  1196. assert(is_whitespace_normalized(XCS(" "), 1));
  1197. assert(! is_whitespace_normalized(XCS("\t"), 0));
  1198. assert(! is_whitespace_normalized(XCS("\t"), 1));
  1199. assert(! is_whitespace_normalized(XCS("\n"), 0));
  1200. assert(! is_whitespace_normalized(XCS("\n"), 1));
  1201. assert(! is_whitespace_normalized(XCS("\r"), 0));
  1202. assert(! is_whitespace_normalized(XCS("\r"), 1));
  1203. assert(! is_whitespace_normalized(XCS("abc\t def"), 1));
  1204. }
  1205. static void XMLCALL
  1206. check_attr_contains_normalized_whitespace(void *userData, const XML_Char *name,
  1207. const XML_Char **atts) {
  1208. int i;
  1209. UNUSED_P(userData);
  1210. UNUSED_P(name);
  1211. for (i = 0; atts[i] != NULL; i += 2) {
  1212. const XML_Char *attrname = atts[i];
  1213. const XML_Char *value = atts[i + 1];
  1214. if (xcstrcmp(XCS("attr"), attrname) == 0
  1215. || xcstrcmp(XCS("ents"), attrname) == 0
  1216. || xcstrcmp(XCS("refs"), attrname) == 0) {
  1217. if (! is_whitespace_normalized(value, 0)) {
  1218. char buffer[256];
  1219. sprintf(buffer,
  1220. "attribute value not normalized: %" XML_FMT_STR
  1221. "='%" XML_FMT_STR "'",
  1222. attrname, value);
  1223. fail(buffer);
  1224. }
  1225. }
  1226. }
  1227. }
  1228. START_TEST(test_attr_whitespace_normalization) {
  1229. const char *text
  1230. = "<!DOCTYPE doc [\n"
  1231. " <!ATTLIST doc\n"
  1232. " attr NMTOKENS #REQUIRED\n"
  1233. " ents ENTITIES #REQUIRED\n"
  1234. " refs IDREFS #REQUIRED>\n"
  1235. "]>\n"
  1236. "<doc attr=' a b c\t\td\te\t' refs=' id-1 \t id-2\t\t' \n"
  1237. " ents=' ent-1 \t\r\n"
  1238. " ent-2 ' >\n"
  1239. " <e id='id-1'/>\n"
  1240. " <e id='id-2'/>\n"
  1241. "</doc>";
  1242. XML_SetStartElementHandler(g_parser,
  1243. check_attr_contains_normalized_whitespace);
  1244. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  1245. == XML_STATUS_ERROR)
  1246. xml_failure(g_parser);
  1247. }
  1248. END_TEST
  1249. /*
  1250. * XML declaration tests.
  1251. */
  1252. START_TEST(test_xmldecl_misplaced) {
  1253. expect_failure("\n"
  1254. "<?xml version='1.0'?>\n"
  1255. "<a/>",
  1256. XML_ERROR_MISPLACED_XML_PI,
  1257. "failed to report misplaced XML declaration");
  1258. }
  1259. END_TEST
  1260. START_TEST(test_xmldecl_invalid) {
  1261. expect_failure("<?xml version='1.0' \xc3\xa7?>\n<doc/>", XML_ERROR_XML_DECL,
  1262. "Failed to report invalid XML declaration");
  1263. }
  1264. END_TEST
  1265. START_TEST(test_xmldecl_missing_attr) {
  1266. expect_failure("<?xml ='1.0'?>\n<doc/>\n", XML_ERROR_XML_DECL,
  1267. "Failed to report missing XML declaration attribute");
  1268. }
  1269. END_TEST
  1270. START_TEST(test_xmldecl_missing_value) {
  1271. expect_failure("<?xml version='1.0' encoding='us-ascii' standalone?>\n"
  1272. "<doc/>",
  1273. XML_ERROR_XML_DECL,
  1274. "Failed to report missing attribute value");
  1275. }
  1276. END_TEST
  1277. /* Regression test for SF bug #584832. */
  1278. static int XMLCALL
  1279. UnknownEncodingHandler(void *data, const XML_Char *encoding,
  1280. XML_Encoding *info) {
  1281. UNUSED_P(data);
  1282. if (xcstrcmp(encoding, XCS("unsupported-encoding")) == 0) {
  1283. int i;
  1284. for (i = 0; i < 256; ++i)
  1285. info->map[i] = i;
  1286. info->data = NULL;
  1287. info->convert = NULL;
  1288. info->release = NULL;
  1289. return XML_STATUS_OK;
  1290. }
  1291. return XML_STATUS_ERROR;
  1292. }
  1293. START_TEST(test_unknown_encoding_internal_entity) {
  1294. const char *text = "<?xml version='1.0' encoding='unsupported-encoding'?>\n"
  1295. "<!DOCTYPE test [<!ENTITY foo 'bar'>]>\n"
  1296. "<test a='&foo;'/>";
  1297. XML_SetUnknownEncodingHandler(g_parser, UnknownEncodingHandler, NULL);
  1298. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  1299. == XML_STATUS_ERROR)
  1300. xml_failure(g_parser);
  1301. }
  1302. END_TEST
  1303. /* Test unrecognised encoding handler */
  1304. static void
  1305. dummy_release(void *data) {
  1306. UNUSED_P(data);
  1307. }
  1308. static int XMLCALL
  1309. UnrecognisedEncodingHandler(void *data, const XML_Char *encoding,
  1310. XML_Encoding *info) {
  1311. UNUSED_P(data);
  1312. UNUSED_P(encoding);
  1313. info->data = NULL;
  1314. info->convert = NULL;
  1315. info->release = dummy_release;
  1316. return XML_STATUS_ERROR;
  1317. }
  1318. START_TEST(test_unrecognised_encoding_internal_entity) {
  1319. const char *text = "<?xml version='1.0' encoding='unsupported-encoding'?>\n"
  1320. "<!DOCTYPE test [<!ENTITY foo 'bar'>]>\n"
  1321. "<test a='&foo;'/>";
  1322. XML_SetUnknownEncodingHandler(g_parser, UnrecognisedEncodingHandler, NULL);
  1323. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  1324. != XML_STATUS_ERROR)
  1325. fail("Unrecognised encoding not rejected");
  1326. }
  1327. END_TEST
  1328. /* Regression test for SF bug #620106. */
  1329. static int XMLCALL
  1330. external_entity_loader(XML_Parser parser, const XML_Char *context,
  1331. const XML_Char *base, const XML_Char *systemId,
  1332. const XML_Char *publicId) {
  1333. ExtTest *test_data = (ExtTest *)XML_GetUserData(parser);
  1334. XML_Parser extparser;
  1335. UNUSED_P(base);
  1336. UNUSED_P(systemId);
  1337. UNUSED_P(publicId);
  1338. extparser = XML_ExternalEntityParserCreate(parser, context, NULL);
  1339. if (extparser == NULL)
  1340. fail("Could not create external entity parser.");
  1341. if (test_data->encoding != NULL) {
  1342. if (! XML_SetEncoding(extparser, test_data->encoding))
  1343. fail("XML_SetEncoding() ignored for external entity");
  1344. }
  1345. if (_XML_Parse_SINGLE_BYTES(extparser, test_data->parse_text,
  1346. (int)strlen(test_data->parse_text), XML_TRUE)
  1347. == XML_STATUS_ERROR) {
  1348. xml_failure(extparser);
  1349. return XML_STATUS_ERROR;
  1350. }
  1351. XML_ParserFree(extparser);
  1352. return XML_STATUS_OK;
  1353. }
  1354. START_TEST(test_ext_entity_set_encoding) {
  1355. const char *text = "<!DOCTYPE doc [\n"
  1356. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  1357. "]>\n"
  1358. "<doc>&en;</doc>";
  1359. ExtTest test_data
  1360. = {/* This text says it's an unsupported encoding, but it's really
  1361. UTF-8, which we tell Expat using XML_SetEncoding().
  1362. */
  1363. "<?xml encoding='iso-8859-3'?>\xC3\xA9", XCS("utf-8"), NULL};
  1364. #ifdef XML_UNICODE
  1365. const XML_Char *expected = XCS("\x00e9");
  1366. #else
  1367. const XML_Char *expected = XCS("\xc3\xa9");
  1368. #endif
  1369. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader);
  1370. run_ext_character_check(text, &test_data, expected);
  1371. }
  1372. END_TEST
  1373. /* Test external entities with no handler */
  1374. START_TEST(test_ext_entity_no_handler) {
  1375. const char *text = "<!DOCTYPE doc [\n"
  1376. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  1377. "]>\n"
  1378. "<doc>&en;</doc>";
  1379. XML_SetDefaultHandler(g_parser, dummy_default_handler);
  1380. run_character_check(text, XCS(""));
  1381. }
  1382. END_TEST
  1383. /* Test UTF-8 BOM is accepted */
  1384. START_TEST(test_ext_entity_set_bom) {
  1385. const char *text = "<!DOCTYPE doc [\n"
  1386. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  1387. "]>\n"
  1388. "<doc>&en;</doc>";
  1389. ExtTest test_data = {"\xEF\xBB\xBF" /* BOM */
  1390. "<?xml encoding='iso-8859-3'?>"
  1391. "\xC3\xA9",
  1392. XCS("utf-8"), NULL};
  1393. #ifdef XML_UNICODE
  1394. const XML_Char *expected = XCS("\x00e9");
  1395. #else
  1396. const XML_Char *expected = XCS("\xc3\xa9");
  1397. #endif
  1398. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader);
  1399. run_ext_character_check(text, &test_data, expected);
  1400. }
  1401. END_TEST
  1402. /* Test that bad encodings are faulted */
  1403. typedef struct ext_faults {
  1404. const char *parse_text;
  1405. const char *fail_text;
  1406. const XML_Char *encoding;
  1407. enum XML_Error error;
  1408. } ExtFaults;
  1409. static int XMLCALL
  1410. external_entity_faulter(XML_Parser parser, const XML_Char *context,
  1411. const XML_Char *base, const XML_Char *systemId,
  1412. const XML_Char *publicId) {
  1413. XML_Parser ext_parser;
  1414. ExtFaults *fault = (ExtFaults *)XML_GetUserData(parser);
  1415. UNUSED_P(base);
  1416. UNUSED_P(systemId);
  1417. UNUSED_P(publicId);
  1418. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  1419. if (ext_parser == NULL)
  1420. fail("Could not create external entity parser");
  1421. if (fault->encoding != NULL) {
  1422. if (! XML_SetEncoding(ext_parser, fault->encoding))
  1423. fail("XML_SetEncoding failed");
  1424. }
  1425. if (_XML_Parse_SINGLE_BYTES(ext_parser, fault->parse_text,
  1426. (int)strlen(fault->parse_text), XML_TRUE)
  1427. != XML_STATUS_ERROR)
  1428. fail(fault->fail_text);
  1429. if (XML_GetErrorCode(ext_parser) != fault->error)
  1430. xml_failure(ext_parser);
  1431. XML_ParserFree(ext_parser);
  1432. return XML_STATUS_ERROR;
  1433. }
  1434. START_TEST(test_ext_entity_bad_encoding) {
  1435. const char *text = "<!DOCTYPE doc [\n"
  1436. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  1437. "]>\n"
  1438. "<doc>&en;</doc>";
  1439. ExtFaults fault
  1440. = {"<?xml encoding='iso-8859-3'?>u", "Unsupported encoding not faulted",
  1441. XCS("unknown"), XML_ERROR_UNKNOWN_ENCODING};
  1442. XML_SetExternalEntityRefHandler(g_parser, external_entity_faulter);
  1443. XML_SetUserData(g_parser, &fault);
  1444. expect_failure(text, XML_ERROR_EXTERNAL_ENTITY_HANDLING,
  1445. "Bad encoding should not have been accepted");
  1446. }
  1447. END_TEST
  1448. /* Try handing an invalid encoding to an external entity parser */
  1449. START_TEST(test_ext_entity_bad_encoding_2) {
  1450. const char *text = "<?xml version='1.0' encoding='us-ascii'?>\n"
  1451. "<!DOCTYPE doc SYSTEM 'foo'>\n"
  1452. "<doc>&entity;</doc>";
  1453. ExtFaults fault
  1454. = {"<!ELEMENT doc (#PCDATA)*>", "Unknown encoding not faulted",
  1455. XCS("unknown-encoding"), XML_ERROR_UNKNOWN_ENCODING};
  1456. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  1457. XML_SetExternalEntityRefHandler(g_parser, external_entity_faulter);
  1458. XML_SetUserData(g_parser, &fault);
  1459. expect_failure(text, XML_ERROR_EXTERNAL_ENTITY_HANDLING,
  1460. "Bad encoding not faulted in external entity handler");
  1461. }
  1462. END_TEST
  1463. /* Test that no error is reported for unknown entities if we don't
  1464. read an external subset. This was fixed in Expat 1.95.5.
  1465. */
  1466. START_TEST(test_wfc_undeclared_entity_unread_external_subset) {
  1467. const char *text = "<!DOCTYPE doc SYSTEM 'foo'>\n"
  1468. "<doc>&entity;</doc>";
  1469. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  1470. == XML_STATUS_ERROR)
  1471. xml_failure(g_parser);
  1472. }
  1473. END_TEST
  1474. /* Test that an error is reported for unknown entities if we don't
  1475. have an external subset.
  1476. */
  1477. START_TEST(test_wfc_undeclared_entity_no_external_subset) {
  1478. expect_failure("<doc>&entity;</doc>", XML_ERROR_UNDEFINED_ENTITY,
  1479. "Parser did not report undefined entity w/out a DTD.");
  1480. }
  1481. END_TEST
  1482. /* Test that an error is reported for unknown entities if we don't
  1483. read an external subset, but have been declared standalone.
  1484. */
  1485. START_TEST(test_wfc_undeclared_entity_standalone) {
  1486. const char *text
  1487. = "<?xml version='1.0' encoding='us-ascii' standalone='yes'?>\n"
  1488. "<!DOCTYPE doc SYSTEM 'foo'>\n"
  1489. "<doc>&entity;</doc>";
  1490. expect_failure(text, XML_ERROR_UNDEFINED_ENTITY,
  1491. "Parser did not report undefined entity (standalone).");
  1492. }
  1493. END_TEST
  1494. /* Test that an error is reported for unknown entities if we have read
  1495. an external subset, and standalone is true.
  1496. */
  1497. START_TEST(test_wfc_undeclared_entity_with_external_subset_standalone) {
  1498. const char *text
  1499. = "<?xml version='1.0' encoding='us-ascii' standalone='yes'?>\n"
  1500. "<!DOCTYPE doc SYSTEM 'foo'>\n"
  1501. "<doc>&entity;</doc>";
  1502. ExtTest test_data = {"<!ELEMENT doc (#PCDATA)*>", NULL, NULL};
  1503. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  1504. XML_SetUserData(g_parser, &test_data);
  1505. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader);
  1506. expect_failure(text, XML_ERROR_UNDEFINED_ENTITY,
  1507. "Parser did not report undefined entity (external DTD).");
  1508. }
  1509. END_TEST
  1510. /* Test that external entity handling is not done if the parsing flag
  1511. * is set to UNLESS_STANDALONE
  1512. */
  1513. START_TEST(test_entity_with_external_subset_unless_standalone) {
  1514. const char *text
  1515. = "<?xml version='1.0' encoding='us-ascii' standalone='yes'?>\n"
  1516. "<!DOCTYPE doc SYSTEM 'foo'>\n"
  1517. "<doc>&entity;</doc>";
  1518. ExtTest test_data = {"<!ENTITY entity 'bar'>", NULL, NULL};
  1519. XML_SetParamEntityParsing(g_parser,
  1520. XML_PARAM_ENTITY_PARSING_UNLESS_STANDALONE);
  1521. XML_SetUserData(g_parser, &test_data);
  1522. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader);
  1523. expect_failure(text, XML_ERROR_UNDEFINED_ENTITY,
  1524. "Parser did not report undefined entity");
  1525. }
  1526. END_TEST
  1527. /* Test that no error is reported for unknown entities if we have read
  1528. an external subset, and standalone is false.
  1529. */
  1530. START_TEST(test_wfc_undeclared_entity_with_external_subset) {
  1531. const char *text = "<?xml version='1.0' encoding='us-ascii'?>\n"
  1532. "<!DOCTYPE doc SYSTEM 'foo'>\n"
  1533. "<doc>&entity;</doc>";
  1534. ExtTest test_data = {"<!ELEMENT doc (#PCDATA)*>", NULL, NULL};
  1535. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  1536. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader);
  1537. run_ext_character_check(text, &test_data, XCS(""));
  1538. }
  1539. END_TEST
  1540. /* Test that an error is reported if our NotStandalone handler fails */
  1541. static int XMLCALL
  1542. reject_not_standalone_handler(void *userData) {
  1543. UNUSED_P(userData);
  1544. return XML_STATUS_ERROR;
  1545. }
  1546. START_TEST(test_not_standalone_handler_reject) {
  1547. const char *text = "<?xml version='1.0' encoding='us-ascii'?>\n"
  1548. "<!DOCTYPE doc SYSTEM 'foo'>\n"
  1549. "<doc>&entity;</doc>";
  1550. ExtTest test_data = {"<!ELEMENT doc (#PCDATA)*>", NULL, NULL};
  1551. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  1552. XML_SetUserData(g_parser, &test_data);
  1553. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader);
  1554. XML_SetNotStandaloneHandler(g_parser, reject_not_standalone_handler);
  1555. expect_failure(text, XML_ERROR_NOT_STANDALONE,
  1556. "NotStandalone handler failed to reject");
  1557. /* Try again but without external entity handling */
  1558. XML_ParserReset(g_parser, NULL);
  1559. XML_SetNotStandaloneHandler(g_parser, reject_not_standalone_handler);
  1560. expect_failure(text, XML_ERROR_NOT_STANDALONE,
  1561. "NotStandalone handler failed to reject");
  1562. }
  1563. END_TEST
  1564. /* Test that no error is reported if our NotStandalone handler succeeds */
  1565. static int XMLCALL
  1566. accept_not_standalone_handler(void *userData) {
  1567. UNUSED_P(userData);
  1568. return XML_STATUS_OK;
  1569. }
  1570. START_TEST(test_not_standalone_handler_accept) {
  1571. const char *text = "<?xml version='1.0' encoding='us-ascii'?>\n"
  1572. "<!DOCTYPE doc SYSTEM 'foo'>\n"
  1573. "<doc>&entity;</doc>";
  1574. ExtTest test_data = {"<!ELEMENT doc (#PCDATA)*>", NULL, NULL};
  1575. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  1576. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader);
  1577. XML_SetNotStandaloneHandler(g_parser, accept_not_standalone_handler);
  1578. run_ext_character_check(text, &test_data, XCS(""));
  1579. /* Repeat without the external entity handler */
  1580. XML_ParserReset(g_parser, NULL);
  1581. XML_SetNotStandaloneHandler(g_parser, accept_not_standalone_handler);
  1582. run_character_check(text, XCS(""));
  1583. }
  1584. END_TEST
  1585. START_TEST(test_wfc_no_recursive_entity_refs) {
  1586. const char *text = "<!DOCTYPE doc [\n"
  1587. " <!ENTITY entity '&#38;entity;'>\n"
  1588. "]>\n"
  1589. "<doc>&entity;</doc>";
  1590. expect_failure(text, XML_ERROR_RECURSIVE_ENTITY_REF,
  1591. "Parser did not report recursive entity reference.");
  1592. }
  1593. END_TEST
  1594. /* Test incomplete external entities are faulted */
  1595. START_TEST(test_ext_entity_invalid_parse) {
  1596. const char *text = "<!DOCTYPE doc [\n"
  1597. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  1598. "]>\n"
  1599. "<doc>&en;</doc>";
  1600. const ExtFaults faults[]
  1601. = {{"<", "Incomplete element declaration not faulted", NULL,
  1602. XML_ERROR_UNCLOSED_TOKEN},
  1603. {"<\xe2\x82", /* First two bytes of a three-byte char */
  1604. "Incomplete character not faulted", NULL, XML_ERROR_PARTIAL_CHAR},
  1605. {"<tag>\xe2\x82", "Incomplete character in CDATA not faulted", NULL,
  1606. XML_ERROR_PARTIAL_CHAR},
  1607. {NULL, NULL, NULL, XML_ERROR_NONE}};
  1608. const ExtFaults *fault = faults;
  1609. for (; fault->parse_text != NULL; fault++) {
  1610. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  1611. XML_SetExternalEntityRefHandler(g_parser, external_entity_faulter);
  1612. XML_SetUserData(g_parser, (void *)fault);
  1613. expect_failure(text, XML_ERROR_EXTERNAL_ENTITY_HANDLING,
  1614. "Parser did not report external entity error");
  1615. XML_ParserReset(g_parser, NULL);
  1616. }
  1617. }
  1618. END_TEST
  1619. /* Regression test for SF bug #483514. */
  1620. START_TEST(test_dtd_default_handling) {
  1621. const char *text = "<!DOCTYPE doc [\n"
  1622. "<!ENTITY e SYSTEM 'http://example.org/e'>\n"
  1623. "<!NOTATION n SYSTEM 'http://example.org/n'>\n"
  1624. "<!ELEMENT doc EMPTY>\n"
  1625. "<!ATTLIST doc a CDATA #IMPLIED>\n"
  1626. "<?pi in dtd?>\n"
  1627. "<!--comment in dtd-->\n"
  1628. "]><doc/>";
  1629. XML_SetDefaultHandler(g_parser, accumulate_characters);
  1630. XML_SetStartDoctypeDeclHandler(g_parser, dummy_start_doctype_handler);
  1631. XML_SetEndDoctypeDeclHandler(g_parser, dummy_end_doctype_handler);
  1632. XML_SetEntityDeclHandler(g_parser, dummy_entity_decl_handler);
  1633. XML_SetNotationDeclHandler(g_parser, dummy_notation_decl_handler);
  1634. XML_SetElementDeclHandler(g_parser, dummy_element_decl_handler);
  1635. XML_SetAttlistDeclHandler(g_parser, dummy_attlist_decl_handler);
  1636. XML_SetProcessingInstructionHandler(g_parser, dummy_pi_handler);
  1637. XML_SetCommentHandler(g_parser, dummy_comment_handler);
  1638. XML_SetStartCdataSectionHandler(g_parser, dummy_start_cdata_handler);
  1639. XML_SetEndCdataSectionHandler(g_parser, dummy_end_cdata_handler);
  1640. run_character_check(text, XCS("\n\n\n\n\n\n\n<doc/>"));
  1641. }
  1642. END_TEST
  1643. /* Test handling of attribute declarations */
  1644. typedef struct AttTest {
  1645. const char *definition;
  1646. const XML_Char *element_name;
  1647. const XML_Char *attr_name;
  1648. const XML_Char *attr_type;
  1649. const XML_Char *default_value;
  1650. int is_required;
  1651. } AttTest;
  1652. static void XMLCALL
  1653. verify_attlist_decl_handler(void *userData, const XML_Char *element_name,
  1654. const XML_Char *attr_name,
  1655. const XML_Char *attr_type,
  1656. const XML_Char *default_value, int is_required) {
  1657. AttTest *at = (AttTest *)userData;
  1658. if (xcstrcmp(element_name, at->element_name))
  1659. fail("Unexpected element name in attribute declaration");
  1660. if (xcstrcmp(attr_name, at->attr_name))
  1661. fail("Unexpected attribute name in attribute declaration");
  1662. if (xcstrcmp(attr_type, at->attr_type))
  1663. fail("Unexpected attribute type in attribute declaration");
  1664. if ((default_value == NULL && at->default_value != NULL)
  1665. || (default_value != NULL && at->default_value == NULL)
  1666. || (default_value != NULL && xcstrcmp(default_value, at->default_value)))
  1667. fail("Unexpected default value in attribute declaration");
  1668. if (is_required != at->is_required)
  1669. fail("Requirement mismatch in attribute declaration");
  1670. }
  1671. START_TEST(test_dtd_attr_handling) {
  1672. const char *prolog = "<!DOCTYPE doc [\n"
  1673. "<!ELEMENT doc EMPTY>\n";
  1674. AttTest attr_data[]
  1675. = {{"<!ATTLIST doc a ( one | two | three ) #REQUIRED>\n"
  1676. "]>"
  1677. "<doc a='two'/>",
  1678. XCS("doc"), XCS("a"),
  1679. XCS("(one|two|three)"), /* Extraneous spaces will be removed */
  1680. NULL, XML_TRUE},
  1681. {"<!NOTATION foo SYSTEM 'http://example.org/foo'>\n"
  1682. "<!ATTLIST doc a NOTATION (foo) #IMPLIED>\n"
  1683. "]>"
  1684. "<doc/>",
  1685. XCS("doc"), XCS("a"), XCS("NOTATION(foo)"), NULL, XML_FALSE},
  1686. {"<!ATTLIST doc a NOTATION (foo) 'bar'>\n"
  1687. "]>"
  1688. "<doc/>",
  1689. XCS("doc"), XCS("a"), XCS("NOTATION(foo)"), XCS("bar"), XML_FALSE},
  1690. {"<!ATTLIST doc a CDATA '\xdb\xb2'>\n"
  1691. "]>"
  1692. "<doc/>",
  1693. XCS("doc"), XCS("a"), XCS("CDATA"),
  1694. #ifdef XML_UNICODE
  1695. XCS("\x06f2"),
  1696. #else
  1697. XCS("\xdb\xb2"),
  1698. #endif
  1699. XML_FALSE},
  1700. {NULL, NULL, NULL, NULL, NULL, XML_FALSE}};
  1701. AttTest *test;
  1702. for (test = attr_data; test->definition != NULL; test++) {
  1703. XML_SetAttlistDeclHandler(g_parser, verify_attlist_decl_handler);
  1704. XML_SetUserData(g_parser, test);
  1705. if (_XML_Parse_SINGLE_BYTES(g_parser, prolog, (int)strlen(prolog),
  1706. XML_FALSE)
  1707. == XML_STATUS_ERROR)
  1708. xml_failure(g_parser);
  1709. if (_XML_Parse_SINGLE_BYTES(g_parser, test->definition,
  1710. (int)strlen(test->definition), XML_TRUE)
  1711. == XML_STATUS_ERROR)
  1712. xml_failure(g_parser);
  1713. XML_ParserReset(g_parser, NULL);
  1714. }
  1715. }
  1716. END_TEST
  1717. /* See related SF bug #673791.
  1718. When namespace processing is enabled, setting the namespace URI for
  1719. a prefix is not allowed; this test ensures that it *is* allowed
  1720. when namespace processing is not enabled.
  1721. (See Namespaces in XML, section 2.)
  1722. */
  1723. START_TEST(test_empty_ns_without_namespaces) {
  1724. const char *text = "<doc xmlns:prefix='http://example.org/'>\n"
  1725. " <e xmlns:prefix=''/>\n"
  1726. "</doc>";
  1727. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  1728. == XML_STATUS_ERROR)
  1729. xml_failure(g_parser);
  1730. }
  1731. END_TEST
  1732. /* Regression test for SF bug #824420.
  1733. Checks that an xmlns:prefix attribute set in an attribute's default
  1734. value isn't misinterpreted.
  1735. */
  1736. START_TEST(test_ns_in_attribute_default_without_namespaces) {
  1737. const char *text = "<!DOCTYPE e:element [\n"
  1738. " <!ATTLIST e:element\n"
  1739. " xmlns:e CDATA 'http://example.org/'>\n"
  1740. " ]>\n"
  1741. "<e:element/>";
  1742. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  1743. == XML_STATUS_ERROR)
  1744. xml_failure(g_parser);
  1745. }
  1746. END_TEST
  1747. static const char *long_character_data_text
  1748. = "<?xml version='1.0' encoding='iso-8859-1'?><s>"
  1749. "012345678901234567890123456789012345678901234567890123456789"
  1750. "012345678901234567890123456789012345678901234567890123456789"
  1751. "012345678901234567890123456789012345678901234567890123456789"
  1752. "012345678901234567890123456789012345678901234567890123456789"
  1753. "012345678901234567890123456789012345678901234567890123456789"
  1754. "012345678901234567890123456789012345678901234567890123456789"
  1755. "012345678901234567890123456789012345678901234567890123456789"
  1756. "012345678901234567890123456789012345678901234567890123456789"
  1757. "012345678901234567890123456789012345678901234567890123456789"
  1758. "012345678901234567890123456789012345678901234567890123456789"
  1759. "012345678901234567890123456789012345678901234567890123456789"
  1760. "012345678901234567890123456789012345678901234567890123456789"
  1761. "012345678901234567890123456789012345678901234567890123456789"
  1762. "012345678901234567890123456789012345678901234567890123456789"
  1763. "012345678901234567890123456789012345678901234567890123456789"
  1764. "012345678901234567890123456789012345678901234567890123456789"
  1765. "012345678901234567890123456789012345678901234567890123456789"
  1766. "012345678901234567890123456789012345678901234567890123456789"
  1767. "012345678901234567890123456789012345678901234567890123456789"
  1768. "012345678901234567890123456789012345678901234567890123456789"
  1769. "</s>";
  1770. static XML_Bool resumable = XML_FALSE;
  1771. static void
  1772. clearing_aborting_character_handler(void *userData, const XML_Char *s,
  1773. int len) {
  1774. UNUSED_P(userData);
  1775. UNUSED_P(s);
  1776. UNUSED_P(len);
  1777. XML_StopParser(g_parser, resumable);
  1778. XML_SetCharacterDataHandler(g_parser, NULL);
  1779. }
  1780. /* Regression test for SF bug #1515266: missing check of stopped
  1781. parser in doContext() 'for' loop. */
  1782. START_TEST(test_stop_parser_between_char_data_calls) {
  1783. /* The sample data must be big enough that there are two calls to
  1784. the character data handler from within the inner "for" loop of
  1785. the XML_TOK_DATA_CHARS case in doContent(), and the character
  1786. handler must stop the parser and clear the character data
  1787. handler.
  1788. */
  1789. const char *text = long_character_data_text;
  1790. XML_SetCharacterDataHandler(g_parser, clearing_aborting_character_handler);
  1791. resumable = XML_FALSE;
  1792. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  1793. != XML_STATUS_ERROR)
  1794. xml_failure(g_parser);
  1795. if (XML_GetErrorCode(g_parser) != XML_ERROR_ABORTED)
  1796. xml_failure(g_parser);
  1797. }
  1798. END_TEST
  1799. /* Regression test for SF bug #1515266: missing check of stopped
  1800. parser in doContext() 'for' loop. */
  1801. START_TEST(test_suspend_parser_between_char_data_calls) {
  1802. /* The sample data must be big enough that there are two calls to
  1803. the character data handler from within the inner "for" loop of
  1804. the XML_TOK_DATA_CHARS case in doContent(), and the character
  1805. handler must stop the parser and clear the character data
  1806. handler.
  1807. */
  1808. const char *text = long_character_data_text;
  1809. XML_SetCharacterDataHandler(g_parser, clearing_aborting_character_handler);
  1810. resumable = XML_TRUE;
  1811. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  1812. != XML_STATUS_SUSPENDED)
  1813. xml_failure(g_parser);
  1814. if (XML_GetErrorCode(g_parser) != XML_ERROR_NONE)
  1815. xml_failure(g_parser);
  1816. /* Try parsing directly */
  1817. if (XML_Parse(g_parser, text, (int)strlen(text), XML_TRUE)
  1818. != XML_STATUS_ERROR)
  1819. fail("Attempt to continue parse while suspended not faulted");
  1820. if (XML_GetErrorCode(g_parser) != XML_ERROR_SUSPENDED)
  1821. fail("Suspended parse not faulted with correct error");
  1822. }
  1823. END_TEST
  1824. static XML_Bool abortable = XML_FALSE;
  1825. static void
  1826. parser_stop_character_handler(void *userData, const XML_Char *s, int len) {
  1827. UNUSED_P(userData);
  1828. UNUSED_P(s);
  1829. UNUSED_P(len);
  1830. XML_StopParser(g_parser, resumable);
  1831. XML_SetCharacterDataHandler(g_parser, NULL);
  1832. if (! resumable) {
  1833. /* Check that aborting an aborted parser is faulted */
  1834. if (XML_StopParser(g_parser, XML_FALSE) != XML_STATUS_ERROR)
  1835. fail("Aborting aborted parser not faulted");
  1836. if (XML_GetErrorCode(g_parser) != XML_ERROR_FINISHED)
  1837. xml_failure(g_parser);
  1838. } else if (abortable) {
  1839. /* Check that aborting a suspended parser works */
  1840. if (XML_StopParser(g_parser, XML_FALSE) == XML_STATUS_ERROR)
  1841. xml_failure(g_parser);
  1842. } else {
  1843. /* Check that suspending a suspended parser works */
  1844. if (XML_StopParser(g_parser, XML_TRUE) != XML_STATUS_ERROR)
  1845. fail("Suspending suspended parser not faulted");
  1846. if (XML_GetErrorCode(g_parser) != XML_ERROR_SUSPENDED)
  1847. xml_failure(g_parser);
  1848. }
  1849. }
  1850. /* Test repeated calls to XML_StopParser are handled correctly */
  1851. START_TEST(test_repeated_stop_parser_between_char_data_calls) {
  1852. const char *text = long_character_data_text;
  1853. XML_SetCharacterDataHandler(g_parser, parser_stop_character_handler);
  1854. resumable = XML_FALSE;
  1855. abortable = XML_FALSE;
  1856. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  1857. != XML_STATUS_ERROR)
  1858. fail("Failed to double-stop parser");
  1859. XML_ParserReset(g_parser, NULL);
  1860. XML_SetCharacterDataHandler(g_parser, parser_stop_character_handler);
  1861. resumable = XML_TRUE;
  1862. abortable = XML_FALSE;
  1863. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  1864. != XML_STATUS_SUSPENDED)
  1865. fail("Failed to double-suspend parser");
  1866. XML_ParserReset(g_parser, NULL);
  1867. XML_SetCharacterDataHandler(g_parser, parser_stop_character_handler);
  1868. resumable = XML_TRUE;
  1869. abortable = XML_TRUE;
  1870. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  1871. != XML_STATUS_ERROR)
  1872. fail("Failed to suspend-abort parser");
  1873. }
  1874. END_TEST
  1875. START_TEST(test_good_cdata_ascii) {
  1876. const char *text = "<a><![CDATA[<greeting>Hello, world!</greeting>]]></a>";
  1877. const XML_Char *expected = XCS("<greeting>Hello, world!</greeting>");
  1878. CharData storage;
  1879. CharData_Init(&storage);
  1880. XML_SetUserData(g_parser, &storage);
  1881. XML_SetCharacterDataHandler(g_parser, accumulate_characters);
  1882. /* Add start and end handlers for coverage */
  1883. XML_SetStartCdataSectionHandler(g_parser, dummy_start_cdata_handler);
  1884. XML_SetEndCdataSectionHandler(g_parser, dummy_end_cdata_handler);
  1885. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  1886. == XML_STATUS_ERROR)
  1887. xml_failure(g_parser);
  1888. CharData_CheckXMLChars(&storage, expected);
  1889. /* Try again, this time with a default handler */
  1890. XML_ParserReset(g_parser, NULL);
  1891. CharData_Init(&storage);
  1892. XML_SetUserData(g_parser, &storage);
  1893. XML_SetCharacterDataHandler(g_parser, accumulate_characters);
  1894. XML_SetDefaultHandler(g_parser, dummy_default_handler);
  1895. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  1896. == XML_STATUS_ERROR)
  1897. xml_failure(g_parser);
  1898. CharData_CheckXMLChars(&storage, expected);
  1899. }
  1900. END_TEST
  1901. START_TEST(test_good_cdata_utf16) {
  1902. /* Test data is:
  1903. * <?xml version='1.0' encoding='utf-16'?>
  1904. * <a><![CDATA[hello]]></a>
  1905. */
  1906. const char text[]
  1907. = "\0<\0?\0x\0m\0l\0"
  1908. " \0v\0e\0r\0s\0i\0o\0n\0=\0'\0\x31\0.\0\x30\0'\0"
  1909. " \0e\0n\0c\0o\0d\0i\0n\0g\0=\0'\0u\0t\0f\0-\0"
  1910. "1\0"
  1911. "6\0'"
  1912. "\0?\0>\0\n"
  1913. "\0<\0a\0>\0<\0!\0[\0C\0D\0A\0T\0A\0[\0h\0e\0l\0l\0o\0]\0]\0>\0<\0/\0a\0>";
  1914. const XML_Char *expected = XCS("hello");
  1915. CharData storage;
  1916. CharData_Init(&storage);
  1917. XML_SetUserData(g_parser, &storage);
  1918. XML_SetCharacterDataHandler(g_parser, accumulate_characters);
  1919. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  1920. == XML_STATUS_ERROR)
  1921. xml_failure(g_parser);
  1922. CharData_CheckXMLChars(&storage, expected);
  1923. }
  1924. END_TEST
  1925. START_TEST(test_good_cdata_utf16_le) {
  1926. /* Test data is:
  1927. * <?xml version='1.0' encoding='utf-16'?>
  1928. * <a><![CDATA[hello]]></a>
  1929. */
  1930. const char text[]
  1931. = "<\0?\0x\0m\0l\0"
  1932. " \0v\0e\0r\0s\0i\0o\0n\0=\0'\0\x31\0.\0\x30\0'\0"
  1933. " \0e\0n\0c\0o\0d\0i\0n\0g\0=\0'\0u\0t\0f\0-\0"
  1934. "1\0"
  1935. "6\0'"
  1936. "\0?\0>\0\n"
  1937. "\0<\0a\0>\0<\0!\0[\0C\0D\0A\0T\0A\0[\0h\0e\0l\0l\0o\0]\0]\0>\0<\0/\0a\0>\0";
  1938. const XML_Char *expected = XCS("hello");
  1939. CharData storage;
  1940. CharData_Init(&storage);
  1941. XML_SetUserData(g_parser, &storage);
  1942. XML_SetCharacterDataHandler(g_parser, accumulate_characters);
  1943. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  1944. == XML_STATUS_ERROR)
  1945. xml_failure(g_parser);
  1946. CharData_CheckXMLChars(&storage, expected);
  1947. }
  1948. END_TEST
  1949. /* Test UTF16 conversion of a long cdata string */
  1950. /* 16 characters: handy macro to reduce visual clutter */
  1951. #define A_TO_P_IN_UTF16 "\0A\0B\0C\0D\0E\0F\0G\0H\0I\0J\0K\0L\0M\0N\0O\0P"
  1952. START_TEST(test_long_cdata_utf16) {
  1953. /* Test data is:
  1954. * <?xlm version='1.0' encoding='utf-16'?>
  1955. * <a><![CDATA[
  1956. * ABCDEFGHIJKLMNOP
  1957. * ]]></a>
  1958. */
  1959. const char text[]
  1960. = "\0<\0?\0x\0m\0l\0 "
  1961. "\0v\0e\0r\0s\0i\0o\0n\0=\0'\0\x31\0.\0\x30\0'\0 "
  1962. "\0e\0n\0c\0o\0d\0i\0n\0g\0=\0'\0u\0t\0f\0-\0\x31\0\x36\0'\0?\0>"
  1963. "\0<\0a\0>\0<\0!\0[\0C\0D\0A\0T\0A\0["
  1964. /* 64 characters per line */
  1965. /* clang-format off */
  1966. A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16
  1967. A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16
  1968. A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16
  1969. A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16
  1970. A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16
  1971. A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16
  1972. A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16
  1973. A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16
  1974. A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16
  1975. A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16
  1976. A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16
  1977. A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16
  1978. A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16
  1979. A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16
  1980. A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16
  1981. A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16 A_TO_P_IN_UTF16
  1982. A_TO_P_IN_UTF16
  1983. /* clang-format on */
  1984. "\0]\0]\0>\0<\0/\0a\0>";
  1985. const XML_Char *expected =
  1986. /* clang-format off */
  1987. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  1988. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  1989. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  1990. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  1991. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  1992. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  1993. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  1994. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  1995. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  1996. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  1997. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  1998. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  1999. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  2000. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  2001. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  2002. XCS("ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP")
  2003. XCS("ABCDEFGHIJKLMNOP");
  2004. /* clang-format on */
  2005. CharData storage;
  2006. void *buffer;
  2007. CharData_Init(&storage);
  2008. XML_SetUserData(g_parser, &storage);
  2009. XML_SetCharacterDataHandler(g_parser, accumulate_characters);
  2010. buffer = XML_GetBuffer(g_parser, sizeof(text) - 1);
  2011. if (buffer == NULL)
  2012. fail("Could not allocate parse buffer");
  2013. assert(buffer != NULL);
  2014. memcpy(buffer, text, sizeof(text) - 1);
  2015. if (XML_ParseBuffer(g_parser, sizeof(text) - 1, XML_TRUE) == XML_STATUS_ERROR)
  2016. xml_failure(g_parser);
  2017. CharData_CheckXMLChars(&storage, expected);
  2018. }
  2019. END_TEST
  2020. /* Test handling of multiple unit UTF-16 characters */
  2021. START_TEST(test_multichar_cdata_utf16) {
  2022. /* Test data is:
  2023. * <?xml version='1.0' encoding='utf-16'?>
  2024. * <a><![CDATA[{MINIM}{CROTCHET}]]></a>
  2025. *
  2026. * where {MINIM} is U+1d15e (a minim or half-note)
  2027. * UTF-16: 0xd834 0xdd5e
  2028. * UTF-8: 0xf0 0x9d 0x85 0x9e
  2029. * and {CROTCHET} is U+1d15f (a crotchet or quarter-note)
  2030. * UTF-16: 0xd834 0xdd5f
  2031. * UTF-8: 0xf0 0x9d 0x85 0x9f
  2032. */
  2033. const char text[] = "\0<\0?\0x\0m\0l\0"
  2034. " \0v\0e\0r\0s\0i\0o\0n\0=\0'\0\x31\0.\0\x30\0'\0"
  2035. " \0e\0n\0c\0o\0d\0i\0n\0g\0=\0'\0u\0t\0f\0-\0"
  2036. "1\0"
  2037. "6\0'"
  2038. "\0?\0>\0\n"
  2039. "\0<\0a\0>\0<\0!\0[\0C\0D\0A\0T\0A\0["
  2040. "\xd8\x34\xdd\x5e\xd8\x34\xdd\x5f"
  2041. "\0]\0]\0>\0<\0/\0a\0>";
  2042. #ifdef XML_UNICODE
  2043. const XML_Char *expected = XCS("\xd834\xdd5e\xd834\xdd5f");
  2044. #else
  2045. const XML_Char *expected = XCS("\xf0\x9d\x85\x9e\xf0\x9d\x85\x9f");
  2046. #endif
  2047. CharData storage;
  2048. CharData_Init(&storage);
  2049. XML_SetUserData(g_parser, &storage);
  2050. XML_SetCharacterDataHandler(g_parser, accumulate_characters);
  2051. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  2052. == XML_STATUS_ERROR)
  2053. xml_failure(g_parser);
  2054. CharData_CheckXMLChars(&storage, expected);
  2055. }
  2056. END_TEST
  2057. /* Test that an element name with a UTF-16 surrogate pair is rejected */
  2058. START_TEST(test_utf16_bad_surrogate_pair) {
  2059. /* Test data is:
  2060. * <?xml version='1.0' encoding='utf-16'?>
  2061. * <a><![CDATA[{BADLINB}]]></a>
  2062. *
  2063. * where {BADLINB} is U+10000 (the first Linear B character)
  2064. * with the UTF-16 surrogate pair in the wrong order, i.e.
  2065. * 0xdc00 0xd800
  2066. */
  2067. const char text[] = "\0<\0?\0x\0m\0l\0"
  2068. " \0v\0e\0r\0s\0i\0o\0n\0=\0'\0\x31\0.\0\x30\0'\0"
  2069. " \0e\0n\0c\0o\0d\0i\0n\0g\0=\0'\0u\0t\0f\0-\0"
  2070. "1\0"
  2071. "6\0'"
  2072. "\0?\0>\0\n"
  2073. "\0<\0a\0>\0<\0!\0[\0C\0D\0A\0T\0A\0["
  2074. "\xdc\x00\xd8\x00"
  2075. "\0]\0]\0>\0<\0/\0a\0>";
  2076. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  2077. != XML_STATUS_ERROR)
  2078. fail("Reversed UTF-16 surrogate pair not faulted");
  2079. if (XML_GetErrorCode(g_parser) != XML_ERROR_INVALID_TOKEN)
  2080. xml_failure(g_parser);
  2081. }
  2082. END_TEST
  2083. START_TEST(test_bad_cdata) {
  2084. struct CaseData {
  2085. const char *text;
  2086. enum XML_Error expectedError;
  2087. };
  2088. struct CaseData cases[]
  2089. = {{"<a><", XML_ERROR_UNCLOSED_TOKEN},
  2090. {"<a><!", XML_ERROR_UNCLOSED_TOKEN},
  2091. {"<a><![", XML_ERROR_UNCLOSED_TOKEN},
  2092. {"<a><![C", XML_ERROR_UNCLOSED_TOKEN},
  2093. {"<a><![CD", XML_ERROR_UNCLOSED_TOKEN},
  2094. {"<a><![CDA", XML_ERROR_UNCLOSED_TOKEN},
  2095. {"<a><![CDAT", XML_ERROR_UNCLOSED_TOKEN},
  2096. {"<a><![CDATA", XML_ERROR_UNCLOSED_TOKEN},
  2097. {"<a><![CDATA[", XML_ERROR_UNCLOSED_CDATA_SECTION},
  2098. {"<a><![CDATA[]", XML_ERROR_UNCLOSED_CDATA_SECTION},
  2099. {"<a><![CDATA[]]", XML_ERROR_UNCLOSED_CDATA_SECTION},
  2100. {"<a><!<a/>", XML_ERROR_INVALID_TOKEN},
  2101. {"<a><![<a/>", XML_ERROR_UNCLOSED_TOKEN}, /* ?! */
  2102. {"<a><![C<a/>", XML_ERROR_UNCLOSED_TOKEN}, /* ?! */
  2103. {"<a><![CD<a/>", XML_ERROR_INVALID_TOKEN},
  2104. {"<a><![CDA<a/>", XML_ERROR_INVALID_TOKEN},
  2105. {"<a><![CDAT<a/>", XML_ERROR_INVALID_TOKEN},
  2106. {"<a><![CDATA<a/>", XML_ERROR_INVALID_TOKEN},
  2107. {"<a><![CDATA[<a/>", XML_ERROR_UNCLOSED_CDATA_SECTION},
  2108. {"<a><![CDATA[]<a/>", XML_ERROR_UNCLOSED_CDATA_SECTION},
  2109. {"<a><![CDATA[]]<a/>", XML_ERROR_UNCLOSED_CDATA_SECTION}};
  2110. size_t i = 0;
  2111. for (; i < sizeof(cases) / sizeof(struct CaseData); i++) {
  2112. const enum XML_Status actualStatus = _XML_Parse_SINGLE_BYTES(
  2113. g_parser, cases[i].text, (int)strlen(cases[i].text), XML_TRUE);
  2114. const enum XML_Error actualError = XML_GetErrorCode(g_parser);
  2115. assert(actualStatus == XML_STATUS_ERROR);
  2116. if (actualError != cases[i].expectedError) {
  2117. char message[100];
  2118. sprintf(message,
  2119. "Expected error %d but got error %d for case %u: \"%s\"\n",
  2120. cases[i].expectedError, actualError, (unsigned int)i + 1,
  2121. cases[i].text);
  2122. fail(message);
  2123. }
  2124. XML_ParserReset(g_parser, NULL);
  2125. }
  2126. }
  2127. END_TEST
  2128. /* Test failures in UTF-16 CDATA */
  2129. START_TEST(test_bad_cdata_utf16) {
  2130. struct CaseData {
  2131. size_t text_bytes;
  2132. const char *text;
  2133. enum XML_Error expected_error;
  2134. };
  2135. const char prolog[] = "\0<\0?\0x\0m\0l\0"
  2136. " \0v\0e\0r\0s\0i\0o\0n\0=\0'\0\x31\0.\0\x30\0'\0"
  2137. " \0e\0n\0c\0o\0d\0i\0n\0g\0=\0'\0u\0t\0f\0-\0"
  2138. "1\0"
  2139. "6\0'"
  2140. "\0?\0>\0\n"
  2141. "\0<\0a\0>";
  2142. struct CaseData cases[] = {
  2143. {1, "\0", XML_ERROR_UNCLOSED_TOKEN},
  2144. {2, "\0<", XML_ERROR_UNCLOSED_TOKEN},
  2145. {3, "\0<\0", XML_ERROR_UNCLOSED_TOKEN},
  2146. {4, "\0<\0!", XML_ERROR_UNCLOSED_TOKEN},
  2147. {5, "\0<\0!\0", XML_ERROR_UNCLOSED_TOKEN},
  2148. {6, "\0<\0!\0[", XML_ERROR_UNCLOSED_TOKEN},
  2149. {7, "\0<\0!\0[\0", XML_ERROR_UNCLOSED_TOKEN},
  2150. {8, "\0<\0!\0[\0C", XML_ERROR_UNCLOSED_TOKEN},
  2151. {9, "\0<\0!\0[\0C\0", XML_ERROR_UNCLOSED_TOKEN},
  2152. {10, "\0<\0!\0[\0C\0D", XML_ERROR_UNCLOSED_TOKEN},
  2153. {11, "\0<\0!\0[\0C\0D\0", XML_ERROR_UNCLOSED_TOKEN},
  2154. {12, "\0<\0!\0[\0C\0D\0A", XML_ERROR_UNCLOSED_TOKEN},
  2155. {13, "\0<\0!\0[\0C\0D\0A\0", XML_ERROR_UNCLOSED_TOKEN},
  2156. {14, "\0<\0!\0[\0C\0D\0A\0T", XML_ERROR_UNCLOSED_TOKEN},
  2157. {15, "\0<\0!\0[\0C\0D\0A\0T\0", XML_ERROR_UNCLOSED_TOKEN},
  2158. {16, "\0<\0!\0[\0C\0D\0A\0T\0A", XML_ERROR_UNCLOSED_TOKEN},
  2159. {17, "\0<\0!\0[\0C\0D\0A\0T\0A\0", XML_ERROR_UNCLOSED_TOKEN},
  2160. {18, "\0<\0!\0[\0C\0D\0A\0T\0A\0[", XML_ERROR_UNCLOSED_CDATA_SECTION},
  2161. {19, "\0<\0!\0[\0C\0D\0A\0T\0A\0[\0", XML_ERROR_UNCLOSED_CDATA_SECTION},
  2162. {20, "\0<\0!\0[\0C\0D\0A\0T\0A\0[\0Z", XML_ERROR_UNCLOSED_CDATA_SECTION},
  2163. /* Now add a four-byte UTF-16 character */
  2164. {21, "\0<\0!\0[\0C\0D\0A\0T\0A\0[\0Z\xd8",
  2165. XML_ERROR_UNCLOSED_CDATA_SECTION},
  2166. {22, "\0<\0!\0[\0C\0D\0A\0T\0A\0[\0Z\xd8\x34", XML_ERROR_PARTIAL_CHAR},
  2167. {23, "\0<\0!\0[\0C\0D\0A\0T\0A\0[\0Z\xd8\x34\xdd",
  2168. XML_ERROR_PARTIAL_CHAR},
  2169. {24, "\0<\0!\0[\0C\0D\0A\0T\0A\0[\0Z\xd8\x34\xdd\x5e",
  2170. XML_ERROR_UNCLOSED_CDATA_SECTION}};
  2171. size_t i;
  2172. for (i = 0; i < sizeof(cases) / sizeof(struct CaseData); i++) {
  2173. enum XML_Status actual_status;
  2174. enum XML_Error actual_error;
  2175. if (_XML_Parse_SINGLE_BYTES(g_parser, prolog, (int)sizeof(prolog) - 1,
  2176. XML_FALSE)
  2177. == XML_STATUS_ERROR)
  2178. xml_failure(g_parser);
  2179. actual_status = _XML_Parse_SINGLE_BYTES(g_parser, cases[i].text,
  2180. (int)cases[i].text_bytes, XML_TRUE);
  2181. assert(actual_status == XML_STATUS_ERROR);
  2182. actual_error = XML_GetErrorCode(g_parser);
  2183. if (actual_error != cases[i].expected_error) {
  2184. char message[1024];
  2185. sprintf(message,
  2186. "Expected error %d (%" XML_FMT_STR "), got %d (%" XML_FMT_STR
  2187. ") for case %lu\n",
  2188. cases[i].expected_error, XML_ErrorString(cases[i].expected_error),
  2189. actual_error, XML_ErrorString(actual_error),
  2190. (long unsigned)(i + 1));
  2191. fail(message);
  2192. }
  2193. XML_ParserReset(g_parser, NULL);
  2194. }
  2195. }
  2196. END_TEST
  2197. static const char *long_cdata_text
  2198. = "<s><![CDATA["
  2199. "012345678901234567890123456789012345678901234567890123456789"
  2200. "012345678901234567890123456789012345678901234567890123456789"
  2201. "012345678901234567890123456789012345678901234567890123456789"
  2202. "012345678901234567890123456789012345678901234567890123456789"
  2203. "012345678901234567890123456789012345678901234567890123456789"
  2204. "012345678901234567890123456789012345678901234567890123456789"
  2205. "012345678901234567890123456789012345678901234567890123456789"
  2206. "012345678901234567890123456789012345678901234567890123456789"
  2207. "012345678901234567890123456789012345678901234567890123456789"
  2208. "012345678901234567890123456789012345678901234567890123456789"
  2209. "012345678901234567890123456789012345678901234567890123456789"
  2210. "012345678901234567890123456789012345678901234567890123456789"
  2211. "012345678901234567890123456789012345678901234567890123456789"
  2212. "012345678901234567890123456789012345678901234567890123456789"
  2213. "012345678901234567890123456789012345678901234567890123456789"
  2214. "012345678901234567890123456789012345678901234567890123456789"
  2215. "012345678901234567890123456789012345678901234567890123456789"
  2216. "012345678901234567890123456789012345678901234567890123456789"
  2217. "012345678901234567890123456789012345678901234567890123456789"
  2218. "012345678901234567890123456789012345678901234567890123456789"
  2219. "]]></s>";
  2220. /* Test stopping the parser in cdata handler */
  2221. START_TEST(test_stop_parser_between_cdata_calls) {
  2222. const char *text = long_cdata_text;
  2223. XML_SetCharacterDataHandler(g_parser, clearing_aborting_character_handler);
  2224. resumable = XML_FALSE;
  2225. expect_failure(text, XML_ERROR_ABORTED, "Parse not aborted in CDATA handler");
  2226. }
  2227. END_TEST
  2228. /* Test suspending the parser in cdata handler */
  2229. START_TEST(test_suspend_parser_between_cdata_calls) {
  2230. const char *text = long_cdata_text;
  2231. enum XML_Status result;
  2232. XML_SetCharacterDataHandler(g_parser, clearing_aborting_character_handler);
  2233. resumable = XML_TRUE;
  2234. result = _XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE);
  2235. if (result != XML_STATUS_SUSPENDED) {
  2236. if (result == XML_STATUS_ERROR)
  2237. xml_failure(g_parser);
  2238. fail("Parse not suspended in CDATA handler");
  2239. }
  2240. if (XML_GetErrorCode(g_parser) != XML_ERROR_NONE)
  2241. xml_failure(g_parser);
  2242. }
  2243. END_TEST
  2244. /* Test memory allocation functions */
  2245. START_TEST(test_memory_allocation) {
  2246. char *buffer = (char *)XML_MemMalloc(g_parser, 256);
  2247. char *p;
  2248. if (buffer == NULL) {
  2249. fail("Allocation failed");
  2250. } else {
  2251. /* Try writing to memory; some OSes try to cheat! */
  2252. buffer[0] = 'T';
  2253. buffer[1] = 'E';
  2254. buffer[2] = 'S';
  2255. buffer[3] = 'T';
  2256. buffer[4] = '\0';
  2257. if (strcmp(buffer, "TEST") != 0) {
  2258. fail("Memory not writable");
  2259. } else {
  2260. p = (char *)XML_MemRealloc(g_parser, buffer, 512);
  2261. if (p == NULL) {
  2262. fail("Reallocation failed");
  2263. } else {
  2264. /* Write again, just to be sure */
  2265. buffer = p;
  2266. buffer[0] = 'V';
  2267. if (strcmp(buffer, "VEST") != 0) {
  2268. fail("Reallocated memory not writable");
  2269. }
  2270. }
  2271. }
  2272. XML_MemFree(g_parser, buffer);
  2273. }
  2274. }
  2275. END_TEST
  2276. static void XMLCALL
  2277. record_default_handler(void *userData, const XML_Char *s, int len) {
  2278. UNUSED_P(s);
  2279. UNUSED_P(len);
  2280. CharData_AppendXMLChars((CharData *)userData, XCS("D"), 1);
  2281. }
  2282. static void XMLCALL
  2283. record_cdata_handler(void *userData, const XML_Char *s, int len) {
  2284. UNUSED_P(s);
  2285. UNUSED_P(len);
  2286. CharData_AppendXMLChars((CharData *)userData, XCS("C"), 1);
  2287. XML_DefaultCurrent(g_parser);
  2288. }
  2289. static void XMLCALL
  2290. record_cdata_nodefault_handler(void *userData, const XML_Char *s, int len) {
  2291. UNUSED_P(s);
  2292. UNUSED_P(len);
  2293. CharData_AppendXMLChars((CharData *)userData, XCS("c"), 1);
  2294. }
  2295. static void XMLCALL
  2296. record_skip_handler(void *userData, const XML_Char *entityName,
  2297. int is_parameter_entity) {
  2298. UNUSED_P(entityName);
  2299. CharData_AppendXMLChars((CharData *)userData,
  2300. is_parameter_entity ? XCS("E") : XCS("e"), 1);
  2301. }
  2302. /* Test XML_DefaultCurrent() passes handling on correctly */
  2303. START_TEST(test_default_current) {
  2304. const char *text = "<doc>hell]</doc>";
  2305. const char *entity_text = "<!DOCTYPE doc [\n"
  2306. "<!ENTITY entity '&#37;'>\n"
  2307. "]>\n"
  2308. "<doc>&entity;</doc>";
  2309. CharData storage;
  2310. XML_SetDefaultHandler(g_parser, record_default_handler);
  2311. XML_SetCharacterDataHandler(g_parser, record_cdata_handler);
  2312. CharData_Init(&storage);
  2313. XML_SetUserData(g_parser, &storage);
  2314. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  2315. == XML_STATUS_ERROR)
  2316. xml_failure(g_parser);
  2317. CharData_CheckXMLChars(&storage, XCS("DCDCDCDCDCDD"));
  2318. /* Again, without the defaulting */
  2319. XML_ParserReset(g_parser, NULL);
  2320. XML_SetDefaultHandler(g_parser, record_default_handler);
  2321. XML_SetCharacterDataHandler(g_parser, record_cdata_nodefault_handler);
  2322. CharData_Init(&storage);
  2323. XML_SetUserData(g_parser, &storage);
  2324. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  2325. == XML_STATUS_ERROR)
  2326. xml_failure(g_parser);
  2327. CharData_CheckXMLChars(&storage, XCS("DcccccD"));
  2328. /* Now with an internal entity to complicate matters */
  2329. XML_ParserReset(g_parser, NULL);
  2330. XML_SetDefaultHandler(g_parser, record_default_handler);
  2331. XML_SetCharacterDataHandler(g_parser, record_cdata_handler);
  2332. CharData_Init(&storage);
  2333. XML_SetUserData(g_parser, &storage);
  2334. if (_XML_Parse_SINGLE_BYTES(g_parser, entity_text, (int)strlen(entity_text),
  2335. XML_TRUE)
  2336. == XML_STATUS_ERROR)
  2337. xml_failure(g_parser);
  2338. /* The default handler suppresses the entity */
  2339. CharData_CheckXMLChars(&storage, XCS("DDDDDDDDDDDDDDDDDDD"));
  2340. /* Again, with a skip handler */
  2341. XML_ParserReset(g_parser, NULL);
  2342. XML_SetDefaultHandler(g_parser, record_default_handler);
  2343. XML_SetCharacterDataHandler(g_parser, record_cdata_handler);
  2344. XML_SetSkippedEntityHandler(g_parser, record_skip_handler);
  2345. CharData_Init(&storage);
  2346. XML_SetUserData(g_parser, &storage);
  2347. if (_XML_Parse_SINGLE_BYTES(g_parser, entity_text, (int)strlen(entity_text),
  2348. XML_TRUE)
  2349. == XML_STATUS_ERROR)
  2350. xml_failure(g_parser);
  2351. /* The default handler suppresses the entity */
  2352. CharData_CheckXMLChars(&storage, XCS("DDDDDDDDDDDDDDDDDeD"));
  2353. /* This time, allow the entity through */
  2354. XML_ParserReset(g_parser, NULL);
  2355. XML_SetDefaultHandlerExpand(g_parser, record_default_handler);
  2356. XML_SetCharacterDataHandler(g_parser, record_cdata_handler);
  2357. CharData_Init(&storage);
  2358. XML_SetUserData(g_parser, &storage);
  2359. if (_XML_Parse_SINGLE_BYTES(g_parser, entity_text, (int)strlen(entity_text),
  2360. XML_TRUE)
  2361. == XML_STATUS_ERROR)
  2362. xml_failure(g_parser);
  2363. CharData_CheckXMLChars(&storage, XCS("DDDDDDDDDDDDDDDDDCDD"));
  2364. /* Finally, without passing the cdata to the default handler */
  2365. XML_ParserReset(g_parser, NULL);
  2366. XML_SetDefaultHandlerExpand(g_parser, record_default_handler);
  2367. XML_SetCharacterDataHandler(g_parser, record_cdata_nodefault_handler);
  2368. CharData_Init(&storage);
  2369. XML_SetUserData(g_parser, &storage);
  2370. if (_XML_Parse_SINGLE_BYTES(g_parser, entity_text, (int)strlen(entity_text),
  2371. XML_TRUE)
  2372. == XML_STATUS_ERROR)
  2373. xml_failure(g_parser);
  2374. CharData_CheckXMLChars(&storage, XCS("DDDDDDDDDDDDDDDDDcD"));
  2375. }
  2376. END_TEST
  2377. /* Test DTD element parsing code paths */
  2378. START_TEST(test_dtd_elements) {
  2379. const char *text = "<!DOCTYPE doc [\n"
  2380. "<!ELEMENT doc (chapter)>\n"
  2381. "<!ELEMENT chapter (#PCDATA)>\n"
  2382. "]>\n"
  2383. "<doc><chapter>Wombats are go</chapter></doc>";
  2384. XML_SetElementDeclHandler(g_parser, dummy_element_decl_handler);
  2385. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  2386. == XML_STATUS_ERROR)
  2387. xml_failure(g_parser);
  2388. }
  2389. END_TEST
  2390. /* Test foreign DTD handling */
  2391. START_TEST(test_set_foreign_dtd) {
  2392. const char *text1 = "<?xml version='1.0' encoding='us-ascii'?>\n";
  2393. const char *text2 = "<doc>&entity;</doc>";
  2394. ExtTest test_data = {"<!ELEMENT doc (#PCDATA)*>", NULL, NULL};
  2395. /* Check hash salt is passed through too */
  2396. XML_SetHashSalt(g_parser, 0x12345678);
  2397. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  2398. XML_SetUserData(g_parser, &test_data);
  2399. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader);
  2400. /* Add a default handler to exercise more code paths */
  2401. XML_SetDefaultHandler(g_parser, dummy_default_handler);
  2402. if (XML_UseForeignDTD(g_parser, XML_TRUE) != XML_ERROR_NONE)
  2403. fail("Could not set foreign DTD");
  2404. if (_XML_Parse_SINGLE_BYTES(g_parser, text1, (int)strlen(text1), XML_FALSE)
  2405. == XML_STATUS_ERROR)
  2406. xml_failure(g_parser);
  2407. /* Ensure that trying to set the DTD after parsing has started
  2408. * is faulted, even if it's the same setting.
  2409. */
  2410. if (XML_UseForeignDTD(g_parser, XML_TRUE)
  2411. != XML_ERROR_CANT_CHANGE_FEATURE_ONCE_PARSING)
  2412. fail("Failed to reject late foreign DTD setting");
  2413. /* Ditto for the hash salt */
  2414. if (XML_SetHashSalt(g_parser, 0x23456789))
  2415. fail("Failed to reject late hash salt change");
  2416. /* Now finish the parse */
  2417. if (_XML_Parse_SINGLE_BYTES(g_parser, text2, (int)strlen(text2), XML_TRUE)
  2418. == XML_STATUS_ERROR)
  2419. xml_failure(g_parser);
  2420. }
  2421. END_TEST
  2422. /* Test foreign DTD handling with a failing NotStandalone handler */
  2423. START_TEST(test_foreign_dtd_not_standalone) {
  2424. const char *text = "<?xml version='1.0' encoding='us-ascii'?>\n"
  2425. "<doc>&entity;</doc>";
  2426. ExtTest test_data = {"<!ELEMENT doc (#PCDATA)*>", NULL, NULL};
  2427. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  2428. XML_SetUserData(g_parser, &test_data);
  2429. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader);
  2430. XML_SetNotStandaloneHandler(g_parser, reject_not_standalone_handler);
  2431. if (XML_UseForeignDTD(g_parser, XML_TRUE) != XML_ERROR_NONE)
  2432. fail("Could not set foreign DTD");
  2433. expect_failure(text, XML_ERROR_NOT_STANDALONE,
  2434. "NotStandalonehandler failed to reject");
  2435. }
  2436. END_TEST
  2437. /* Test invalid character in a foreign DTD is faulted */
  2438. START_TEST(test_invalid_foreign_dtd) {
  2439. const char *text = "<?xml version='1.0' encoding='us-ascii'?>\n"
  2440. "<doc>&entity;</doc>";
  2441. ExtFaults test_data
  2442. = {"$", "Dollar not faulted", NULL, XML_ERROR_INVALID_TOKEN};
  2443. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  2444. XML_SetUserData(g_parser, &test_data);
  2445. XML_SetExternalEntityRefHandler(g_parser, external_entity_faulter);
  2446. XML_UseForeignDTD(g_parser, XML_TRUE);
  2447. expect_failure(text, XML_ERROR_EXTERNAL_ENTITY_HANDLING,
  2448. "Bad DTD should not have been accepted");
  2449. }
  2450. END_TEST
  2451. /* Test foreign DTD use with a doctype */
  2452. START_TEST(test_foreign_dtd_with_doctype) {
  2453. const char *text1 = "<?xml version='1.0' encoding='us-ascii'?>\n"
  2454. "<!DOCTYPE doc [<!ENTITY entity 'hello world'>]>\n";
  2455. const char *text2 = "<doc>&entity;</doc>";
  2456. ExtTest test_data = {"<!ELEMENT doc (#PCDATA)*>", NULL, NULL};
  2457. /* Check hash salt is passed through too */
  2458. XML_SetHashSalt(g_parser, 0x12345678);
  2459. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  2460. XML_SetUserData(g_parser, &test_data);
  2461. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader);
  2462. /* Add a default handler to exercise more code paths */
  2463. XML_SetDefaultHandler(g_parser, dummy_default_handler);
  2464. if (XML_UseForeignDTD(g_parser, XML_TRUE) != XML_ERROR_NONE)
  2465. fail("Could not set foreign DTD");
  2466. if (_XML_Parse_SINGLE_BYTES(g_parser, text1, (int)strlen(text1), XML_FALSE)
  2467. == XML_STATUS_ERROR)
  2468. xml_failure(g_parser);
  2469. /* Ensure that trying to set the DTD after parsing has started
  2470. * is faulted, even if it's the same setting.
  2471. */
  2472. if (XML_UseForeignDTD(g_parser, XML_TRUE)
  2473. != XML_ERROR_CANT_CHANGE_FEATURE_ONCE_PARSING)
  2474. fail("Failed to reject late foreign DTD setting");
  2475. /* Ditto for the hash salt */
  2476. if (XML_SetHashSalt(g_parser, 0x23456789))
  2477. fail("Failed to reject late hash salt change");
  2478. /* Now finish the parse */
  2479. if (_XML_Parse_SINGLE_BYTES(g_parser, text2, (int)strlen(text2), XML_TRUE)
  2480. == XML_STATUS_ERROR)
  2481. xml_failure(g_parser);
  2482. }
  2483. END_TEST
  2484. /* Test XML_UseForeignDTD with no external subset present */
  2485. static int XMLCALL
  2486. external_entity_null_loader(XML_Parser parser, const XML_Char *context,
  2487. const XML_Char *base, const XML_Char *systemId,
  2488. const XML_Char *publicId) {
  2489. UNUSED_P(parser);
  2490. UNUSED_P(context);
  2491. UNUSED_P(base);
  2492. UNUSED_P(systemId);
  2493. UNUSED_P(publicId);
  2494. return XML_STATUS_OK;
  2495. }
  2496. START_TEST(test_foreign_dtd_without_external_subset) {
  2497. const char *text = "<!DOCTYPE doc [<!ENTITY foo 'bar'>]>\n"
  2498. "<doc>&foo;</doc>";
  2499. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  2500. XML_SetUserData(g_parser, NULL);
  2501. XML_SetExternalEntityRefHandler(g_parser, external_entity_null_loader);
  2502. XML_UseForeignDTD(g_parser, XML_TRUE);
  2503. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  2504. == XML_STATUS_ERROR)
  2505. xml_failure(g_parser);
  2506. }
  2507. END_TEST
  2508. START_TEST(test_empty_foreign_dtd) {
  2509. const char *text = "<?xml version='1.0' encoding='us-ascii'?>\n"
  2510. "<doc>&entity;</doc>";
  2511. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  2512. XML_SetExternalEntityRefHandler(g_parser, external_entity_null_loader);
  2513. XML_UseForeignDTD(g_parser, XML_TRUE);
  2514. expect_failure(text, XML_ERROR_UNDEFINED_ENTITY,
  2515. "Undefined entity not faulted");
  2516. }
  2517. END_TEST
  2518. /* Test XML Base is set and unset appropriately */
  2519. START_TEST(test_set_base) {
  2520. const XML_Char *old_base;
  2521. const XML_Char *new_base = XCS("/local/file/name.xml");
  2522. old_base = XML_GetBase(g_parser);
  2523. if (XML_SetBase(g_parser, new_base) != XML_STATUS_OK)
  2524. fail("Unable to set base");
  2525. if (xcstrcmp(XML_GetBase(g_parser), new_base) != 0)
  2526. fail("Base setting not correct");
  2527. if (XML_SetBase(g_parser, NULL) != XML_STATUS_OK)
  2528. fail("Unable to NULL base");
  2529. if (XML_GetBase(g_parser) != NULL)
  2530. fail("Base setting not nulled");
  2531. XML_SetBase(g_parser, old_base);
  2532. }
  2533. END_TEST
  2534. /* Test attribute counts, indexing, etc */
  2535. typedef struct attrInfo {
  2536. const XML_Char *name;
  2537. const XML_Char *value;
  2538. } AttrInfo;
  2539. typedef struct elementInfo {
  2540. const XML_Char *name;
  2541. int attr_count;
  2542. const XML_Char *id_name;
  2543. AttrInfo *attributes;
  2544. } ElementInfo;
  2545. static void XMLCALL
  2546. counting_start_element_handler(void *userData, const XML_Char *name,
  2547. const XML_Char **atts) {
  2548. ElementInfo *info = (ElementInfo *)userData;
  2549. AttrInfo *attr;
  2550. int count, id, i;
  2551. while (info->name != NULL) {
  2552. if (! xcstrcmp(name, info->name))
  2553. break;
  2554. info++;
  2555. }
  2556. if (info->name == NULL)
  2557. fail("Element not recognised");
  2558. /* The attribute count is twice what you might expect. It is a
  2559. * count of items in atts, an array which contains alternating
  2560. * attribute names and attribute values. For the naive user this
  2561. * is possibly a little unexpected, but it is what the
  2562. * documentation in expat.h tells us to expect.
  2563. */
  2564. count = XML_GetSpecifiedAttributeCount(g_parser);
  2565. if (info->attr_count * 2 != count) {
  2566. fail("Not got expected attribute count");
  2567. return;
  2568. }
  2569. id = XML_GetIdAttributeIndex(g_parser);
  2570. if (id == -1 && info->id_name != NULL) {
  2571. fail("ID not present");
  2572. return;
  2573. }
  2574. if (id != -1 && xcstrcmp(atts[id], info->id_name)) {
  2575. fail("ID does not have the correct name");
  2576. return;
  2577. }
  2578. for (i = 0; i < info->attr_count; i++) {
  2579. attr = info->attributes;
  2580. while (attr->name != NULL) {
  2581. if (! xcstrcmp(atts[0], attr->name))
  2582. break;
  2583. attr++;
  2584. }
  2585. if (attr->name == NULL) {
  2586. fail("Attribute not recognised");
  2587. return;
  2588. }
  2589. if (xcstrcmp(atts[1], attr->value)) {
  2590. fail("Attribute has wrong value");
  2591. return;
  2592. }
  2593. /* Remember, two entries in atts per attribute (see above) */
  2594. atts += 2;
  2595. }
  2596. }
  2597. START_TEST(test_attributes) {
  2598. const char *text = "<!DOCTYPE doc [\n"
  2599. "<!ELEMENT doc (tag)>\n"
  2600. "<!ATTLIST doc id ID #REQUIRED>\n"
  2601. "]>"
  2602. "<doc a='1' id='one' b='2'>"
  2603. "<tag c='3'/>"
  2604. "</doc>";
  2605. AttrInfo doc_info[] = {{XCS("a"), XCS("1")},
  2606. {XCS("b"), XCS("2")},
  2607. {XCS("id"), XCS("one")},
  2608. {NULL, NULL}};
  2609. AttrInfo tag_info[] = {{XCS("c"), XCS("3")}, {NULL, NULL}};
  2610. ElementInfo info[] = {{XCS("doc"), 3, XCS("id"), NULL},
  2611. {XCS("tag"), 1, NULL, NULL},
  2612. {NULL, 0, NULL, NULL}};
  2613. info[0].attributes = doc_info;
  2614. info[1].attributes = tag_info;
  2615. XML_SetStartElementHandler(g_parser, counting_start_element_handler);
  2616. XML_SetUserData(g_parser, info);
  2617. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  2618. == XML_STATUS_ERROR)
  2619. xml_failure(g_parser);
  2620. }
  2621. END_TEST
  2622. /* Test reset works correctly in the middle of processing an internal
  2623. * entity. Exercises some obscure code in XML_ParserReset().
  2624. */
  2625. START_TEST(test_reset_in_entity) {
  2626. const char *text = "<!DOCTYPE doc [\n"
  2627. "<!ENTITY wombat 'wom'>\n"
  2628. "<!ENTITY entity 'hi &wom; there'>\n"
  2629. "]>\n"
  2630. "<doc>&entity;</doc>";
  2631. XML_ParsingStatus status;
  2632. resumable = XML_TRUE;
  2633. XML_SetCharacterDataHandler(g_parser, clearing_aborting_character_handler);
  2634. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_FALSE)
  2635. == XML_STATUS_ERROR)
  2636. xml_failure(g_parser);
  2637. XML_GetParsingStatus(g_parser, &status);
  2638. if (status.parsing != XML_SUSPENDED)
  2639. fail("Parsing status not SUSPENDED");
  2640. XML_ParserReset(g_parser, NULL);
  2641. XML_GetParsingStatus(g_parser, &status);
  2642. if (status.parsing != XML_INITIALIZED)
  2643. fail("Parsing status doesn't reset to INITIALIZED");
  2644. }
  2645. END_TEST
  2646. /* Test that resume correctly passes through parse errors */
  2647. START_TEST(test_resume_invalid_parse) {
  2648. const char *text = "<doc>Hello</doc"; /* Missing closing wedge */
  2649. resumable = XML_TRUE;
  2650. XML_SetCharacterDataHandler(g_parser, clearing_aborting_character_handler);
  2651. if (XML_Parse(g_parser, text, (int)strlen(text), XML_TRUE)
  2652. == XML_STATUS_ERROR)
  2653. xml_failure(g_parser);
  2654. if (XML_ResumeParser(g_parser) == XML_STATUS_OK)
  2655. fail("Resumed invalid parse not faulted");
  2656. if (XML_GetErrorCode(g_parser) != XML_ERROR_UNCLOSED_TOKEN)
  2657. fail("Invalid parse not correctly faulted");
  2658. }
  2659. END_TEST
  2660. /* Test that re-suspended parses are correctly passed through */
  2661. START_TEST(test_resume_resuspended) {
  2662. const char *text = "<doc>Hello<meep/>world</doc>";
  2663. resumable = XML_TRUE;
  2664. XML_SetCharacterDataHandler(g_parser, clearing_aborting_character_handler);
  2665. if (XML_Parse(g_parser, text, (int)strlen(text), XML_TRUE)
  2666. == XML_STATUS_ERROR)
  2667. xml_failure(g_parser);
  2668. resumable = XML_TRUE;
  2669. XML_SetCharacterDataHandler(g_parser, clearing_aborting_character_handler);
  2670. if (XML_ResumeParser(g_parser) != XML_STATUS_SUSPENDED)
  2671. fail("Resumption not suspended");
  2672. /* This one should succeed and finish up */
  2673. if (XML_ResumeParser(g_parser) != XML_STATUS_OK)
  2674. xml_failure(g_parser);
  2675. }
  2676. END_TEST
  2677. /* Test that CDATA shows up correctly through a default handler */
  2678. START_TEST(test_cdata_default) {
  2679. const char *text = "<doc><![CDATA[Hello\nworld]]></doc>";
  2680. const XML_Char *expected = XCS("<doc><![CDATA[Hello\nworld]]></doc>");
  2681. CharData storage;
  2682. CharData_Init(&storage);
  2683. XML_SetUserData(g_parser, &storage);
  2684. XML_SetDefaultHandler(g_parser, accumulate_characters);
  2685. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  2686. == XML_STATUS_ERROR)
  2687. xml_failure(g_parser);
  2688. CharData_CheckXMLChars(&storage, expected);
  2689. }
  2690. END_TEST
  2691. /* Test resetting a subordinate parser does exactly nothing */
  2692. static int XMLCALL
  2693. external_entity_resetter(XML_Parser parser, const XML_Char *context,
  2694. const XML_Char *base, const XML_Char *systemId,
  2695. const XML_Char *publicId) {
  2696. const char *text = "<!ELEMENT doc (#PCDATA)*>";
  2697. XML_Parser ext_parser;
  2698. XML_ParsingStatus status;
  2699. UNUSED_P(base);
  2700. UNUSED_P(systemId);
  2701. UNUSED_P(publicId);
  2702. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  2703. if (ext_parser == NULL)
  2704. fail("Could not create external entity parser");
  2705. XML_GetParsingStatus(ext_parser, &status);
  2706. if (status.parsing != XML_INITIALIZED) {
  2707. fail("Parsing status is not INITIALIZED");
  2708. return XML_STATUS_ERROR;
  2709. }
  2710. if (_XML_Parse_SINGLE_BYTES(ext_parser, text, (int)strlen(text), XML_TRUE)
  2711. == XML_STATUS_ERROR) {
  2712. xml_failure(parser);
  2713. return XML_STATUS_ERROR;
  2714. }
  2715. XML_GetParsingStatus(ext_parser, &status);
  2716. if (status.parsing != XML_FINISHED) {
  2717. fail("Parsing status is not FINISHED");
  2718. return XML_STATUS_ERROR;
  2719. }
  2720. /* Check we can't parse here */
  2721. if (XML_Parse(ext_parser, text, (int)strlen(text), XML_TRUE)
  2722. != XML_STATUS_ERROR)
  2723. fail("Parsing when finished not faulted");
  2724. if (XML_GetErrorCode(ext_parser) != XML_ERROR_FINISHED)
  2725. fail("Parsing when finished faulted with wrong code");
  2726. XML_ParserReset(ext_parser, NULL);
  2727. XML_GetParsingStatus(ext_parser, &status);
  2728. if (status.parsing != XML_FINISHED) {
  2729. fail("Parsing status not still FINISHED");
  2730. return XML_STATUS_ERROR;
  2731. }
  2732. XML_ParserFree(ext_parser);
  2733. return XML_STATUS_OK;
  2734. }
  2735. START_TEST(test_subordinate_reset) {
  2736. const char *text = "<?xml version='1.0' encoding='us-ascii'?>\n"
  2737. "<!DOCTYPE doc SYSTEM 'foo'>\n"
  2738. "<doc>&entity;</doc>";
  2739. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  2740. XML_SetExternalEntityRefHandler(g_parser, external_entity_resetter);
  2741. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  2742. == XML_STATUS_ERROR)
  2743. xml_failure(g_parser);
  2744. }
  2745. END_TEST
  2746. /* Test suspending a subordinate parser */
  2747. static void XMLCALL
  2748. entity_suspending_decl_handler(void *userData, const XML_Char *name,
  2749. XML_Content *model) {
  2750. XML_Parser ext_parser = (XML_Parser)userData;
  2751. UNUSED_P(name);
  2752. if (XML_StopParser(ext_parser, XML_TRUE) != XML_STATUS_ERROR)
  2753. fail("Attempting to suspend a subordinate parser not faulted");
  2754. if (XML_GetErrorCode(ext_parser) != XML_ERROR_SUSPEND_PE)
  2755. fail("Suspending subordinate parser get wrong code");
  2756. XML_SetElementDeclHandler(ext_parser, NULL);
  2757. XML_FreeContentModel(g_parser, model);
  2758. }
  2759. static int XMLCALL
  2760. external_entity_suspender(XML_Parser parser, const XML_Char *context,
  2761. const XML_Char *base, const XML_Char *systemId,
  2762. const XML_Char *publicId) {
  2763. const char *text = "<!ELEMENT doc (#PCDATA)*>";
  2764. XML_Parser ext_parser;
  2765. UNUSED_P(base);
  2766. UNUSED_P(systemId);
  2767. UNUSED_P(publicId);
  2768. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  2769. if (ext_parser == NULL)
  2770. fail("Could not create external entity parser");
  2771. XML_SetElementDeclHandler(ext_parser, entity_suspending_decl_handler);
  2772. XML_SetUserData(ext_parser, ext_parser);
  2773. if (_XML_Parse_SINGLE_BYTES(ext_parser, text, (int)strlen(text), XML_TRUE)
  2774. == XML_STATUS_ERROR) {
  2775. xml_failure(ext_parser);
  2776. return XML_STATUS_ERROR;
  2777. }
  2778. XML_ParserFree(ext_parser);
  2779. return XML_STATUS_OK;
  2780. }
  2781. START_TEST(test_subordinate_suspend) {
  2782. const char *text = "<?xml version='1.0' encoding='us-ascii'?>\n"
  2783. "<!DOCTYPE doc SYSTEM 'foo'>\n"
  2784. "<doc>&entity;</doc>";
  2785. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  2786. XML_SetExternalEntityRefHandler(g_parser, external_entity_suspender);
  2787. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  2788. == XML_STATUS_ERROR)
  2789. xml_failure(g_parser);
  2790. }
  2791. END_TEST
  2792. /* Test suspending a subordinate parser from an XML declaration */
  2793. /* Increases code coverage of the tests */
  2794. static void XMLCALL
  2795. entity_suspending_xdecl_handler(void *userData, const XML_Char *version,
  2796. const XML_Char *encoding, int standalone) {
  2797. XML_Parser ext_parser = (XML_Parser)userData;
  2798. UNUSED_P(version);
  2799. UNUSED_P(encoding);
  2800. UNUSED_P(standalone);
  2801. XML_StopParser(ext_parser, resumable);
  2802. XML_SetXmlDeclHandler(ext_parser, NULL);
  2803. }
  2804. static int XMLCALL
  2805. external_entity_suspend_xmldecl(XML_Parser parser, const XML_Char *context,
  2806. const XML_Char *base, const XML_Char *systemId,
  2807. const XML_Char *publicId) {
  2808. const char *text = "<?xml version='1.0' encoding='us-ascii'?>";
  2809. XML_Parser ext_parser;
  2810. XML_ParsingStatus status;
  2811. enum XML_Status rc;
  2812. UNUSED_P(base);
  2813. UNUSED_P(systemId);
  2814. UNUSED_P(publicId);
  2815. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  2816. if (ext_parser == NULL)
  2817. fail("Could not create external entity parser");
  2818. XML_SetXmlDeclHandler(ext_parser, entity_suspending_xdecl_handler);
  2819. XML_SetUserData(ext_parser, ext_parser);
  2820. rc = _XML_Parse_SINGLE_BYTES(ext_parser, text, (int)strlen(text), XML_TRUE);
  2821. XML_GetParsingStatus(ext_parser, &status);
  2822. if (resumable) {
  2823. if (rc == XML_STATUS_ERROR)
  2824. xml_failure(ext_parser);
  2825. if (status.parsing != XML_SUSPENDED)
  2826. fail("Ext Parsing status not SUSPENDED");
  2827. } else {
  2828. if (rc != XML_STATUS_ERROR)
  2829. fail("Ext parsing not aborted");
  2830. if (XML_GetErrorCode(ext_parser) != XML_ERROR_ABORTED)
  2831. xml_failure(ext_parser);
  2832. if (status.parsing != XML_FINISHED)
  2833. fail("Ext Parsing status not FINISHED");
  2834. }
  2835. XML_ParserFree(ext_parser);
  2836. return XML_STATUS_OK;
  2837. }
  2838. START_TEST(test_subordinate_xdecl_suspend) {
  2839. const char *text
  2840. = "<!DOCTYPE doc [\n"
  2841. " <!ENTITY entity SYSTEM 'http://example.org/dummy.ent'>\n"
  2842. "]>\n"
  2843. "<doc>&entity;</doc>";
  2844. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  2845. XML_SetExternalEntityRefHandler(g_parser, external_entity_suspend_xmldecl);
  2846. resumable = XML_TRUE;
  2847. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  2848. == XML_STATUS_ERROR)
  2849. xml_failure(g_parser);
  2850. }
  2851. END_TEST
  2852. START_TEST(test_subordinate_xdecl_abort) {
  2853. const char *text
  2854. = "<!DOCTYPE doc [\n"
  2855. " <!ENTITY entity SYSTEM 'http://example.org/dummy.ent'>\n"
  2856. "]>\n"
  2857. "<doc>&entity;</doc>";
  2858. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  2859. XML_SetExternalEntityRefHandler(g_parser, external_entity_suspend_xmldecl);
  2860. resumable = XML_FALSE;
  2861. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  2862. == XML_STATUS_ERROR)
  2863. xml_failure(g_parser);
  2864. }
  2865. END_TEST
  2866. /* Test external entity fault handling with suspension */
  2867. static int XMLCALL
  2868. external_entity_suspending_faulter(XML_Parser parser, const XML_Char *context,
  2869. const XML_Char *base,
  2870. const XML_Char *systemId,
  2871. const XML_Char *publicId) {
  2872. XML_Parser ext_parser;
  2873. ExtFaults *fault = (ExtFaults *)XML_GetUserData(parser);
  2874. void *buffer;
  2875. int parse_len = (int)strlen(fault->parse_text);
  2876. UNUSED_P(base);
  2877. UNUSED_P(systemId);
  2878. UNUSED_P(publicId);
  2879. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  2880. if (ext_parser == NULL)
  2881. fail("Could not create external entity parser");
  2882. XML_SetXmlDeclHandler(ext_parser, entity_suspending_xdecl_handler);
  2883. XML_SetUserData(ext_parser, ext_parser);
  2884. resumable = XML_TRUE;
  2885. buffer = XML_GetBuffer(ext_parser, parse_len);
  2886. if (buffer == NULL)
  2887. fail("Could not allocate parse buffer");
  2888. assert(buffer != NULL);
  2889. memcpy(buffer, fault->parse_text, parse_len);
  2890. if (XML_ParseBuffer(ext_parser, parse_len, XML_FALSE) != XML_STATUS_SUSPENDED)
  2891. fail("XML declaration did not suspend");
  2892. if (XML_ResumeParser(ext_parser) != XML_STATUS_OK)
  2893. xml_failure(ext_parser);
  2894. if (XML_ParseBuffer(ext_parser, 0, XML_TRUE) != XML_STATUS_ERROR)
  2895. fail(fault->fail_text);
  2896. if (XML_GetErrorCode(ext_parser) != fault->error)
  2897. xml_failure(ext_parser);
  2898. XML_ParserFree(ext_parser);
  2899. return XML_STATUS_ERROR;
  2900. }
  2901. START_TEST(test_ext_entity_invalid_suspended_parse) {
  2902. const char *text = "<!DOCTYPE doc [\n"
  2903. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  2904. "]>\n"
  2905. "<doc>&en;</doc>";
  2906. ExtFaults faults[]
  2907. = {{"<?xml version='1.0' encoding='us-ascii'?><",
  2908. "Incomplete element declaration not faulted", NULL,
  2909. XML_ERROR_UNCLOSED_TOKEN},
  2910. {/* First two bytes of a three-byte char */
  2911. "<?xml version='1.0' encoding='utf-8'?>\xe2\x82",
  2912. "Incomplete character not faulted", NULL, XML_ERROR_PARTIAL_CHAR},
  2913. {NULL, NULL, NULL, XML_ERROR_NONE}};
  2914. ExtFaults *fault;
  2915. for (fault = &faults[0]; fault->parse_text != NULL; fault++) {
  2916. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  2917. XML_SetExternalEntityRefHandler(g_parser,
  2918. external_entity_suspending_faulter);
  2919. XML_SetUserData(g_parser, fault);
  2920. expect_failure(text, XML_ERROR_EXTERNAL_ENTITY_HANDLING,
  2921. "Parser did not report external entity error");
  2922. XML_ParserReset(g_parser, NULL);
  2923. }
  2924. }
  2925. END_TEST
  2926. /* Test setting an explicit encoding */
  2927. START_TEST(test_explicit_encoding) {
  2928. const char *text1 = "<doc>Hello ";
  2929. const char *text2 = " World</doc>";
  2930. /* Just check that we can set the encoding to NULL before starting */
  2931. if (XML_SetEncoding(g_parser, NULL) != XML_STATUS_OK)
  2932. fail("Failed to initialise encoding to NULL");
  2933. /* Say we are UTF-8 */
  2934. if (XML_SetEncoding(g_parser, XCS("utf-8")) != XML_STATUS_OK)
  2935. fail("Failed to set explicit encoding");
  2936. if (_XML_Parse_SINGLE_BYTES(g_parser, text1, (int)strlen(text1), XML_FALSE)
  2937. == XML_STATUS_ERROR)
  2938. xml_failure(g_parser);
  2939. /* Try to switch encodings mid-parse */
  2940. if (XML_SetEncoding(g_parser, XCS("us-ascii")) != XML_STATUS_ERROR)
  2941. fail("Allowed encoding change");
  2942. if (_XML_Parse_SINGLE_BYTES(g_parser, text2, (int)strlen(text2), XML_TRUE)
  2943. == XML_STATUS_ERROR)
  2944. xml_failure(g_parser);
  2945. /* Try now the parse is over */
  2946. if (XML_SetEncoding(g_parser, NULL) != XML_STATUS_OK)
  2947. fail("Failed to unset encoding");
  2948. }
  2949. END_TEST
  2950. /* Test handling of trailing CR (rather than newline) */
  2951. static void XMLCALL
  2952. cr_cdata_handler(void *userData, const XML_Char *s, int len) {
  2953. int *pfound = (int *)userData;
  2954. /* Internal processing turns the CR into a newline for the
  2955. * character data handler, but not for the default handler
  2956. */
  2957. if (len == 1 && (*s == XCS('\n') || *s == XCS('\r')))
  2958. *pfound = 1;
  2959. }
  2960. START_TEST(test_trailing_cr) {
  2961. const char *text = "<doc>\r";
  2962. int found_cr;
  2963. /* Try with a character handler, for code coverage */
  2964. XML_SetCharacterDataHandler(g_parser, cr_cdata_handler);
  2965. XML_SetUserData(g_parser, &found_cr);
  2966. found_cr = 0;
  2967. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  2968. == XML_STATUS_OK)
  2969. fail("Failed to fault unclosed doc");
  2970. if (found_cr == 0)
  2971. fail("Did not catch the carriage return");
  2972. XML_ParserReset(g_parser, NULL);
  2973. /* Now with a default handler instead */
  2974. XML_SetDefaultHandler(g_parser, cr_cdata_handler);
  2975. XML_SetUserData(g_parser, &found_cr);
  2976. found_cr = 0;
  2977. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  2978. == XML_STATUS_OK)
  2979. fail("Failed to fault unclosed doc");
  2980. if (found_cr == 0)
  2981. fail("Did not catch default carriage return");
  2982. }
  2983. END_TEST
  2984. /* Test trailing CR in an external entity parse */
  2985. static int XMLCALL
  2986. external_entity_cr_catcher(XML_Parser parser, const XML_Char *context,
  2987. const XML_Char *base, const XML_Char *systemId,
  2988. const XML_Char *publicId) {
  2989. const char *text = "\r";
  2990. XML_Parser ext_parser;
  2991. UNUSED_P(base);
  2992. UNUSED_P(systemId);
  2993. UNUSED_P(publicId);
  2994. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  2995. if (ext_parser == NULL)
  2996. fail("Could not create external entity parser");
  2997. XML_SetCharacterDataHandler(ext_parser, cr_cdata_handler);
  2998. if (_XML_Parse_SINGLE_BYTES(ext_parser, text, (int)strlen(text), XML_TRUE)
  2999. == XML_STATUS_ERROR)
  3000. xml_failure(ext_parser);
  3001. XML_ParserFree(ext_parser);
  3002. return XML_STATUS_OK;
  3003. }
  3004. static int XMLCALL
  3005. external_entity_bad_cr_catcher(XML_Parser parser, const XML_Char *context,
  3006. const XML_Char *base, const XML_Char *systemId,
  3007. const XML_Char *publicId) {
  3008. const char *text = "<tag>\r";
  3009. XML_Parser ext_parser;
  3010. UNUSED_P(base);
  3011. UNUSED_P(systemId);
  3012. UNUSED_P(publicId);
  3013. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  3014. if (ext_parser == NULL)
  3015. fail("Could not create external entity parser");
  3016. XML_SetCharacterDataHandler(ext_parser, cr_cdata_handler);
  3017. if (_XML_Parse_SINGLE_BYTES(ext_parser, text, (int)strlen(text), XML_TRUE)
  3018. == XML_STATUS_OK)
  3019. fail("Async entity error not caught");
  3020. if (XML_GetErrorCode(ext_parser) != XML_ERROR_ASYNC_ENTITY)
  3021. xml_failure(ext_parser);
  3022. XML_ParserFree(ext_parser);
  3023. return XML_STATUS_OK;
  3024. }
  3025. START_TEST(test_ext_entity_trailing_cr) {
  3026. const char *text = "<!DOCTYPE doc [\n"
  3027. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  3028. "]>\n"
  3029. "<doc>&en;</doc>";
  3030. int found_cr;
  3031. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  3032. XML_SetExternalEntityRefHandler(g_parser, external_entity_cr_catcher);
  3033. XML_SetUserData(g_parser, &found_cr);
  3034. found_cr = 0;
  3035. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  3036. != XML_STATUS_OK)
  3037. xml_failure(g_parser);
  3038. if (found_cr == 0)
  3039. fail("No carriage return found");
  3040. XML_ParserReset(g_parser, NULL);
  3041. /* Try again with a different trailing CR */
  3042. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  3043. XML_SetExternalEntityRefHandler(g_parser, external_entity_bad_cr_catcher);
  3044. XML_SetUserData(g_parser, &found_cr);
  3045. found_cr = 0;
  3046. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  3047. != XML_STATUS_OK)
  3048. xml_failure(g_parser);
  3049. if (found_cr == 0)
  3050. fail("No carriage return found");
  3051. }
  3052. END_TEST
  3053. /* Test handling of trailing square bracket */
  3054. static void XMLCALL
  3055. rsqb_handler(void *userData, const XML_Char *s, int len) {
  3056. int *pfound = (int *)userData;
  3057. if (len == 1 && *s == XCS(']'))
  3058. *pfound = 1;
  3059. }
  3060. START_TEST(test_trailing_rsqb) {
  3061. const char *text8 = "<doc>]";
  3062. const char text16[] = "\xFF\xFE<\000d\000o\000c\000>\000]\000";
  3063. int found_rsqb;
  3064. int text8_len = (int)strlen(text8);
  3065. XML_SetCharacterDataHandler(g_parser, rsqb_handler);
  3066. XML_SetUserData(g_parser, &found_rsqb);
  3067. found_rsqb = 0;
  3068. if (_XML_Parse_SINGLE_BYTES(g_parser, text8, text8_len, XML_TRUE)
  3069. == XML_STATUS_OK)
  3070. fail("Failed to fault unclosed doc");
  3071. if (found_rsqb == 0)
  3072. fail("Did not catch the right square bracket");
  3073. /* Try again with a different encoding */
  3074. XML_ParserReset(g_parser, NULL);
  3075. XML_SetCharacterDataHandler(g_parser, rsqb_handler);
  3076. XML_SetUserData(g_parser, &found_rsqb);
  3077. found_rsqb = 0;
  3078. if (_XML_Parse_SINGLE_BYTES(g_parser, text16, (int)sizeof(text16) - 1,
  3079. XML_TRUE)
  3080. == XML_STATUS_OK)
  3081. fail("Failed to fault unclosed doc");
  3082. if (found_rsqb == 0)
  3083. fail("Did not catch the right square bracket");
  3084. /* And finally with a default handler */
  3085. XML_ParserReset(g_parser, NULL);
  3086. XML_SetDefaultHandler(g_parser, rsqb_handler);
  3087. XML_SetUserData(g_parser, &found_rsqb);
  3088. found_rsqb = 0;
  3089. if (_XML_Parse_SINGLE_BYTES(g_parser, text16, (int)sizeof(text16) - 1,
  3090. XML_TRUE)
  3091. == XML_STATUS_OK)
  3092. fail("Failed to fault unclosed doc");
  3093. if (found_rsqb == 0)
  3094. fail("Did not catch the right square bracket");
  3095. }
  3096. END_TEST
  3097. /* Test trailing right square bracket in an external entity parse */
  3098. static int XMLCALL
  3099. external_entity_rsqb_catcher(XML_Parser parser, const XML_Char *context,
  3100. const XML_Char *base, const XML_Char *systemId,
  3101. const XML_Char *publicId) {
  3102. const char *text = "<tag>]";
  3103. XML_Parser ext_parser;
  3104. UNUSED_P(base);
  3105. UNUSED_P(systemId);
  3106. UNUSED_P(publicId);
  3107. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  3108. if (ext_parser == NULL)
  3109. fail("Could not create external entity parser");
  3110. XML_SetCharacterDataHandler(ext_parser, rsqb_handler);
  3111. if (_XML_Parse_SINGLE_BYTES(ext_parser, text, (int)strlen(text), XML_TRUE)
  3112. != XML_STATUS_ERROR)
  3113. fail("Async entity error not caught");
  3114. if (XML_GetErrorCode(ext_parser) != XML_ERROR_ASYNC_ENTITY)
  3115. xml_failure(ext_parser);
  3116. XML_ParserFree(ext_parser);
  3117. return XML_STATUS_OK;
  3118. }
  3119. START_TEST(test_ext_entity_trailing_rsqb) {
  3120. const char *text = "<!DOCTYPE doc [\n"
  3121. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  3122. "]>\n"
  3123. "<doc>&en;</doc>";
  3124. int found_rsqb;
  3125. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  3126. XML_SetExternalEntityRefHandler(g_parser, external_entity_rsqb_catcher);
  3127. XML_SetUserData(g_parser, &found_rsqb);
  3128. found_rsqb = 0;
  3129. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  3130. != XML_STATUS_OK)
  3131. xml_failure(g_parser);
  3132. if (found_rsqb == 0)
  3133. fail("No right square bracket found");
  3134. }
  3135. END_TEST
  3136. /* Test CDATA handling in an external entity */
  3137. static int XMLCALL
  3138. external_entity_good_cdata_ascii(XML_Parser parser, const XML_Char *context,
  3139. const XML_Char *base, const XML_Char *systemId,
  3140. const XML_Char *publicId) {
  3141. const char *text = "<a><![CDATA[<greeting>Hello, world!</greeting>]]></a>";
  3142. const XML_Char *expected = XCS("<greeting>Hello, world!</greeting>");
  3143. CharData storage;
  3144. XML_Parser ext_parser;
  3145. UNUSED_P(base);
  3146. UNUSED_P(systemId);
  3147. UNUSED_P(publicId);
  3148. CharData_Init(&storage);
  3149. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  3150. if (ext_parser == NULL)
  3151. fail("Could not create external entity parser");
  3152. XML_SetUserData(ext_parser, &storage);
  3153. XML_SetCharacterDataHandler(ext_parser, accumulate_characters);
  3154. if (_XML_Parse_SINGLE_BYTES(ext_parser, text, (int)strlen(text), XML_TRUE)
  3155. == XML_STATUS_ERROR)
  3156. xml_failure(ext_parser);
  3157. CharData_CheckXMLChars(&storage, expected);
  3158. XML_ParserFree(ext_parser);
  3159. return XML_STATUS_OK;
  3160. }
  3161. START_TEST(test_ext_entity_good_cdata) {
  3162. const char *text = "<!DOCTYPE doc [\n"
  3163. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  3164. "]>\n"
  3165. "<doc>&en;</doc>";
  3166. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  3167. XML_SetExternalEntityRefHandler(g_parser, external_entity_good_cdata_ascii);
  3168. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  3169. != XML_STATUS_OK)
  3170. xml_failure(g_parser);
  3171. }
  3172. END_TEST
  3173. /* Test user parameter settings */
  3174. /* Variable holding the expected handler userData */
  3175. static void *handler_data = NULL;
  3176. /* Count of the number of times the comment handler has been invoked */
  3177. static int comment_count = 0;
  3178. /* Count of the number of skipped entities */
  3179. static int skip_count = 0;
  3180. /* Count of the number of times the XML declaration handler is invoked */
  3181. static int xdecl_count = 0;
  3182. static void XMLCALL
  3183. xml_decl_handler(void *userData, const XML_Char *version,
  3184. const XML_Char *encoding, int standalone) {
  3185. UNUSED_P(version);
  3186. UNUSED_P(encoding);
  3187. if (userData != handler_data)
  3188. fail("User data (xml decl) not correctly set");
  3189. if (standalone != -1)
  3190. fail("Standalone not flagged as not present in XML decl");
  3191. xdecl_count++;
  3192. }
  3193. static void XMLCALL
  3194. param_check_skip_handler(void *userData, const XML_Char *entityName,
  3195. int is_parameter_entity) {
  3196. UNUSED_P(entityName);
  3197. UNUSED_P(is_parameter_entity);
  3198. if (userData != handler_data)
  3199. fail("User data (skip) not correctly set");
  3200. skip_count++;
  3201. }
  3202. static void XMLCALL
  3203. data_check_comment_handler(void *userData, const XML_Char *data) {
  3204. UNUSED_P(data);
  3205. /* Check that the userData passed through is what we expect */
  3206. if (userData != handler_data)
  3207. fail("User data (parser) not correctly set");
  3208. /* Check that the user data in the parser is appropriate */
  3209. if (XML_GetUserData(userData) != (void *)1)
  3210. fail("User data in parser not correctly set");
  3211. comment_count++;
  3212. }
  3213. static int XMLCALL
  3214. external_entity_param_checker(XML_Parser parser, const XML_Char *context,
  3215. const XML_Char *base, const XML_Char *systemId,
  3216. const XML_Char *publicId) {
  3217. const char *text = "<!-- Subordinate parser -->\n"
  3218. "<!ELEMENT doc (#PCDATA)*>";
  3219. XML_Parser ext_parser;
  3220. UNUSED_P(base);
  3221. UNUSED_P(systemId);
  3222. UNUSED_P(publicId);
  3223. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  3224. if (ext_parser == NULL)
  3225. fail("Could not create external entity parser");
  3226. handler_data = ext_parser;
  3227. if (_XML_Parse_SINGLE_BYTES(ext_parser, text, (int)strlen(text), XML_TRUE)
  3228. == XML_STATUS_ERROR) {
  3229. xml_failure(parser);
  3230. return XML_STATUS_ERROR;
  3231. }
  3232. handler_data = parser;
  3233. XML_ParserFree(ext_parser);
  3234. return XML_STATUS_OK;
  3235. }
  3236. START_TEST(test_user_parameters) {
  3237. const char *text = "<?xml version='1.0' encoding='us-ascii'?>\n"
  3238. "<!-- Primary parse -->\n"
  3239. "<!DOCTYPE doc SYSTEM 'foo'>\n"
  3240. "<doc>&entity;";
  3241. const char *epilog = "<!-- Back to primary parser -->\n"
  3242. "</doc>";
  3243. comment_count = 0;
  3244. skip_count = 0;
  3245. xdecl_count = 0;
  3246. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  3247. XML_SetXmlDeclHandler(g_parser, xml_decl_handler);
  3248. XML_SetExternalEntityRefHandler(g_parser, external_entity_param_checker);
  3249. XML_SetCommentHandler(g_parser, data_check_comment_handler);
  3250. XML_SetSkippedEntityHandler(g_parser, param_check_skip_handler);
  3251. XML_UseParserAsHandlerArg(g_parser);
  3252. XML_SetUserData(g_parser, (void *)1);
  3253. handler_data = g_parser;
  3254. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_FALSE)
  3255. == XML_STATUS_ERROR)
  3256. xml_failure(g_parser);
  3257. if (comment_count != 2)
  3258. fail("Comment handler not invoked enough times");
  3259. /* Ensure we can't change policy mid-parse */
  3260. if (XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_NEVER))
  3261. fail("Changed param entity parsing policy while parsing");
  3262. if (_XML_Parse_SINGLE_BYTES(g_parser, epilog, (int)strlen(epilog), XML_TRUE)
  3263. == XML_STATUS_ERROR)
  3264. xml_failure(g_parser);
  3265. if (comment_count != 3)
  3266. fail("Comment handler not invoked enough times");
  3267. if (skip_count != 1)
  3268. fail("Skip handler not invoked enough times");
  3269. if (xdecl_count != 1)
  3270. fail("XML declaration handler not invoked");
  3271. }
  3272. END_TEST
  3273. /* Test that an explicit external entity handler argument replaces
  3274. * the parser as the first argument.
  3275. *
  3276. * We do not call the first parameter to the external entity handler
  3277. * 'parser' for once, since the first time the handler is called it
  3278. * will actually be a text string. We need to be able to access the
  3279. * global 'parser' variable to create our external entity parser from,
  3280. * since there are code paths we need to ensure get executed.
  3281. */
  3282. static int XMLCALL
  3283. external_entity_ref_param_checker(XML_Parser parameter, const XML_Char *context,
  3284. const XML_Char *base,
  3285. const XML_Char *systemId,
  3286. const XML_Char *publicId) {
  3287. const char *text = "<!ELEMENT doc (#PCDATA)*>";
  3288. XML_Parser ext_parser;
  3289. UNUSED_P(base);
  3290. UNUSED_P(systemId);
  3291. UNUSED_P(publicId);
  3292. if ((void *)parameter != handler_data)
  3293. fail("External entity ref handler parameter not correct");
  3294. /* Here we use the global 'parser' variable */
  3295. ext_parser = XML_ExternalEntityParserCreate(g_parser, context, NULL);
  3296. if (ext_parser == NULL)
  3297. fail("Could not create external entity parser");
  3298. if (_XML_Parse_SINGLE_BYTES(ext_parser, text, (int)strlen(text), XML_TRUE)
  3299. == XML_STATUS_ERROR)
  3300. xml_failure(ext_parser);
  3301. XML_ParserFree(ext_parser);
  3302. return XML_STATUS_OK;
  3303. }
  3304. START_TEST(test_ext_entity_ref_parameter) {
  3305. const char *text = "<?xml version='1.0' encoding='us-ascii'?>\n"
  3306. "<!DOCTYPE doc SYSTEM 'foo'>\n"
  3307. "<doc>&entity;</doc>";
  3308. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  3309. XML_SetExternalEntityRefHandler(g_parser, external_entity_ref_param_checker);
  3310. /* Set a handler arg that is not NULL and not parser (which is
  3311. * what NULL would cause to be passed.
  3312. */
  3313. XML_SetExternalEntityRefHandlerArg(g_parser, (void *)text);
  3314. handler_data = (void *)text;
  3315. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  3316. == XML_STATUS_ERROR)
  3317. xml_failure(g_parser);
  3318. /* Now try again with unset args */
  3319. XML_ParserReset(g_parser, NULL);
  3320. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  3321. XML_SetExternalEntityRefHandler(g_parser, external_entity_ref_param_checker);
  3322. XML_SetExternalEntityRefHandlerArg(g_parser, NULL);
  3323. handler_data = (void *)g_parser;
  3324. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  3325. == XML_STATUS_ERROR)
  3326. xml_failure(g_parser);
  3327. }
  3328. END_TEST
  3329. /* Test the parsing of an empty string */
  3330. START_TEST(test_empty_parse) {
  3331. const char *text = "<doc></doc>";
  3332. const char *partial = "<doc>";
  3333. if (XML_Parse(g_parser, NULL, 0, XML_FALSE) == XML_STATUS_ERROR)
  3334. fail("Parsing empty string faulted");
  3335. if (XML_Parse(g_parser, NULL, 0, XML_TRUE) != XML_STATUS_ERROR)
  3336. fail("Parsing final empty string not faulted");
  3337. if (XML_GetErrorCode(g_parser) != XML_ERROR_NO_ELEMENTS)
  3338. fail("Parsing final empty string faulted for wrong reason");
  3339. /* Now try with valid text before the empty end */
  3340. XML_ParserReset(g_parser, NULL);
  3341. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_FALSE)
  3342. == XML_STATUS_ERROR)
  3343. xml_failure(g_parser);
  3344. if (XML_Parse(g_parser, NULL, 0, XML_TRUE) == XML_STATUS_ERROR)
  3345. fail("Parsing final empty string faulted");
  3346. /* Now try with invalid text before the empty end */
  3347. XML_ParserReset(g_parser, NULL);
  3348. if (_XML_Parse_SINGLE_BYTES(g_parser, partial, (int)strlen(partial),
  3349. XML_FALSE)
  3350. == XML_STATUS_ERROR)
  3351. xml_failure(g_parser);
  3352. if (XML_Parse(g_parser, NULL, 0, XML_TRUE) != XML_STATUS_ERROR)
  3353. fail("Parsing final incomplete empty string not faulted");
  3354. }
  3355. END_TEST
  3356. /* Test odd corners of the XML_GetBuffer interface */
  3357. static enum XML_Status
  3358. get_feature(enum XML_FeatureEnum feature_id, long *presult) {
  3359. const XML_Feature *feature = XML_GetFeatureList();
  3360. if (feature == NULL)
  3361. return XML_STATUS_ERROR;
  3362. for (; feature->feature != XML_FEATURE_END; feature++) {
  3363. if (feature->feature == feature_id) {
  3364. *presult = feature->value;
  3365. return XML_STATUS_OK;
  3366. }
  3367. }
  3368. return XML_STATUS_ERROR;
  3369. }
  3370. /* Having an element name longer than 1024 characters exercises some
  3371. * of the pool allocation code in the parser that otherwise does not
  3372. * get executed. The count at the end of the line is the number of
  3373. * characters (bytes) in the element name by that point.x
  3374. */
  3375. static const char *get_buffer_test_text
  3376. = "<documentwitharidiculouslylongelementnametotease" /* 0x030 */
  3377. "aparticularcorneroftheallocationinXML_GetBuffers" /* 0x060 */
  3378. "othatwecanimprovethecoverageyetagain012345678901" /* 0x090 */
  3379. "123456789abcdef0123456789abcdef0123456789abcdef0" /* 0x0c0 */
  3380. "123456789abcdef0123456789abcdef0123456789abcdef0" /* 0x0f0 */
  3381. "123456789abcdef0123456789abcdef0123456789abcdef0" /* 0x120 */
  3382. "123456789abcdef0123456789abcdef0123456789abcdef0" /* 0x150 */
  3383. "123456789abcdef0123456789abcdef0123456789abcdef0" /* 0x180 */
  3384. "123456789abcdef0123456789abcdef0123456789abcdef0" /* 0x1b0 */
  3385. "123456789abcdef0123456789abcdef0123456789abcdef0" /* 0x1e0 */
  3386. "123456789abcdef0123456789abcdef0123456789abcdef0" /* 0x210 */
  3387. "123456789abcdef0123456789abcdef0123456789abcdef0" /* 0x240 */
  3388. "123456789abcdef0123456789abcdef0123456789abcdef0" /* 0x270 */
  3389. "123456789abcdef0123456789abcdef0123456789abcdef0" /* 0x2a0 */
  3390. "123456789abcdef0123456789abcdef0123456789abcdef0" /* 0x2d0 */
  3391. "123456789abcdef0123456789abcdef0123456789abcdef0" /* 0x300 */
  3392. "123456789abcdef0123456789abcdef0123456789abcdef0" /* 0x330 */
  3393. "123456789abcdef0123456789abcdef0123456789abcdef0" /* 0x360 */
  3394. "123456789abcdef0123456789abcdef0123456789abcdef0" /* 0x390 */
  3395. "123456789abcdef0123456789abcdef0123456789abcdef0" /* 0x3c0 */
  3396. "123456789abcdef0123456789abcdef0123456789abcdef0" /* 0x3f0 */
  3397. "123456789abcdef0123456789abcdef0123456789>\n<ef0"; /* 0x420 */
  3398. /* Test odd corners of the XML_GetBuffer interface */
  3399. START_TEST(test_get_buffer_1) {
  3400. const char *text = get_buffer_test_text;
  3401. void *buffer;
  3402. long context_bytes;
  3403. /* Attempt to allocate a negative length buffer */
  3404. if (XML_GetBuffer(g_parser, -12) != NULL)
  3405. fail("Negative length buffer not failed");
  3406. /* Now get a small buffer and extend it past valid length */
  3407. buffer = XML_GetBuffer(g_parser, 1536);
  3408. if (buffer == NULL)
  3409. fail("1.5K buffer failed");
  3410. assert(buffer != NULL);
  3411. memcpy(buffer, text, strlen(text));
  3412. if (XML_ParseBuffer(g_parser, (int)strlen(text), XML_FALSE)
  3413. == XML_STATUS_ERROR)
  3414. xml_failure(g_parser);
  3415. if (XML_GetBuffer(g_parser, INT_MAX) != NULL)
  3416. fail("INT_MAX buffer not failed");
  3417. /* Now try extending it a more reasonable but still too large
  3418. * amount. The allocator in XML_GetBuffer() doubles the buffer
  3419. * size until it exceeds the requested amount or INT_MAX. If it
  3420. * exceeds INT_MAX, it rejects the request, so we want a request
  3421. * between INT_MAX and INT_MAX/2. A gap of 1K seems comfortable,
  3422. * with an extra byte just to ensure that the request is off any
  3423. * boundary. The request will be inflated internally by
  3424. * XML_CONTEXT_BYTES (if defined), so we subtract that from our
  3425. * request.
  3426. */
  3427. if (get_feature(XML_FEATURE_CONTEXT_BYTES, &context_bytes) != XML_STATUS_OK)
  3428. context_bytes = 0;
  3429. if (XML_GetBuffer(g_parser, INT_MAX - (context_bytes + 1025)) != NULL)
  3430. fail("INT_MAX- buffer not failed");
  3431. /* Now try extending it a carefully crafted amount */
  3432. if (XML_GetBuffer(g_parser, 1000) == NULL)
  3433. fail("1000 buffer failed");
  3434. }
  3435. END_TEST
  3436. /* Test more corners of the XML_GetBuffer interface */
  3437. START_TEST(test_get_buffer_2) {
  3438. const char *text = get_buffer_test_text;
  3439. void *buffer;
  3440. /* Now get a decent buffer */
  3441. buffer = XML_GetBuffer(g_parser, 1536);
  3442. if (buffer == NULL)
  3443. fail("1.5K buffer failed");
  3444. assert(buffer != NULL);
  3445. memcpy(buffer, text, strlen(text));
  3446. if (XML_ParseBuffer(g_parser, (int)strlen(text), XML_FALSE)
  3447. == XML_STATUS_ERROR)
  3448. xml_failure(g_parser);
  3449. /* Extend it, to catch a different code path */
  3450. if (XML_GetBuffer(g_parser, 1024) == NULL)
  3451. fail("1024 buffer failed");
  3452. }
  3453. END_TEST
  3454. /* Test position information macros */
  3455. START_TEST(test_byte_info_at_end) {
  3456. const char *text = "<doc></doc>";
  3457. if (XML_GetCurrentByteIndex(g_parser) != -1
  3458. || XML_GetCurrentByteCount(g_parser) != 0)
  3459. fail("Byte index/count incorrect at start of parse");
  3460. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  3461. == XML_STATUS_ERROR)
  3462. xml_failure(g_parser);
  3463. /* At end, the count will be zero and the index the end of string */
  3464. if (XML_GetCurrentByteCount(g_parser) != 0)
  3465. fail("Terminal byte count incorrect");
  3466. if (XML_GetCurrentByteIndex(g_parser) != (XML_Index)strlen(text))
  3467. fail("Terminal byte index incorrect");
  3468. }
  3469. END_TEST
  3470. /* Test position information from errors */
  3471. #define PRE_ERROR_STR "<doc></"
  3472. #define POST_ERROR_STR "wombat></doc>"
  3473. START_TEST(test_byte_info_at_error) {
  3474. const char *text = PRE_ERROR_STR POST_ERROR_STR;
  3475. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  3476. == XML_STATUS_OK)
  3477. fail("Syntax error not faulted");
  3478. if (XML_GetCurrentByteCount(g_parser) != 0)
  3479. fail("Error byte count incorrect");
  3480. if (XML_GetCurrentByteIndex(g_parser) != strlen(PRE_ERROR_STR))
  3481. fail("Error byte index incorrect");
  3482. }
  3483. END_TEST
  3484. #undef PRE_ERROR_STR
  3485. #undef POST_ERROR_STR
  3486. /* Test position information in handler */
  3487. typedef struct ByteTestData {
  3488. int start_element_len;
  3489. int cdata_len;
  3490. int total_string_len;
  3491. } ByteTestData;
  3492. static void
  3493. byte_character_handler(void *userData, const XML_Char *s, int len) {
  3494. #ifdef XML_CONTEXT_BYTES
  3495. int offset, size;
  3496. const char *buffer;
  3497. ByteTestData *data = (ByteTestData *)userData;
  3498. UNUSED_P(s);
  3499. buffer = XML_GetInputContext(g_parser, &offset, &size);
  3500. if (buffer == NULL)
  3501. fail("Failed to get context buffer");
  3502. if (offset != data->start_element_len)
  3503. fail("Context offset in unexpected position");
  3504. if (len != data->cdata_len)
  3505. fail("CDATA length reported incorrectly");
  3506. if (size != data->total_string_len)
  3507. fail("Context size is not full buffer");
  3508. if (XML_GetCurrentByteIndex(g_parser) != offset)
  3509. fail("Character byte index incorrect");
  3510. if (XML_GetCurrentByteCount(g_parser) != len)
  3511. fail("Character byte count incorrect");
  3512. #else
  3513. UNUSED_P(s);
  3514. UNUSED_P(userData);
  3515. UNUSED_P(len);
  3516. #endif
  3517. }
  3518. #define START_ELEMENT "<e>"
  3519. #define CDATA_TEXT "Hello"
  3520. #define END_ELEMENT "</e>"
  3521. START_TEST(test_byte_info_at_cdata) {
  3522. const char *text = START_ELEMENT CDATA_TEXT END_ELEMENT;
  3523. int offset, size;
  3524. ByteTestData data;
  3525. /* Check initial context is empty */
  3526. if (XML_GetInputContext(g_parser, &offset, &size) != NULL)
  3527. fail("Unexpected context at start of parse");
  3528. data.start_element_len = (int)strlen(START_ELEMENT);
  3529. data.cdata_len = (int)strlen(CDATA_TEXT);
  3530. data.total_string_len = (int)strlen(text);
  3531. XML_SetCharacterDataHandler(g_parser, byte_character_handler);
  3532. XML_SetUserData(g_parser, &data);
  3533. if (XML_Parse(g_parser, text, (int)strlen(text), XML_TRUE) != XML_STATUS_OK)
  3534. xml_failure(g_parser);
  3535. }
  3536. END_TEST
  3537. #undef START_ELEMENT
  3538. #undef CDATA_TEXT
  3539. #undef END_ELEMENT
  3540. /* Test predefined entities are correctly recognised */
  3541. START_TEST(test_predefined_entities) {
  3542. const char *text = "<doc>&lt;&gt;&amp;&quot;&apos;</doc>";
  3543. const XML_Char *expected = XCS("<doc>&lt;&gt;&amp;&quot;&apos;</doc>");
  3544. const XML_Char *result = XCS("<>&\"'");
  3545. CharData storage;
  3546. XML_SetDefaultHandler(g_parser, accumulate_characters);
  3547. /* run_character_check uses XML_SetCharacterDataHandler(), which
  3548. * unfortunately heads off a code path that we need to exercise.
  3549. */
  3550. CharData_Init(&storage);
  3551. XML_SetUserData(g_parser, &storage);
  3552. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  3553. == XML_STATUS_ERROR)
  3554. xml_failure(g_parser);
  3555. /* The default handler doesn't translate the entities */
  3556. CharData_CheckXMLChars(&storage, expected);
  3557. /* Now try again and check the translation */
  3558. XML_ParserReset(g_parser, NULL);
  3559. run_character_check(text, result);
  3560. }
  3561. END_TEST
  3562. /* Regression test that an invalid tag in an external parameter
  3563. * reference in an external DTD is correctly faulted.
  3564. *
  3565. * Only a few specific tags are legal in DTDs ignoring comments and
  3566. * processing instructions, all of which begin with an exclamation
  3567. * mark. "<el/>" is not one of them, so the parser should raise an
  3568. * error on encountering it.
  3569. */
  3570. static int XMLCALL
  3571. external_entity_param(XML_Parser parser, const XML_Char *context,
  3572. const XML_Char *base, const XML_Char *systemId,
  3573. const XML_Char *publicId) {
  3574. const char *text1 = "<!ELEMENT doc EMPTY>\n"
  3575. "<!ENTITY % e1 SYSTEM '004-2.ent'>\n"
  3576. "<!ENTITY % e2 '%e1;'>\n"
  3577. "%e1;\n";
  3578. const char *text2 = "<!ELEMENT el EMPTY>\n"
  3579. "<el/>\n";
  3580. XML_Parser ext_parser;
  3581. UNUSED_P(base);
  3582. UNUSED_P(publicId);
  3583. if (systemId == NULL)
  3584. return XML_STATUS_OK;
  3585. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  3586. if (ext_parser == NULL)
  3587. fail("Could not create external entity parser");
  3588. if (! xcstrcmp(systemId, XCS("004-1.ent"))) {
  3589. if (_XML_Parse_SINGLE_BYTES(ext_parser, text1, (int)strlen(text1), XML_TRUE)
  3590. != XML_STATUS_ERROR)
  3591. fail("Inner DTD with invalid tag not rejected");
  3592. if (XML_GetErrorCode(ext_parser) != XML_ERROR_EXTERNAL_ENTITY_HANDLING)
  3593. xml_failure(ext_parser);
  3594. } else if (! xcstrcmp(systemId, XCS("004-2.ent"))) {
  3595. if (_XML_Parse_SINGLE_BYTES(ext_parser, text2, (int)strlen(text2), XML_TRUE)
  3596. != XML_STATUS_ERROR)
  3597. fail("Invalid tag in external param not rejected");
  3598. if (XML_GetErrorCode(ext_parser) != XML_ERROR_SYNTAX)
  3599. xml_failure(ext_parser);
  3600. } else {
  3601. fail("Unknown system ID");
  3602. }
  3603. XML_ParserFree(ext_parser);
  3604. return XML_STATUS_ERROR;
  3605. }
  3606. START_TEST(test_invalid_tag_in_dtd) {
  3607. const char *text = "<!DOCTYPE doc SYSTEM '004-1.ent'>\n"
  3608. "<doc></doc>\n";
  3609. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  3610. XML_SetExternalEntityRefHandler(g_parser, external_entity_param);
  3611. expect_failure(text, XML_ERROR_EXTERNAL_ENTITY_HANDLING,
  3612. "Invalid tag IN DTD external param not rejected");
  3613. }
  3614. END_TEST
  3615. /* Test entities not quite the predefined ones are not mis-recognised */
  3616. START_TEST(test_not_predefined_entities) {
  3617. const char *text[] = {"<doc>&pt;</doc>", "<doc>&amo;</doc>",
  3618. "<doc>&quid;</doc>", "<doc>&apod;</doc>", NULL};
  3619. int i = 0;
  3620. while (text[i] != NULL) {
  3621. expect_failure(text[i], XML_ERROR_UNDEFINED_ENTITY,
  3622. "Undefined entity not rejected");
  3623. XML_ParserReset(g_parser, NULL);
  3624. i++;
  3625. }
  3626. }
  3627. END_TEST
  3628. /* Test conditional inclusion (IGNORE) */
  3629. static int XMLCALL
  3630. external_entity_load_ignore(XML_Parser parser, const XML_Char *context,
  3631. const XML_Char *base, const XML_Char *systemId,
  3632. const XML_Char *publicId) {
  3633. const char *text = "<![IGNORE[<!ELEMENT e (#PCDATA)*>]]>";
  3634. XML_Parser ext_parser;
  3635. UNUSED_P(base);
  3636. UNUSED_P(systemId);
  3637. UNUSED_P(publicId);
  3638. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  3639. if (ext_parser == NULL)
  3640. fail("Could not create external entity parser");
  3641. if (_XML_Parse_SINGLE_BYTES(ext_parser, text, (int)strlen(text), XML_TRUE)
  3642. == XML_STATUS_ERROR)
  3643. xml_failure(parser);
  3644. XML_ParserFree(ext_parser);
  3645. return XML_STATUS_OK;
  3646. }
  3647. START_TEST(test_ignore_section) {
  3648. const char *text = "<!DOCTYPE doc SYSTEM 'foo'>\n"
  3649. "<doc><e>&entity;</e></doc>";
  3650. const XML_Char *expected
  3651. = XCS("<![IGNORE[<!ELEMENT e (#PCDATA)*>]]>\n&entity;");
  3652. CharData storage;
  3653. CharData_Init(&storage);
  3654. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  3655. XML_SetUserData(g_parser, &storage);
  3656. XML_SetExternalEntityRefHandler(g_parser, external_entity_load_ignore);
  3657. XML_SetDefaultHandler(g_parser, accumulate_characters);
  3658. XML_SetStartDoctypeDeclHandler(g_parser, dummy_start_doctype_handler);
  3659. XML_SetEndDoctypeDeclHandler(g_parser, dummy_end_doctype_handler);
  3660. XML_SetElementDeclHandler(g_parser, dummy_element_decl_handler);
  3661. XML_SetStartElementHandler(g_parser, dummy_start_element);
  3662. XML_SetEndElementHandler(g_parser, dummy_end_element);
  3663. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  3664. == XML_STATUS_ERROR)
  3665. xml_failure(g_parser);
  3666. CharData_CheckXMLChars(&storage, expected);
  3667. }
  3668. END_TEST
  3669. static int XMLCALL
  3670. external_entity_load_ignore_utf16(XML_Parser parser, const XML_Char *context,
  3671. const XML_Char *base,
  3672. const XML_Char *systemId,
  3673. const XML_Char *publicId) {
  3674. const char text[] =
  3675. /* <![IGNORE[<!ELEMENT e (#PCDATA)*>]]> */
  3676. "<\0!\0[\0I\0G\0N\0O\0R\0E\0[\0"
  3677. "<\0!\0E\0L\0E\0M\0E\0N\0T\0 \0e\0 \0"
  3678. "(\0#\0P\0C\0D\0A\0T\0A\0)\0*\0>\0]\0]\0>\0";
  3679. XML_Parser ext_parser;
  3680. UNUSED_P(base);
  3681. UNUSED_P(systemId);
  3682. UNUSED_P(publicId);
  3683. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  3684. if (ext_parser == NULL)
  3685. fail("Could not create external entity parser");
  3686. if (_XML_Parse_SINGLE_BYTES(ext_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  3687. == XML_STATUS_ERROR)
  3688. xml_failure(parser);
  3689. XML_ParserFree(ext_parser);
  3690. return XML_STATUS_OK;
  3691. }
  3692. START_TEST(test_ignore_section_utf16) {
  3693. const char text[] =
  3694. /* <!DOCTYPE d SYSTEM 's'> */
  3695. "<\0!\0D\0O\0C\0T\0Y\0P\0E\0 \0d\0 "
  3696. "\0S\0Y\0S\0T\0E\0M\0 \0'\0s\0'\0>\0\n\0"
  3697. /* <d><e>&en;</e></d> */
  3698. "<\0d\0>\0<\0e\0>\0&\0e\0n\0;\0<\0/\0e\0>\0<\0/\0d\0>\0";
  3699. const XML_Char *expected = XCS("<![IGNORE[<!ELEMENT e (#PCDATA)*>]]>\n&en;");
  3700. CharData storage;
  3701. CharData_Init(&storage);
  3702. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  3703. XML_SetUserData(g_parser, &storage);
  3704. XML_SetExternalEntityRefHandler(g_parser, external_entity_load_ignore_utf16);
  3705. XML_SetDefaultHandler(g_parser, accumulate_characters);
  3706. XML_SetStartDoctypeDeclHandler(g_parser, dummy_start_doctype_handler);
  3707. XML_SetEndDoctypeDeclHandler(g_parser, dummy_end_doctype_handler);
  3708. XML_SetElementDeclHandler(g_parser, dummy_element_decl_handler);
  3709. XML_SetStartElementHandler(g_parser, dummy_start_element);
  3710. XML_SetEndElementHandler(g_parser, dummy_end_element);
  3711. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  3712. == XML_STATUS_ERROR)
  3713. xml_failure(g_parser);
  3714. CharData_CheckXMLChars(&storage, expected);
  3715. }
  3716. END_TEST
  3717. static int XMLCALL
  3718. external_entity_load_ignore_utf16_be(XML_Parser parser, const XML_Char *context,
  3719. const XML_Char *base,
  3720. const XML_Char *systemId,
  3721. const XML_Char *publicId) {
  3722. const char text[] =
  3723. /* <![IGNORE[<!ELEMENT e (#PCDATA)*>]]> */
  3724. "\0<\0!\0[\0I\0G\0N\0O\0R\0E\0["
  3725. "\0<\0!\0E\0L\0E\0M\0E\0N\0T\0 \0e\0 "
  3726. "\0(\0#\0P\0C\0D\0A\0T\0A\0)\0*\0>\0]\0]\0>";
  3727. XML_Parser ext_parser;
  3728. UNUSED_P(base);
  3729. UNUSED_P(systemId);
  3730. UNUSED_P(publicId);
  3731. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  3732. if (ext_parser == NULL)
  3733. fail("Could not create external entity parser");
  3734. if (_XML_Parse_SINGLE_BYTES(ext_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  3735. == XML_STATUS_ERROR)
  3736. xml_failure(parser);
  3737. XML_ParserFree(ext_parser);
  3738. return XML_STATUS_OK;
  3739. }
  3740. START_TEST(test_ignore_section_utf16_be) {
  3741. const char text[] =
  3742. /* <!DOCTYPE d SYSTEM 's'> */
  3743. "\0<\0!\0D\0O\0C\0T\0Y\0P\0E\0 \0d\0 "
  3744. "\0S\0Y\0S\0T\0E\0M\0 \0'\0s\0'\0>\0\n"
  3745. /* <d><e>&en;</e></d> */
  3746. "\0<\0d\0>\0<\0e\0>\0&\0e\0n\0;\0<\0/\0e\0>\0<\0/\0d\0>";
  3747. const XML_Char *expected = XCS("<![IGNORE[<!ELEMENT e (#PCDATA)*>]]>\n&en;");
  3748. CharData storage;
  3749. CharData_Init(&storage);
  3750. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  3751. XML_SetUserData(g_parser, &storage);
  3752. XML_SetExternalEntityRefHandler(g_parser,
  3753. external_entity_load_ignore_utf16_be);
  3754. XML_SetDefaultHandler(g_parser, accumulate_characters);
  3755. XML_SetStartDoctypeDeclHandler(g_parser, dummy_start_doctype_handler);
  3756. XML_SetEndDoctypeDeclHandler(g_parser, dummy_end_doctype_handler);
  3757. XML_SetElementDeclHandler(g_parser, dummy_element_decl_handler);
  3758. XML_SetStartElementHandler(g_parser, dummy_start_element);
  3759. XML_SetEndElementHandler(g_parser, dummy_end_element);
  3760. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  3761. == XML_STATUS_ERROR)
  3762. xml_failure(g_parser);
  3763. CharData_CheckXMLChars(&storage, expected);
  3764. }
  3765. END_TEST
  3766. /* Test mis-formatted conditional exclusion */
  3767. START_TEST(test_bad_ignore_section) {
  3768. const char *text = "<!DOCTYPE doc SYSTEM 'foo'>\n"
  3769. "<doc><e>&entity;</e></doc>";
  3770. ExtFaults faults[]
  3771. = {{"<![IGNORE[<!ELEM", "Broken-off declaration not faulted", NULL,
  3772. XML_ERROR_SYNTAX},
  3773. {"<![IGNORE[\x01]]>", "Invalid XML character not faulted", NULL,
  3774. XML_ERROR_INVALID_TOKEN},
  3775. {/* FIrst two bytes of a three-byte char */
  3776. "<![IGNORE[\xe2\x82", "Partial XML character not faulted", NULL,
  3777. XML_ERROR_PARTIAL_CHAR},
  3778. {NULL, NULL, NULL, XML_ERROR_NONE}};
  3779. ExtFaults *fault;
  3780. for (fault = &faults[0]; fault->parse_text != NULL; fault++) {
  3781. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  3782. XML_SetExternalEntityRefHandler(g_parser, external_entity_faulter);
  3783. XML_SetUserData(g_parser, fault);
  3784. expect_failure(text, XML_ERROR_EXTERNAL_ENTITY_HANDLING,
  3785. "Incomplete IGNORE section not failed");
  3786. XML_ParserReset(g_parser, NULL);
  3787. }
  3788. }
  3789. END_TEST
  3790. /* Test recursive parsing */
  3791. static int XMLCALL
  3792. external_entity_valuer(XML_Parser parser, const XML_Char *context,
  3793. const XML_Char *base, const XML_Char *systemId,
  3794. const XML_Char *publicId) {
  3795. const char *text1 = "<!ELEMENT doc EMPTY>\n"
  3796. "<!ENTITY % e1 SYSTEM '004-2.ent'>\n"
  3797. "<!ENTITY % e2 '%e1;'>\n"
  3798. "%e1;\n";
  3799. XML_Parser ext_parser;
  3800. UNUSED_P(base);
  3801. UNUSED_P(publicId);
  3802. if (systemId == NULL)
  3803. return XML_STATUS_OK;
  3804. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  3805. if (ext_parser == NULL)
  3806. fail("Could not create external entity parser");
  3807. if (! xcstrcmp(systemId, XCS("004-1.ent"))) {
  3808. if (_XML_Parse_SINGLE_BYTES(ext_parser, text1, (int)strlen(text1), XML_TRUE)
  3809. == XML_STATUS_ERROR)
  3810. xml_failure(ext_parser);
  3811. } else if (! xcstrcmp(systemId, XCS("004-2.ent"))) {
  3812. ExtFaults *fault = (ExtFaults *)XML_GetUserData(parser);
  3813. enum XML_Status status;
  3814. enum XML_Error error;
  3815. status = _XML_Parse_SINGLE_BYTES(ext_parser, fault->parse_text,
  3816. (int)strlen(fault->parse_text), XML_TRUE);
  3817. if (fault->error == XML_ERROR_NONE) {
  3818. if (status == XML_STATUS_ERROR)
  3819. xml_failure(ext_parser);
  3820. } else {
  3821. if (status != XML_STATUS_ERROR)
  3822. fail(fault->fail_text);
  3823. error = XML_GetErrorCode(ext_parser);
  3824. if (error != fault->error
  3825. && (fault->error != XML_ERROR_XML_DECL
  3826. || error != XML_ERROR_TEXT_DECL))
  3827. xml_failure(ext_parser);
  3828. }
  3829. }
  3830. XML_ParserFree(ext_parser);
  3831. return XML_STATUS_OK;
  3832. }
  3833. START_TEST(test_external_entity_values) {
  3834. const char *text = "<!DOCTYPE doc SYSTEM '004-1.ent'>\n"
  3835. "<doc></doc>\n";
  3836. ExtFaults data_004_2[] = {
  3837. {"<!ATTLIST doc a1 CDATA 'value'>", NULL, NULL, XML_ERROR_NONE},
  3838. {"<!ATTLIST $doc a1 CDATA 'value'>", "Invalid token not faulted", NULL,
  3839. XML_ERROR_INVALID_TOKEN},
  3840. {"'wombat", "Unterminated string not faulted", NULL,
  3841. XML_ERROR_UNCLOSED_TOKEN},
  3842. {"\xe2\x82", "Partial UTF-8 character not faulted", NULL,
  3843. XML_ERROR_PARTIAL_CHAR},
  3844. {"<?xml version='1.0' encoding='utf-8'?>\n", NULL, NULL, XML_ERROR_NONE},
  3845. {"<?xml?>", "Malformed XML declaration not faulted", NULL,
  3846. XML_ERROR_XML_DECL},
  3847. {/* UTF-8 BOM */
  3848. "\xEF\xBB\xBF<!ATTLIST doc a1 CDATA 'value'>", NULL, NULL,
  3849. XML_ERROR_NONE},
  3850. {"<?xml version='1.0' encoding='utf-8'?>\n$",
  3851. "Invalid token after text declaration not faulted", NULL,
  3852. XML_ERROR_INVALID_TOKEN},
  3853. {"<?xml version='1.0' encoding='utf-8'?>\n'wombat",
  3854. "Unterminated string after text decl not faulted", NULL,
  3855. XML_ERROR_UNCLOSED_TOKEN},
  3856. {"<?xml version='1.0' encoding='utf-8'?>\n\xe2\x82",
  3857. "Partial UTF-8 character after text decl not faulted", NULL,
  3858. XML_ERROR_PARTIAL_CHAR},
  3859. {"%e1;", "Recursive parameter entity not faulted", NULL,
  3860. XML_ERROR_RECURSIVE_ENTITY_REF},
  3861. {NULL, NULL, NULL, XML_ERROR_NONE}};
  3862. int i;
  3863. for (i = 0; data_004_2[i].parse_text != NULL; i++) {
  3864. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  3865. XML_SetExternalEntityRefHandler(g_parser, external_entity_valuer);
  3866. XML_SetUserData(g_parser, &data_004_2[i]);
  3867. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  3868. == XML_STATUS_ERROR)
  3869. xml_failure(g_parser);
  3870. XML_ParserReset(g_parser, NULL);
  3871. }
  3872. }
  3873. END_TEST
  3874. /* Test the recursive parse interacts with a not standalone handler */
  3875. static int XMLCALL
  3876. external_entity_not_standalone(XML_Parser parser, const XML_Char *context,
  3877. const XML_Char *base, const XML_Char *systemId,
  3878. const XML_Char *publicId) {
  3879. const char *text1 = "<!ELEMENT doc EMPTY>\n"
  3880. "<!ENTITY % e1 SYSTEM 'bar'>\n"
  3881. "%e1;\n";
  3882. const char *text2 = "<!ATTLIST doc a1 CDATA 'value'>";
  3883. XML_Parser ext_parser;
  3884. UNUSED_P(base);
  3885. UNUSED_P(publicId);
  3886. if (systemId == NULL)
  3887. return XML_STATUS_OK;
  3888. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  3889. if (ext_parser == NULL)
  3890. fail("Could not create external entity parser");
  3891. if (! xcstrcmp(systemId, XCS("foo"))) {
  3892. XML_SetNotStandaloneHandler(ext_parser, reject_not_standalone_handler);
  3893. if (_XML_Parse_SINGLE_BYTES(ext_parser, text1, (int)strlen(text1), XML_TRUE)
  3894. != XML_STATUS_ERROR)
  3895. fail("Expected not standalone rejection");
  3896. if (XML_GetErrorCode(ext_parser) != XML_ERROR_NOT_STANDALONE)
  3897. xml_failure(ext_parser);
  3898. XML_SetNotStandaloneHandler(ext_parser, NULL);
  3899. XML_ParserFree(ext_parser);
  3900. return XML_STATUS_ERROR;
  3901. } else if (! xcstrcmp(systemId, XCS("bar"))) {
  3902. if (_XML_Parse_SINGLE_BYTES(ext_parser, text2, (int)strlen(text2), XML_TRUE)
  3903. == XML_STATUS_ERROR)
  3904. xml_failure(ext_parser);
  3905. }
  3906. XML_ParserFree(ext_parser);
  3907. return XML_STATUS_OK;
  3908. }
  3909. START_TEST(test_ext_entity_not_standalone) {
  3910. const char *text = "<!DOCTYPE doc SYSTEM 'foo'>\n"
  3911. "<doc></doc>";
  3912. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  3913. XML_SetExternalEntityRefHandler(g_parser, external_entity_not_standalone);
  3914. expect_failure(text, XML_ERROR_EXTERNAL_ENTITY_HANDLING,
  3915. "Standalone rejection not caught");
  3916. }
  3917. END_TEST
  3918. static int XMLCALL
  3919. external_entity_value_aborter(XML_Parser parser, const XML_Char *context,
  3920. const XML_Char *base, const XML_Char *systemId,
  3921. const XML_Char *publicId) {
  3922. const char *text1 = "<!ELEMENT doc EMPTY>\n"
  3923. "<!ENTITY % e1 SYSTEM '004-2.ent'>\n"
  3924. "<!ENTITY % e2 '%e1;'>\n"
  3925. "%e1;\n";
  3926. const char *text2 = "<?xml version='1.0' encoding='utf-8'?>";
  3927. XML_Parser ext_parser;
  3928. UNUSED_P(base);
  3929. UNUSED_P(publicId);
  3930. if (systemId == NULL)
  3931. return XML_STATUS_OK;
  3932. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  3933. if (ext_parser == NULL)
  3934. fail("Could not create external entity parser");
  3935. if (! xcstrcmp(systemId, XCS("004-1.ent"))) {
  3936. if (_XML_Parse_SINGLE_BYTES(ext_parser, text1, (int)strlen(text1), XML_TRUE)
  3937. == XML_STATUS_ERROR)
  3938. xml_failure(ext_parser);
  3939. }
  3940. if (! xcstrcmp(systemId, XCS("004-2.ent"))) {
  3941. XML_SetXmlDeclHandler(ext_parser, entity_suspending_xdecl_handler);
  3942. XML_SetUserData(ext_parser, ext_parser);
  3943. if (_XML_Parse_SINGLE_BYTES(ext_parser, text2, (int)strlen(text2), XML_TRUE)
  3944. != XML_STATUS_ERROR)
  3945. fail("Aborted parse not faulted");
  3946. if (XML_GetErrorCode(ext_parser) != XML_ERROR_ABORTED)
  3947. xml_failure(ext_parser);
  3948. }
  3949. XML_ParserFree(ext_parser);
  3950. return XML_STATUS_OK;
  3951. }
  3952. START_TEST(test_ext_entity_value_abort) {
  3953. const char *text = "<!DOCTYPE doc SYSTEM '004-1.ent'>\n"
  3954. "<doc></doc>\n";
  3955. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  3956. XML_SetExternalEntityRefHandler(g_parser, external_entity_value_aborter);
  3957. resumable = XML_FALSE;
  3958. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  3959. == XML_STATUS_ERROR)
  3960. xml_failure(g_parser);
  3961. }
  3962. END_TEST
  3963. START_TEST(test_bad_public_doctype) {
  3964. const char *text = "<?xml version='1.0' encoding='utf-8'?>\n"
  3965. "<!DOCTYPE doc PUBLIC '{BadName}' 'test'>\n"
  3966. "<doc></doc>";
  3967. /* Setting a handler provokes a particular code path */
  3968. XML_SetDoctypeDeclHandler(g_parser, dummy_start_doctype_handler,
  3969. dummy_end_doctype_handler);
  3970. expect_failure(text, XML_ERROR_PUBLICID, "Bad Public ID not failed");
  3971. }
  3972. END_TEST
  3973. /* Test based on ibm/valid/P32/ibm32v04.xml */
  3974. START_TEST(test_attribute_enum_value) {
  3975. const char *text = "<?xml version='1.0' standalone='no'?>\n"
  3976. "<!DOCTYPE animal SYSTEM 'test.dtd'>\n"
  3977. "<animal>This is a \n <a/> \n\nyellow tiger</animal>";
  3978. ExtTest dtd_data
  3979. = {"<!ELEMENT animal (#PCDATA|a)*>\n"
  3980. "<!ELEMENT a EMPTY>\n"
  3981. "<!ATTLIST animal xml:space (default|preserve) 'preserve'>",
  3982. NULL, NULL};
  3983. const XML_Char *expected = XCS("This is a \n \n\nyellow tiger");
  3984. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader);
  3985. XML_SetUserData(g_parser, &dtd_data);
  3986. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  3987. /* An attribute list handler provokes a different code path */
  3988. XML_SetAttlistDeclHandler(g_parser, dummy_attlist_decl_handler);
  3989. run_ext_character_check(text, &dtd_data, expected);
  3990. }
  3991. END_TEST
  3992. /* Slightly bizarrely, the library seems to silently ignore entity
  3993. * definitions for predefined entities, even when they are wrong. The
  3994. * language of the XML 1.0 spec is somewhat unhelpful as to what ought
  3995. * to happen, so this is currently treated as acceptable.
  3996. */
  3997. START_TEST(test_predefined_entity_redefinition) {
  3998. const char *text = "<!DOCTYPE doc [\n"
  3999. "<!ENTITY apos 'foo'>\n"
  4000. "]>\n"
  4001. "<doc>&apos;</doc>";
  4002. run_character_check(text, XCS("'"));
  4003. }
  4004. END_TEST
  4005. /* Test that the parser stops processing the DTD after an unresolved
  4006. * parameter entity is encountered.
  4007. */
  4008. START_TEST(test_dtd_stop_processing) {
  4009. const char *text = "<!DOCTYPE doc [\n"
  4010. "%foo;\n"
  4011. "<!ENTITY bar 'bas'>\n"
  4012. "]><doc/>";
  4013. XML_SetEntityDeclHandler(g_parser, dummy_entity_decl_handler);
  4014. dummy_handler_flags = 0;
  4015. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4016. == XML_STATUS_ERROR)
  4017. xml_failure(g_parser);
  4018. if (dummy_handler_flags != 0)
  4019. fail("DTD processing still going after undefined PE");
  4020. }
  4021. END_TEST
  4022. /* Test public notations with no system ID */
  4023. START_TEST(test_public_notation_no_sysid) {
  4024. const char *text = "<!DOCTYPE doc [\n"
  4025. "<!NOTATION note PUBLIC 'foo'>\n"
  4026. "<!ELEMENT doc EMPTY>\n"
  4027. "]>\n<doc/>";
  4028. dummy_handler_flags = 0;
  4029. XML_SetNotationDeclHandler(g_parser, dummy_notation_decl_handler);
  4030. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4031. == XML_STATUS_ERROR)
  4032. xml_failure(g_parser);
  4033. if (dummy_handler_flags != DUMMY_NOTATION_DECL_HANDLER_FLAG)
  4034. fail("Notation declaration handler not called");
  4035. }
  4036. END_TEST
  4037. static void XMLCALL
  4038. record_element_start_handler(void *userData, const XML_Char *name,
  4039. const XML_Char **atts) {
  4040. UNUSED_P(atts);
  4041. CharData_AppendXMLChars((CharData *)userData, name, (int)xcstrlen(name));
  4042. }
  4043. START_TEST(test_nested_groups) {
  4044. const char *text
  4045. = "<!DOCTYPE doc [\n"
  4046. "<!ELEMENT doc "
  4047. /* Sixteen elements per line */
  4048. "(e,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,"
  4049. "(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?"
  4050. "))))))))))))))))))))))))))))))))>\n"
  4051. "<!ELEMENT e EMPTY>"
  4052. "]>\n"
  4053. "<doc><e/></doc>";
  4054. CharData storage;
  4055. CharData_Init(&storage);
  4056. XML_SetElementDeclHandler(g_parser, dummy_element_decl_handler);
  4057. XML_SetStartElementHandler(g_parser, record_element_start_handler);
  4058. XML_SetUserData(g_parser, &storage);
  4059. dummy_handler_flags = 0;
  4060. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4061. == XML_STATUS_ERROR)
  4062. xml_failure(g_parser);
  4063. CharData_CheckXMLChars(&storage, XCS("doce"));
  4064. if (dummy_handler_flags != DUMMY_ELEMENT_DECL_HANDLER_FLAG)
  4065. fail("Element handler not fired");
  4066. }
  4067. END_TEST
  4068. START_TEST(test_group_choice) {
  4069. const char *text = "<!DOCTYPE doc [\n"
  4070. "<!ELEMENT doc (a|b|c)+>\n"
  4071. "<!ELEMENT a EMPTY>\n"
  4072. "<!ELEMENT b (#PCDATA)>\n"
  4073. "<!ELEMENT c ANY>\n"
  4074. "]>\n"
  4075. "<doc>\n"
  4076. "<a/>\n"
  4077. "<b attr='foo'>This is a foo</b>\n"
  4078. "<c></c>\n"
  4079. "</doc>\n";
  4080. XML_SetElementDeclHandler(g_parser, dummy_element_decl_handler);
  4081. dummy_handler_flags = 0;
  4082. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4083. == XML_STATUS_ERROR)
  4084. xml_failure(g_parser);
  4085. if (dummy_handler_flags != DUMMY_ELEMENT_DECL_HANDLER_FLAG)
  4086. fail("Element handler flag not raised");
  4087. }
  4088. END_TEST
  4089. static int XMLCALL
  4090. external_entity_public(XML_Parser parser, const XML_Char *context,
  4091. const XML_Char *base, const XML_Char *systemId,
  4092. const XML_Char *publicId) {
  4093. const char *text1 = (const char *)XML_GetUserData(parser);
  4094. const char *text2 = "<!ATTLIST doc a CDATA 'value'>";
  4095. const char *text = NULL;
  4096. XML_Parser ext_parser;
  4097. int parse_res;
  4098. UNUSED_P(base);
  4099. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  4100. if (ext_parser == NULL)
  4101. return XML_STATUS_ERROR;
  4102. if (systemId != NULL && ! xcstrcmp(systemId, XCS("http://example.org/"))) {
  4103. text = text1;
  4104. } else if (publicId != NULL && ! xcstrcmp(publicId, XCS("foo"))) {
  4105. text = text2;
  4106. } else
  4107. fail("Unexpected parameters to external entity parser");
  4108. assert(text != NULL);
  4109. parse_res
  4110. = _XML_Parse_SINGLE_BYTES(ext_parser, text, (int)strlen(text), XML_TRUE);
  4111. XML_ParserFree(ext_parser);
  4112. return parse_res;
  4113. }
  4114. START_TEST(test_standalone_parameter_entity) {
  4115. const char *text = "<?xml version='1.0' standalone='yes'?>\n"
  4116. "<!DOCTYPE doc SYSTEM 'http://example.org/' [\n"
  4117. "<!ENTITY % entity '<!ELEMENT doc (#PCDATA)>'>\n"
  4118. "%entity;\n"
  4119. "]>\n"
  4120. "<doc></doc>";
  4121. char dtd_data[] = "<!ENTITY % e1 'foo'>\n";
  4122. XML_SetUserData(g_parser, dtd_data);
  4123. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  4124. XML_SetExternalEntityRefHandler(g_parser, external_entity_public);
  4125. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4126. == XML_STATUS_ERROR)
  4127. xml_failure(g_parser);
  4128. }
  4129. END_TEST
  4130. /* Test skipping of parameter entity in an external DTD */
  4131. /* Derived from ibm/invalid/P69/ibm69i01.xml */
  4132. START_TEST(test_skipped_parameter_entity) {
  4133. const char *text = "<?xml version='1.0'?>\n"
  4134. "<!DOCTYPE root SYSTEM 'http://example.org/dtd.ent' [\n"
  4135. "<!ELEMENT root (#PCDATA|a)* >\n"
  4136. "]>\n"
  4137. "<root></root>";
  4138. ExtTest dtd_data = {"%pe2;", NULL, NULL};
  4139. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader);
  4140. XML_SetUserData(g_parser, &dtd_data);
  4141. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  4142. XML_SetSkippedEntityHandler(g_parser, dummy_skip_handler);
  4143. dummy_handler_flags = 0;
  4144. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4145. == XML_STATUS_ERROR)
  4146. xml_failure(g_parser);
  4147. if (dummy_handler_flags != DUMMY_SKIP_HANDLER_FLAG)
  4148. fail("Skip handler not executed");
  4149. }
  4150. END_TEST
  4151. /* Test recursive parameter entity definition rejected in external DTD */
  4152. START_TEST(test_recursive_external_parameter_entity) {
  4153. const char *text = "<?xml version='1.0'?>\n"
  4154. "<!DOCTYPE root SYSTEM 'http://example.org/dtd.ent' [\n"
  4155. "<!ELEMENT root (#PCDATA|a)* >\n"
  4156. "]>\n"
  4157. "<root></root>";
  4158. ExtFaults dtd_data = {"<!ENTITY % pe2 '&#37;pe2;'>\n%pe2;",
  4159. "Recursive external parameter entity not faulted", NULL,
  4160. XML_ERROR_RECURSIVE_ENTITY_REF};
  4161. XML_SetExternalEntityRefHandler(g_parser, external_entity_faulter);
  4162. XML_SetUserData(g_parser, &dtd_data);
  4163. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  4164. expect_failure(text, XML_ERROR_EXTERNAL_ENTITY_HANDLING,
  4165. "Recursive external parameter not spotted");
  4166. }
  4167. END_TEST
  4168. /* Test undefined parameter entity in external entity handler */
  4169. static int XMLCALL
  4170. external_entity_devaluer(XML_Parser parser, const XML_Char *context,
  4171. const XML_Char *base, const XML_Char *systemId,
  4172. const XML_Char *publicId) {
  4173. const char *text = "<!ELEMENT doc EMPTY>\n"
  4174. "<!ENTITY % e1 SYSTEM 'bar'>\n"
  4175. "%e1;\n";
  4176. XML_Parser ext_parser;
  4177. intptr_t clear_handler = (intptr_t)XML_GetUserData(parser);
  4178. UNUSED_P(base);
  4179. UNUSED_P(publicId);
  4180. if (systemId == NULL || ! xcstrcmp(systemId, XCS("bar")))
  4181. return XML_STATUS_OK;
  4182. if (xcstrcmp(systemId, XCS("foo")))
  4183. fail("Unexpected system ID");
  4184. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  4185. if (ext_parser == NULL)
  4186. fail("Could note create external entity parser");
  4187. if (clear_handler)
  4188. XML_SetExternalEntityRefHandler(ext_parser, NULL);
  4189. if (_XML_Parse_SINGLE_BYTES(ext_parser, text, (int)strlen(text), XML_TRUE)
  4190. == XML_STATUS_ERROR)
  4191. xml_failure(ext_parser);
  4192. XML_ParserFree(ext_parser);
  4193. return XML_STATUS_OK;
  4194. }
  4195. START_TEST(test_undefined_ext_entity_in_external_dtd) {
  4196. const char *text = "<!DOCTYPE doc SYSTEM 'foo'>\n"
  4197. "<doc></doc>\n";
  4198. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  4199. XML_SetExternalEntityRefHandler(g_parser, external_entity_devaluer);
  4200. XML_SetUserData(g_parser, (void *)(intptr_t)XML_FALSE);
  4201. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4202. == XML_STATUS_ERROR)
  4203. xml_failure(g_parser);
  4204. /* Now repeat without the external entity ref handler invoking
  4205. * another copy of itself.
  4206. */
  4207. XML_ParserReset(g_parser, NULL);
  4208. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  4209. XML_SetExternalEntityRefHandler(g_parser, external_entity_devaluer);
  4210. XML_SetUserData(g_parser, (void *)(intptr_t)XML_TRUE);
  4211. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4212. == XML_STATUS_ERROR)
  4213. xml_failure(g_parser);
  4214. }
  4215. END_TEST
  4216. static void XMLCALL
  4217. aborting_xdecl_handler(void *userData, const XML_Char *version,
  4218. const XML_Char *encoding, int standalone) {
  4219. UNUSED_P(userData);
  4220. UNUSED_P(version);
  4221. UNUSED_P(encoding);
  4222. UNUSED_P(standalone);
  4223. XML_StopParser(g_parser, resumable);
  4224. XML_SetXmlDeclHandler(g_parser, NULL);
  4225. }
  4226. /* Test suspending the parse on receiving an XML declaration works */
  4227. START_TEST(test_suspend_xdecl) {
  4228. const char *text = long_character_data_text;
  4229. XML_SetXmlDeclHandler(g_parser, aborting_xdecl_handler);
  4230. resumable = XML_TRUE;
  4231. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4232. != XML_STATUS_SUSPENDED)
  4233. xml_failure(g_parser);
  4234. if (XML_GetErrorCode(g_parser) != XML_ERROR_NONE)
  4235. xml_failure(g_parser);
  4236. /* Attempt to start a new parse while suspended */
  4237. if (XML_Parse(g_parser, text, (int)strlen(text), XML_TRUE)
  4238. != XML_STATUS_ERROR)
  4239. fail("Attempt to parse while suspended not faulted");
  4240. if (XML_GetErrorCode(g_parser) != XML_ERROR_SUSPENDED)
  4241. fail("Suspended parse not faulted with correct error");
  4242. }
  4243. END_TEST
  4244. /* Test aborting the parse in an epilog works */
  4245. static void XMLCALL
  4246. selective_aborting_default_handler(void *userData, const XML_Char *s, int len) {
  4247. const XML_Char *match = (const XML_Char *)userData;
  4248. if (match == NULL
  4249. || (xcstrlen(match) == (unsigned)len && ! xcstrncmp(match, s, len))) {
  4250. XML_StopParser(g_parser, resumable);
  4251. XML_SetDefaultHandler(g_parser, NULL);
  4252. }
  4253. }
  4254. START_TEST(test_abort_epilog) {
  4255. const char *text = "<doc></doc>\n\r\n";
  4256. XML_Char match[] = XCS("\r");
  4257. XML_SetDefaultHandler(g_parser, selective_aborting_default_handler);
  4258. XML_SetUserData(g_parser, match);
  4259. resumable = XML_FALSE;
  4260. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4261. != XML_STATUS_ERROR)
  4262. fail("Abort not triggered");
  4263. if (XML_GetErrorCode(g_parser) != XML_ERROR_ABORTED)
  4264. xml_failure(g_parser);
  4265. }
  4266. END_TEST
  4267. /* Test a different code path for abort in the epilog */
  4268. START_TEST(test_abort_epilog_2) {
  4269. const char *text = "<doc></doc>\n";
  4270. XML_Char match[] = XCS("\n");
  4271. XML_SetDefaultHandler(g_parser, selective_aborting_default_handler);
  4272. XML_SetUserData(g_parser, match);
  4273. resumable = XML_FALSE;
  4274. expect_failure(text, XML_ERROR_ABORTED, "Abort not triggered");
  4275. }
  4276. END_TEST
  4277. /* Test suspension from the epilog */
  4278. START_TEST(test_suspend_epilog) {
  4279. const char *text = "<doc></doc>\n";
  4280. XML_Char match[] = XCS("\n");
  4281. XML_SetDefaultHandler(g_parser, selective_aborting_default_handler);
  4282. XML_SetUserData(g_parser, match);
  4283. resumable = XML_TRUE;
  4284. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4285. != XML_STATUS_SUSPENDED)
  4286. xml_failure(g_parser);
  4287. }
  4288. END_TEST
  4289. static void XMLCALL
  4290. suspending_end_handler(void *userData, const XML_Char *s) {
  4291. UNUSED_P(s);
  4292. XML_StopParser((XML_Parser)userData, 1);
  4293. }
  4294. START_TEST(test_suspend_in_sole_empty_tag) {
  4295. const char *text = "<doc/>";
  4296. enum XML_Status rc;
  4297. XML_SetEndElementHandler(g_parser, suspending_end_handler);
  4298. XML_SetUserData(g_parser, g_parser);
  4299. rc = _XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE);
  4300. if (rc == XML_STATUS_ERROR)
  4301. xml_failure(g_parser);
  4302. else if (rc != XML_STATUS_SUSPENDED)
  4303. fail("Suspend not triggered");
  4304. rc = XML_ResumeParser(g_parser);
  4305. if (rc == XML_STATUS_ERROR)
  4306. xml_failure(g_parser);
  4307. else if (rc != XML_STATUS_OK)
  4308. fail("Resume failed");
  4309. }
  4310. END_TEST
  4311. START_TEST(test_unfinished_epilog) {
  4312. const char *text = "<doc></doc><";
  4313. expect_failure(text, XML_ERROR_UNCLOSED_TOKEN,
  4314. "Incomplete epilog entry not faulted");
  4315. }
  4316. END_TEST
  4317. START_TEST(test_partial_char_in_epilog) {
  4318. const char *text = "<doc></doc>\xe2\x82";
  4319. /* First check that no fault is raised if the parse is not finished */
  4320. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_FALSE)
  4321. == XML_STATUS_ERROR)
  4322. xml_failure(g_parser);
  4323. /* Now check that it is faulted once we finish */
  4324. if (XML_ParseBuffer(g_parser, 0, XML_TRUE) != XML_STATUS_ERROR)
  4325. fail("Partial character in epilog not faulted");
  4326. if (XML_GetErrorCode(g_parser) != XML_ERROR_PARTIAL_CHAR)
  4327. xml_failure(g_parser);
  4328. }
  4329. END_TEST
  4330. START_TEST(test_hash_collision) {
  4331. /* For full coverage of the lookup routine, we need to ensure a
  4332. * hash collision even though we can only tell that we have one
  4333. * through breakpoint debugging or coverage statistics. The
  4334. * following will cause a hash collision on machines with a 64-bit
  4335. * long type; others will have to experiment. The full coverage
  4336. * tests invoked from qa.sh usually provide a hash collision, but
  4337. * not always. This is an attempt to provide insurance.
  4338. */
  4339. #define COLLIDING_HASH_SALT (unsigned long)_SIP_ULL(0xffffffffU, 0xff99fc90U)
  4340. const char *text
  4341. = "<doc>\n"
  4342. "<a1/><a2/><a3/><a4/><a5/><a6/><a7/><a8/>\n"
  4343. "<b1></b1><b2 attr='foo'>This is a foo</b2><b3></b3><b4></b4>\n"
  4344. "<b5></b5><b6></b6><b7></b7><b8></b8>\n"
  4345. "<c1/><c2/><c3/><c4/><c5/><c6/><c7/><c8/>\n"
  4346. "<d1/><d2/><d3/><d4/><d5/><d6/><d7/>\n"
  4347. "<d8>This triggers the table growth and collides with b2</d8>\n"
  4348. "</doc>\n";
  4349. XML_SetHashSalt(g_parser, COLLIDING_HASH_SALT);
  4350. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4351. == XML_STATUS_ERROR)
  4352. xml_failure(g_parser);
  4353. }
  4354. END_TEST
  4355. #undef COLLIDING_HASH_SALT
  4356. /* Test resuming a parse suspended in entity substitution */
  4357. static void XMLCALL
  4358. start_element_suspender(void *userData, const XML_Char *name,
  4359. const XML_Char **atts) {
  4360. UNUSED_P(userData);
  4361. UNUSED_P(atts);
  4362. if (! xcstrcmp(name, XCS("suspend")))
  4363. XML_StopParser(g_parser, XML_TRUE);
  4364. if (! xcstrcmp(name, XCS("abort")))
  4365. XML_StopParser(g_parser, XML_FALSE);
  4366. }
  4367. START_TEST(test_suspend_resume_internal_entity) {
  4368. const char *text
  4369. = "<!DOCTYPE doc [\n"
  4370. "<!ENTITY foo '<suspend>Hi<suspend>Ho</suspend></suspend>'>\n"
  4371. "]>\n"
  4372. "<doc>&foo;</doc>\n";
  4373. const XML_Char *expected1 = XCS("Hi");
  4374. const XML_Char *expected2 = XCS("HiHo");
  4375. CharData storage;
  4376. CharData_Init(&storage);
  4377. XML_SetStartElementHandler(g_parser, start_element_suspender);
  4378. XML_SetCharacterDataHandler(g_parser, accumulate_characters);
  4379. XML_SetUserData(g_parser, &storage);
  4380. if (XML_Parse(g_parser, text, (int)strlen(text), XML_TRUE)
  4381. != XML_STATUS_SUSPENDED)
  4382. xml_failure(g_parser);
  4383. CharData_CheckXMLChars(&storage, XCS(""));
  4384. if (XML_ResumeParser(g_parser) != XML_STATUS_SUSPENDED)
  4385. xml_failure(g_parser);
  4386. CharData_CheckXMLChars(&storage, expected1);
  4387. if (XML_ResumeParser(g_parser) != XML_STATUS_OK)
  4388. xml_failure(g_parser);
  4389. CharData_CheckXMLChars(&storage, expected2);
  4390. }
  4391. END_TEST
  4392. /* Test syntax error is caught at parse resumption */
  4393. START_TEST(test_resume_entity_with_syntax_error) {
  4394. const char *text = "<!DOCTYPE doc [\n"
  4395. "<!ENTITY foo '<suspend>Hi</wombat>'>\n"
  4396. "]>\n"
  4397. "<doc>&foo;</doc>\n";
  4398. XML_SetStartElementHandler(g_parser, start_element_suspender);
  4399. if (XML_Parse(g_parser, text, (int)strlen(text), XML_TRUE)
  4400. != XML_STATUS_SUSPENDED)
  4401. xml_failure(g_parser);
  4402. if (XML_ResumeParser(g_parser) != XML_STATUS_ERROR)
  4403. fail("Syntax error in entity not faulted");
  4404. if (XML_GetErrorCode(g_parser) != XML_ERROR_TAG_MISMATCH)
  4405. xml_failure(g_parser);
  4406. }
  4407. END_TEST
  4408. /* Test suspending and resuming in a parameter entity substitution */
  4409. static void XMLCALL
  4410. element_decl_suspender(void *userData, const XML_Char *name,
  4411. XML_Content *model) {
  4412. UNUSED_P(userData);
  4413. UNUSED_P(name);
  4414. XML_StopParser(g_parser, XML_TRUE);
  4415. XML_FreeContentModel(g_parser, model);
  4416. }
  4417. START_TEST(test_suspend_resume_parameter_entity) {
  4418. const char *text = "<!DOCTYPE doc [\n"
  4419. "<!ENTITY % foo '<!ELEMENT doc (#PCDATA)*>'>\n"
  4420. "%foo;\n"
  4421. "]>\n"
  4422. "<doc>Hello, world</doc>";
  4423. const XML_Char *expected = XCS("Hello, world");
  4424. CharData storage;
  4425. CharData_Init(&storage);
  4426. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  4427. XML_SetElementDeclHandler(g_parser, element_decl_suspender);
  4428. XML_SetCharacterDataHandler(g_parser, accumulate_characters);
  4429. XML_SetUserData(g_parser, &storage);
  4430. if (XML_Parse(g_parser, text, (int)strlen(text), XML_TRUE)
  4431. != XML_STATUS_SUSPENDED)
  4432. xml_failure(g_parser);
  4433. CharData_CheckXMLChars(&storage, XCS(""));
  4434. if (XML_ResumeParser(g_parser) != XML_STATUS_OK)
  4435. xml_failure(g_parser);
  4436. CharData_CheckXMLChars(&storage, expected);
  4437. }
  4438. END_TEST
  4439. /* Test attempting to use parser after an error is faulted */
  4440. START_TEST(test_restart_on_error) {
  4441. const char *text = "<$doc><doc></doc>";
  4442. if (XML_Parse(g_parser, text, (int)strlen(text), XML_TRUE)
  4443. != XML_STATUS_ERROR)
  4444. fail("Invalid tag name not faulted");
  4445. if (XML_GetErrorCode(g_parser) != XML_ERROR_INVALID_TOKEN)
  4446. xml_failure(g_parser);
  4447. if (XML_Parse(g_parser, NULL, 0, XML_TRUE) != XML_STATUS_ERROR)
  4448. fail("Restarting invalid parse not faulted");
  4449. if (XML_GetErrorCode(g_parser) != XML_ERROR_INVALID_TOKEN)
  4450. xml_failure(g_parser);
  4451. }
  4452. END_TEST
  4453. /* Test that angle brackets in an attribute default value are faulted */
  4454. START_TEST(test_reject_lt_in_attribute_value) {
  4455. const char *text = "<!DOCTYPE doc [<!ATTLIST doc a CDATA '<bar>'>]>\n"
  4456. "<doc></doc>";
  4457. expect_failure(text, XML_ERROR_INVALID_TOKEN,
  4458. "Bad attribute default not faulted");
  4459. }
  4460. END_TEST
  4461. START_TEST(test_reject_unfinished_param_in_att_value) {
  4462. const char *text = "<!DOCTYPE doc [<!ATTLIST doc a CDATA '&foo'>]>\n"
  4463. "<doc></doc>";
  4464. expect_failure(text, XML_ERROR_INVALID_TOKEN,
  4465. "Bad attribute default not faulted");
  4466. }
  4467. END_TEST
  4468. START_TEST(test_trailing_cr_in_att_value) {
  4469. const char *text = "<doc a='value\r'/>";
  4470. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4471. == XML_STATUS_ERROR)
  4472. xml_failure(g_parser);
  4473. }
  4474. END_TEST
  4475. /* Try parsing a general entity within a parameter entity in a
  4476. * standalone internal DTD. Covers a corner case in the parser.
  4477. */
  4478. START_TEST(test_standalone_internal_entity) {
  4479. const char *text = "<?xml version='1.0' standalone='yes' ?>\n"
  4480. "<!DOCTYPE doc [\n"
  4481. " <!ELEMENT doc (#PCDATA)>\n"
  4482. " <!ENTITY % pe '<!ATTLIST doc att2 CDATA \"&ge;\">'>\n"
  4483. " <!ENTITY ge 'AttDefaultValue'>\n"
  4484. " %pe;\n"
  4485. "]>\n"
  4486. "<doc att2='any'/>";
  4487. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  4488. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4489. == XML_STATUS_ERROR)
  4490. xml_failure(g_parser);
  4491. }
  4492. END_TEST
  4493. /* Test that a reference to an unknown external entity is skipped */
  4494. START_TEST(test_skipped_external_entity) {
  4495. const char *text = "<!DOCTYPE doc SYSTEM 'http://example.org/'>\n"
  4496. "<doc></doc>\n";
  4497. ExtTest test_data = {"<!ELEMENT doc EMPTY>\n"
  4498. "<!ENTITY % e2 '%e1;'>\n",
  4499. NULL, NULL};
  4500. XML_SetUserData(g_parser, &test_data);
  4501. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  4502. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader);
  4503. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4504. == XML_STATUS_ERROR)
  4505. xml_failure(g_parser);
  4506. }
  4507. END_TEST
  4508. /* Test a different form of unknown external entity */
  4509. typedef struct ext_hdlr_data {
  4510. const char *parse_text;
  4511. XML_ExternalEntityRefHandler handler;
  4512. } ExtHdlrData;
  4513. static int XMLCALL
  4514. external_entity_oneshot_loader(XML_Parser parser, const XML_Char *context,
  4515. const XML_Char *base, const XML_Char *systemId,
  4516. const XML_Char *publicId) {
  4517. ExtHdlrData *test_data = (ExtHdlrData *)XML_GetUserData(parser);
  4518. XML_Parser ext_parser;
  4519. UNUSED_P(base);
  4520. UNUSED_P(systemId);
  4521. UNUSED_P(publicId);
  4522. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  4523. if (ext_parser == NULL)
  4524. fail("Could not create external entity parser.");
  4525. /* Use the requested entity parser for further externals */
  4526. XML_SetExternalEntityRefHandler(ext_parser, test_data->handler);
  4527. if (_XML_Parse_SINGLE_BYTES(ext_parser, test_data->parse_text,
  4528. (int)strlen(test_data->parse_text), XML_TRUE)
  4529. == XML_STATUS_ERROR) {
  4530. xml_failure(ext_parser);
  4531. }
  4532. XML_ParserFree(ext_parser);
  4533. return XML_STATUS_OK;
  4534. }
  4535. START_TEST(test_skipped_null_loaded_ext_entity) {
  4536. const char *text = "<!DOCTYPE doc SYSTEM 'http://example.org/one.ent'>\n"
  4537. "<doc />";
  4538. ExtHdlrData test_data
  4539. = {"<!ENTITY % pe1 SYSTEM 'http://example.org/two.ent'>\n"
  4540. "<!ENTITY % pe2 '%pe1;'>\n"
  4541. "%pe2;\n",
  4542. external_entity_null_loader};
  4543. XML_SetUserData(g_parser, &test_data);
  4544. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  4545. XML_SetExternalEntityRefHandler(g_parser, external_entity_oneshot_loader);
  4546. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4547. == XML_STATUS_ERROR)
  4548. xml_failure(g_parser);
  4549. }
  4550. END_TEST
  4551. START_TEST(test_skipped_unloaded_ext_entity) {
  4552. const char *text = "<!DOCTYPE doc SYSTEM 'http://example.org/one.ent'>\n"
  4553. "<doc />";
  4554. ExtHdlrData test_data
  4555. = {"<!ENTITY % pe1 SYSTEM 'http://example.org/two.ent'>\n"
  4556. "<!ENTITY % pe2 '%pe1;'>\n"
  4557. "%pe2;\n",
  4558. NULL};
  4559. XML_SetUserData(g_parser, &test_data);
  4560. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  4561. XML_SetExternalEntityRefHandler(g_parser, external_entity_oneshot_loader);
  4562. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4563. == XML_STATUS_ERROR)
  4564. xml_failure(g_parser);
  4565. }
  4566. END_TEST
  4567. /* Test that a parameter entity value ending with a carriage return
  4568. * has it translated internally into a newline.
  4569. */
  4570. START_TEST(test_param_entity_with_trailing_cr) {
  4571. #define PARAM_ENTITY_NAME "pe"
  4572. #define PARAM_ENTITY_CORE_VALUE "<!ATTLIST doc att CDATA \"default\">"
  4573. const char *text = "<!DOCTYPE doc SYSTEM 'http://example.org/'>\n"
  4574. "<doc/>";
  4575. ExtTest test_data
  4576. = {"<!ENTITY % " PARAM_ENTITY_NAME " '" PARAM_ENTITY_CORE_VALUE "\r'>\n"
  4577. "%" PARAM_ENTITY_NAME ";\n",
  4578. NULL, NULL};
  4579. XML_SetUserData(g_parser, &test_data);
  4580. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  4581. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader);
  4582. XML_SetEntityDeclHandler(g_parser, param_entity_match_handler);
  4583. entity_name_to_match = XCS(PARAM_ENTITY_NAME);
  4584. entity_value_to_match = XCS(PARAM_ENTITY_CORE_VALUE) XCS("\n");
  4585. entity_match_flag = ENTITY_MATCH_NOT_FOUND;
  4586. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4587. == XML_STATUS_ERROR)
  4588. xml_failure(g_parser);
  4589. if (entity_match_flag == ENTITY_MATCH_FAIL)
  4590. fail("Parameter entity CR->NEWLINE conversion failed");
  4591. else if (entity_match_flag == ENTITY_MATCH_NOT_FOUND)
  4592. fail("Parameter entity not parsed");
  4593. }
  4594. #undef PARAM_ENTITY_NAME
  4595. #undef PARAM_ENTITY_CORE_VALUE
  4596. END_TEST
  4597. START_TEST(test_invalid_character_entity) {
  4598. const char *text = "<!DOCTYPE doc [\n"
  4599. " <!ENTITY entity '&#x110000;'>\n"
  4600. "]>\n"
  4601. "<doc>&entity;</doc>";
  4602. expect_failure(text, XML_ERROR_BAD_CHAR_REF,
  4603. "Out of range character reference not faulted");
  4604. }
  4605. END_TEST
  4606. START_TEST(test_invalid_character_entity_2) {
  4607. const char *text = "<!DOCTYPE doc [\n"
  4608. " <!ENTITY entity '&#xg0;'>\n"
  4609. "]>\n"
  4610. "<doc>&entity;</doc>";
  4611. expect_failure(text, XML_ERROR_INVALID_TOKEN,
  4612. "Out of range character reference not faulted");
  4613. }
  4614. END_TEST
  4615. START_TEST(test_invalid_character_entity_3) {
  4616. const char text[] =
  4617. /* <!DOCTYPE doc [\n */
  4618. "\0<\0!\0D\0O\0C\0T\0Y\0P\0E\0 \0d\0o\0c\0 \0[\0\n"
  4619. /* U+0E04 = KHO KHWAI
  4620. * U+0E08 = CHO CHAN */
  4621. /* <!ENTITY entity '&\u0e04\u0e08;'>\n */
  4622. "\0<\0!\0E\0N\0T\0I\0T\0Y\0 \0e\0n\0t\0i\0t\0y\0 "
  4623. "\0'\0&\x0e\x04\x0e\x08\0;\0'\0>\0\n"
  4624. /* ]>\n */
  4625. "\0]\0>\0\n"
  4626. /* <doc>&entity;</doc> */
  4627. "\0<\0d\0o\0c\0>\0&\0e\0n\0t\0i\0t\0y\0;\0<\0/\0d\0o\0c\0>";
  4628. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  4629. != XML_STATUS_ERROR)
  4630. fail("Invalid start of entity name not faulted");
  4631. if (XML_GetErrorCode(g_parser) != XML_ERROR_UNDEFINED_ENTITY)
  4632. xml_failure(g_parser);
  4633. }
  4634. END_TEST
  4635. START_TEST(test_invalid_character_entity_4) {
  4636. const char *text = "<!DOCTYPE doc [\n"
  4637. " <!ENTITY entity '&#1114112;'>\n" /* = &#x110000 */
  4638. "]>\n"
  4639. "<doc>&entity;</doc>";
  4640. expect_failure(text, XML_ERROR_BAD_CHAR_REF,
  4641. "Out of range character reference not faulted");
  4642. }
  4643. END_TEST
  4644. /* Test that processing instructions are picked up by a default handler */
  4645. START_TEST(test_pi_handled_in_default) {
  4646. const char *text = "<?test processing instruction?>\n<doc/>";
  4647. const XML_Char *expected = XCS("<?test processing instruction?>\n<doc/>");
  4648. CharData storage;
  4649. CharData_Init(&storage);
  4650. XML_SetDefaultHandler(g_parser, accumulate_characters);
  4651. XML_SetUserData(g_parser, &storage);
  4652. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4653. == XML_STATUS_ERROR)
  4654. xml_failure(g_parser);
  4655. CharData_CheckXMLChars(&storage, expected);
  4656. }
  4657. END_TEST
  4658. /* Test that comments are picked up by a default handler */
  4659. START_TEST(test_comment_handled_in_default) {
  4660. const char *text = "<!-- This is a comment -->\n<doc/>";
  4661. const XML_Char *expected = XCS("<!-- This is a comment -->\n<doc/>");
  4662. CharData storage;
  4663. CharData_Init(&storage);
  4664. XML_SetDefaultHandler(g_parser, accumulate_characters);
  4665. XML_SetUserData(g_parser, &storage);
  4666. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4667. == XML_STATUS_ERROR)
  4668. xml_failure(g_parser);
  4669. CharData_CheckXMLChars(&storage, expected);
  4670. }
  4671. END_TEST
  4672. /* Test PIs that look almost but not quite like XML declarations */
  4673. static void XMLCALL
  4674. accumulate_pi_characters(void *userData, const XML_Char *target,
  4675. const XML_Char *data) {
  4676. CharData *storage = (CharData *)userData;
  4677. CharData_AppendXMLChars(storage, target, -1);
  4678. CharData_AppendXMLChars(storage, XCS(": "), 2);
  4679. CharData_AppendXMLChars(storage, data, -1);
  4680. CharData_AppendXMLChars(storage, XCS("\n"), 1);
  4681. }
  4682. START_TEST(test_pi_yml) {
  4683. const char *text = "<?yml something like data?><doc/>";
  4684. const XML_Char *expected = XCS("yml: something like data\n");
  4685. CharData storage;
  4686. CharData_Init(&storage);
  4687. XML_SetProcessingInstructionHandler(g_parser, accumulate_pi_characters);
  4688. XML_SetUserData(g_parser, &storage);
  4689. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4690. == XML_STATUS_ERROR)
  4691. xml_failure(g_parser);
  4692. CharData_CheckXMLChars(&storage, expected);
  4693. }
  4694. END_TEST
  4695. START_TEST(test_pi_xnl) {
  4696. const char *text = "<?xnl nothing like data?><doc/>";
  4697. const XML_Char *expected = XCS("xnl: nothing like data\n");
  4698. CharData storage;
  4699. CharData_Init(&storage);
  4700. XML_SetProcessingInstructionHandler(g_parser, accumulate_pi_characters);
  4701. XML_SetUserData(g_parser, &storage);
  4702. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4703. == XML_STATUS_ERROR)
  4704. xml_failure(g_parser);
  4705. CharData_CheckXMLChars(&storage, expected);
  4706. }
  4707. END_TEST
  4708. START_TEST(test_pi_xmm) {
  4709. const char *text = "<?xmm everything like data?><doc/>";
  4710. const XML_Char *expected = XCS("xmm: everything like data\n");
  4711. CharData storage;
  4712. CharData_Init(&storage);
  4713. XML_SetProcessingInstructionHandler(g_parser, accumulate_pi_characters);
  4714. XML_SetUserData(g_parser, &storage);
  4715. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4716. == XML_STATUS_ERROR)
  4717. xml_failure(g_parser);
  4718. CharData_CheckXMLChars(&storage, expected);
  4719. }
  4720. END_TEST
  4721. START_TEST(test_utf16_pi) {
  4722. const char text[] =
  4723. /* <?{KHO KHWAI}{CHO CHAN}?>
  4724. * where {KHO KHWAI} = U+0E04
  4725. * and {CHO CHAN} = U+0E08
  4726. */
  4727. "<\0?\0\x04\x0e\x08\x0e?\0>\0"
  4728. /* <q/> */
  4729. "<\0q\0/\0>\0";
  4730. #ifdef XML_UNICODE
  4731. const XML_Char *expected = XCS("\x0e04\x0e08: \n");
  4732. #else
  4733. const XML_Char *expected = XCS("\xe0\xb8\x84\xe0\xb8\x88: \n");
  4734. #endif
  4735. CharData storage;
  4736. CharData_Init(&storage);
  4737. XML_SetProcessingInstructionHandler(g_parser, accumulate_pi_characters);
  4738. XML_SetUserData(g_parser, &storage);
  4739. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  4740. == XML_STATUS_ERROR)
  4741. xml_failure(g_parser);
  4742. CharData_CheckXMLChars(&storage, expected);
  4743. }
  4744. END_TEST
  4745. START_TEST(test_utf16_be_pi) {
  4746. const char text[] =
  4747. /* <?{KHO KHWAI}{CHO CHAN}?>
  4748. * where {KHO KHWAI} = U+0E04
  4749. * and {CHO CHAN} = U+0E08
  4750. */
  4751. "\0<\0?\x0e\x04\x0e\x08\0?\0>"
  4752. /* <q/> */
  4753. "\0<\0q\0/\0>";
  4754. #ifdef XML_UNICODE
  4755. const XML_Char *expected = XCS("\x0e04\x0e08: \n");
  4756. #else
  4757. const XML_Char *expected = XCS("\xe0\xb8\x84\xe0\xb8\x88: \n");
  4758. #endif
  4759. CharData storage;
  4760. CharData_Init(&storage);
  4761. XML_SetProcessingInstructionHandler(g_parser, accumulate_pi_characters);
  4762. XML_SetUserData(g_parser, &storage);
  4763. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  4764. == XML_STATUS_ERROR)
  4765. xml_failure(g_parser);
  4766. CharData_CheckXMLChars(&storage, expected);
  4767. }
  4768. END_TEST
  4769. /* Test that comments can be picked up and translated */
  4770. static void XMLCALL
  4771. accumulate_comment(void *userData, const XML_Char *data) {
  4772. CharData *storage = (CharData *)userData;
  4773. CharData_AppendXMLChars(storage, data, -1);
  4774. }
  4775. START_TEST(test_utf16_be_comment) {
  4776. const char text[] =
  4777. /* <!-- Comment A --> */
  4778. "\0<\0!\0-\0-\0 \0C\0o\0m\0m\0e\0n\0t\0 \0A\0 \0-\0-\0>\0\n"
  4779. /* <doc/> */
  4780. "\0<\0d\0o\0c\0/\0>";
  4781. const XML_Char *expected = XCS(" Comment A ");
  4782. CharData storage;
  4783. CharData_Init(&storage);
  4784. XML_SetCommentHandler(g_parser, accumulate_comment);
  4785. XML_SetUserData(g_parser, &storage);
  4786. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  4787. == XML_STATUS_ERROR)
  4788. xml_failure(g_parser);
  4789. CharData_CheckXMLChars(&storage, expected);
  4790. }
  4791. END_TEST
  4792. START_TEST(test_utf16_le_comment) {
  4793. const char text[] =
  4794. /* <!-- Comment B --> */
  4795. "<\0!\0-\0-\0 \0C\0o\0m\0m\0e\0n\0t\0 \0B\0 \0-\0-\0>\0\n\0"
  4796. /* <doc/> */
  4797. "<\0d\0o\0c\0/\0>\0";
  4798. const XML_Char *expected = XCS(" Comment B ");
  4799. CharData storage;
  4800. CharData_Init(&storage);
  4801. XML_SetCommentHandler(g_parser, accumulate_comment);
  4802. XML_SetUserData(g_parser, &storage);
  4803. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  4804. == XML_STATUS_ERROR)
  4805. xml_failure(g_parser);
  4806. CharData_CheckXMLChars(&storage, expected);
  4807. }
  4808. END_TEST
  4809. /* Test that the unknown encoding handler with map entries that expect
  4810. * conversion but no conversion function is faulted
  4811. */
  4812. static int XMLCALL
  4813. failing_converter(void *data, const char *s) {
  4814. UNUSED_P(data);
  4815. UNUSED_P(s);
  4816. /* Always claim to have failed */
  4817. return -1;
  4818. }
  4819. static int XMLCALL
  4820. prefix_converter(void *data, const char *s) {
  4821. UNUSED_P(data);
  4822. /* If the first byte is 0xff, raise an error */
  4823. if (s[0] == (char)-1)
  4824. return -1;
  4825. /* Just add the low bits of the first byte to the second */
  4826. return (s[1] + (s[0] & 0x7f)) & 0x01ff;
  4827. }
  4828. static int XMLCALL
  4829. MiscEncodingHandler(void *data, const XML_Char *encoding, XML_Encoding *info) {
  4830. int i;
  4831. int high_map = -2; /* Assume a 2-byte sequence */
  4832. if (! xcstrcmp(encoding, XCS("invalid-9"))
  4833. || ! xcstrcmp(encoding, XCS("ascii-like"))
  4834. || ! xcstrcmp(encoding, XCS("invalid-len"))
  4835. || ! xcstrcmp(encoding, XCS("invalid-a"))
  4836. || ! xcstrcmp(encoding, XCS("invalid-surrogate"))
  4837. || ! xcstrcmp(encoding, XCS("invalid-high")))
  4838. high_map = -1;
  4839. for (i = 0; i < 128; ++i)
  4840. info->map[i] = i;
  4841. for (; i < 256; ++i)
  4842. info->map[i] = high_map;
  4843. /* If required, put an invalid value in the ASCII entries */
  4844. if (! xcstrcmp(encoding, XCS("invalid-9")))
  4845. info->map[9] = 5;
  4846. /* If required, have a top-bit set character starts a 5-byte sequence */
  4847. if (! xcstrcmp(encoding, XCS("invalid-len")))
  4848. info->map[0x81] = -5;
  4849. /* If required, make a top-bit set character a valid ASCII character */
  4850. if (! xcstrcmp(encoding, XCS("invalid-a")))
  4851. info->map[0x82] = 'a';
  4852. /* If required, give a top-bit set character a forbidden value,
  4853. * what would otherwise be the first of a surrogate pair.
  4854. */
  4855. if (! xcstrcmp(encoding, XCS("invalid-surrogate")))
  4856. info->map[0x83] = 0xd801;
  4857. /* If required, give a top-bit set character too high a value */
  4858. if (! xcstrcmp(encoding, XCS("invalid-high")))
  4859. info->map[0x84] = 0x010101;
  4860. info->data = data;
  4861. info->release = NULL;
  4862. if (! xcstrcmp(encoding, XCS("failing-conv")))
  4863. info->convert = failing_converter;
  4864. else if (! xcstrcmp(encoding, XCS("prefix-conv")))
  4865. info->convert = prefix_converter;
  4866. else
  4867. info->convert = NULL;
  4868. return XML_STATUS_OK;
  4869. }
  4870. START_TEST(test_missing_encoding_conversion_fn) {
  4871. const char *text = "<?xml version='1.0' encoding='no-conv'?>\n"
  4872. "<doc>\x81</doc>";
  4873. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  4874. /* MiscEncodingHandler sets up an encoding with every top-bit-set
  4875. * character introducing a two-byte sequence. For this, it
  4876. * requires a convert function. The above function call doesn't
  4877. * pass one through, so when BadEncodingHandler actually gets
  4878. * called it should supply an invalid encoding.
  4879. */
  4880. expect_failure(text, XML_ERROR_UNKNOWN_ENCODING,
  4881. "Encoding with missing convert() not faulted");
  4882. }
  4883. END_TEST
  4884. START_TEST(test_failing_encoding_conversion_fn) {
  4885. const char *text = "<?xml version='1.0' encoding='failing-conv'?>\n"
  4886. "<doc>\x81</doc>";
  4887. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  4888. /* BadEncodingHandler sets up an encoding with every top-bit-set
  4889. * character introducing a two-byte sequence. For this, it
  4890. * requires a convert function. The above function call passes
  4891. * one that insists all possible sequences are invalid anyway.
  4892. */
  4893. expect_failure(text, XML_ERROR_INVALID_TOKEN,
  4894. "Encoding with failing convert() not faulted");
  4895. }
  4896. END_TEST
  4897. /* Test unknown encoding conversions */
  4898. START_TEST(test_unknown_encoding_success) {
  4899. const char *text = "<?xml version='1.0' encoding='prefix-conv'?>\n"
  4900. /* Equivalent to <eoc>Hello, world</eoc> */
  4901. "<\x81\x64\x80oc>Hello, world</\x81\x64\x80oc>";
  4902. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  4903. run_character_check(text, XCS("Hello, world"));
  4904. }
  4905. END_TEST
  4906. /* Test bad name character in unknown encoding */
  4907. START_TEST(test_unknown_encoding_bad_name) {
  4908. const char *text = "<?xml version='1.0' encoding='prefix-conv'?>\n"
  4909. "<\xff\x64oc>Hello, world</\xff\x64oc>";
  4910. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  4911. expect_failure(text, XML_ERROR_INVALID_TOKEN,
  4912. "Bad name start in unknown encoding not faulted");
  4913. }
  4914. END_TEST
  4915. /* Test bad mid-name character in unknown encoding */
  4916. START_TEST(test_unknown_encoding_bad_name_2) {
  4917. const char *text = "<?xml version='1.0' encoding='prefix-conv'?>\n"
  4918. "<d\xffoc>Hello, world</d\xffoc>";
  4919. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  4920. expect_failure(text, XML_ERROR_INVALID_TOKEN,
  4921. "Bad name in unknown encoding not faulted");
  4922. }
  4923. END_TEST
  4924. /* Test element name that is long enough to fill the conversion buffer
  4925. * in an unknown encoding, finishing with an encoded character.
  4926. */
  4927. START_TEST(test_unknown_encoding_long_name_1) {
  4928. const char *text = "<?xml version='1.0' encoding='prefix-conv'?>\n"
  4929. "<abcdefghabcdefghabcdefghijkl\x80m\x80n\x80o\x80p>"
  4930. "Hi"
  4931. "</abcdefghabcdefghabcdefghijkl\x80m\x80n\x80o\x80p>";
  4932. const XML_Char *expected = XCS("abcdefghabcdefghabcdefghijklmnop");
  4933. CharData storage;
  4934. CharData_Init(&storage);
  4935. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  4936. XML_SetStartElementHandler(g_parser, record_element_start_handler);
  4937. XML_SetUserData(g_parser, &storage);
  4938. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4939. == XML_STATUS_ERROR)
  4940. xml_failure(g_parser);
  4941. CharData_CheckXMLChars(&storage, expected);
  4942. }
  4943. END_TEST
  4944. /* Test element name that is long enough to fill the conversion buffer
  4945. * in an unknown encoding, finishing with an simple character.
  4946. */
  4947. START_TEST(test_unknown_encoding_long_name_2) {
  4948. const char *text = "<?xml version='1.0' encoding='prefix-conv'?>\n"
  4949. "<abcdefghabcdefghabcdefghijklmnop>"
  4950. "Hi"
  4951. "</abcdefghabcdefghabcdefghijklmnop>";
  4952. const XML_Char *expected = XCS("abcdefghabcdefghabcdefghijklmnop");
  4953. CharData storage;
  4954. CharData_Init(&storage);
  4955. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  4956. XML_SetStartElementHandler(g_parser, record_element_start_handler);
  4957. XML_SetUserData(g_parser, &storage);
  4958. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  4959. == XML_STATUS_ERROR)
  4960. xml_failure(g_parser);
  4961. CharData_CheckXMLChars(&storage, expected);
  4962. }
  4963. END_TEST
  4964. START_TEST(test_invalid_unknown_encoding) {
  4965. const char *text = "<?xml version='1.0' encoding='invalid-9'?>\n"
  4966. "<doc>Hello world</doc>";
  4967. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  4968. expect_failure(text, XML_ERROR_UNKNOWN_ENCODING,
  4969. "Invalid unknown encoding not faulted");
  4970. }
  4971. END_TEST
  4972. START_TEST(test_unknown_ascii_encoding_ok) {
  4973. const char *text = "<?xml version='1.0' encoding='ascii-like'?>\n"
  4974. "<doc>Hello, world</doc>";
  4975. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  4976. run_character_check(text, XCS("Hello, world"));
  4977. }
  4978. END_TEST
  4979. START_TEST(test_unknown_ascii_encoding_fail) {
  4980. const char *text = "<?xml version='1.0' encoding='ascii-like'?>\n"
  4981. "<doc>Hello, \x80 world</doc>";
  4982. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  4983. expect_failure(text, XML_ERROR_INVALID_TOKEN,
  4984. "Invalid character not faulted");
  4985. }
  4986. END_TEST
  4987. START_TEST(test_unknown_encoding_invalid_length) {
  4988. const char *text = "<?xml version='1.0' encoding='invalid-len'?>\n"
  4989. "<doc>Hello, world</doc>";
  4990. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  4991. expect_failure(text, XML_ERROR_UNKNOWN_ENCODING,
  4992. "Invalid unknown encoding not faulted");
  4993. }
  4994. END_TEST
  4995. START_TEST(test_unknown_encoding_invalid_topbit) {
  4996. const char *text = "<?xml version='1.0' encoding='invalid-a'?>\n"
  4997. "<doc>Hello, world</doc>";
  4998. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  4999. expect_failure(text, XML_ERROR_UNKNOWN_ENCODING,
  5000. "Invalid unknown encoding not faulted");
  5001. }
  5002. END_TEST
  5003. START_TEST(test_unknown_encoding_invalid_surrogate) {
  5004. const char *text = "<?xml version='1.0' encoding='invalid-surrogate'?>\n"
  5005. "<doc>Hello, \x82 world</doc>";
  5006. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  5007. expect_failure(text, XML_ERROR_INVALID_TOKEN,
  5008. "Invalid unknown encoding not faulted");
  5009. }
  5010. END_TEST
  5011. START_TEST(test_unknown_encoding_invalid_high) {
  5012. const char *text = "<?xml version='1.0' encoding='invalid-high'?>\n"
  5013. "<doc>Hello, world</doc>";
  5014. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  5015. expect_failure(text, XML_ERROR_UNKNOWN_ENCODING,
  5016. "Invalid unknown encoding not faulted");
  5017. }
  5018. END_TEST
  5019. START_TEST(test_unknown_encoding_invalid_attr_value) {
  5020. const char *text = "<?xml version='1.0' encoding='prefix-conv'?>\n"
  5021. "<doc attr='\xff\x30'/>";
  5022. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  5023. expect_failure(text, XML_ERROR_INVALID_TOKEN,
  5024. "Invalid attribute valid not faulted");
  5025. }
  5026. END_TEST
  5027. /* Test an external entity parser set to use latin-1 detects UTF-16
  5028. * BOMs correctly.
  5029. */
  5030. enum ee_parse_flags { EE_PARSE_NONE = 0x00, EE_PARSE_FULL_BUFFER = 0x01 };
  5031. typedef struct ExtTest2 {
  5032. const char *parse_text;
  5033. int parse_len;
  5034. const XML_Char *encoding;
  5035. CharData *storage;
  5036. enum ee_parse_flags flags;
  5037. } ExtTest2;
  5038. static int XMLCALL
  5039. external_entity_loader2(XML_Parser parser, const XML_Char *context,
  5040. const XML_Char *base, const XML_Char *systemId,
  5041. const XML_Char *publicId) {
  5042. ExtTest2 *test_data = (ExtTest2 *)XML_GetUserData(parser);
  5043. XML_Parser extparser;
  5044. UNUSED_P(base);
  5045. UNUSED_P(systemId);
  5046. UNUSED_P(publicId);
  5047. extparser = XML_ExternalEntityParserCreate(parser, context, NULL);
  5048. if (extparser == NULL)
  5049. fail("Coulr not create external entity parser");
  5050. if (test_data->encoding != NULL) {
  5051. if (! XML_SetEncoding(extparser, test_data->encoding))
  5052. fail("XML_SetEncoding() ignored for external entity");
  5053. }
  5054. if (test_data->flags & EE_PARSE_FULL_BUFFER) {
  5055. if (XML_Parse(extparser, test_data->parse_text, test_data->parse_len,
  5056. XML_TRUE)
  5057. == XML_STATUS_ERROR) {
  5058. xml_failure(extparser);
  5059. }
  5060. } else if (_XML_Parse_SINGLE_BYTES(extparser, test_data->parse_text,
  5061. test_data->parse_len, XML_TRUE)
  5062. == XML_STATUS_ERROR) {
  5063. xml_failure(extparser);
  5064. }
  5065. XML_ParserFree(extparser);
  5066. return XML_STATUS_OK;
  5067. }
  5068. /* Test that UTF-16 BOM does not select UTF-16 given explicit encoding */
  5069. static void XMLCALL
  5070. ext2_accumulate_characters(void *userData, const XML_Char *s, int len) {
  5071. ExtTest2 *test_data = (ExtTest2 *)userData;
  5072. accumulate_characters(test_data->storage, s, len);
  5073. }
  5074. START_TEST(test_ext_entity_latin1_utf16le_bom) {
  5075. const char *text = "<!DOCTYPE doc [\n"
  5076. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  5077. "]>\n"
  5078. "<doc>&en;</doc>";
  5079. ExtTest2 test_data
  5080. = {/* If UTF-16, 0xfeff is the BOM and 0x204c is black left bullet */
  5081. /* If Latin-1, 0xff = Y-diaeresis, 0xfe = lowercase thorn,
  5082. * 0x4c = L and 0x20 is a space
  5083. */
  5084. "\xff\xfe\x4c\x20", 4, XCS("iso-8859-1"), NULL, EE_PARSE_NONE};
  5085. #ifdef XML_UNICODE
  5086. const XML_Char *expected = XCS("\x00ff\x00feL ");
  5087. #else
  5088. /* In UTF-8, y-diaeresis is 0xc3 0xbf, lowercase thorn is 0xc3 0xbe */
  5089. const XML_Char *expected = XCS("\xc3\xbf\xc3\xbeL ");
  5090. #endif
  5091. CharData storage;
  5092. CharData_Init(&storage);
  5093. test_data.storage = &storage;
  5094. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader2);
  5095. XML_SetUserData(g_parser, &test_data);
  5096. XML_SetCharacterDataHandler(g_parser, ext2_accumulate_characters);
  5097. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  5098. == XML_STATUS_ERROR)
  5099. xml_failure(g_parser);
  5100. CharData_CheckXMLChars(&storage, expected);
  5101. }
  5102. END_TEST
  5103. START_TEST(test_ext_entity_latin1_utf16be_bom) {
  5104. const char *text = "<!DOCTYPE doc [\n"
  5105. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  5106. "]>\n"
  5107. "<doc>&en;</doc>";
  5108. ExtTest2 test_data
  5109. = {/* If UTF-16, 0xfeff is the BOM and 0x204c is black left bullet */
  5110. /* If Latin-1, 0xff = Y-diaeresis, 0xfe = lowercase thorn,
  5111. * 0x4c = L and 0x20 is a space
  5112. */
  5113. "\xfe\xff\x20\x4c", 4, XCS("iso-8859-1"), NULL, EE_PARSE_NONE};
  5114. #ifdef XML_UNICODE
  5115. const XML_Char *expected = XCS("\x00fe\x00ff L");
  5116. #else
  5117. /* In UTF-8, y-diaeresis is 0xc3 0xbf, lowercase thorn is 0xc3 0xbe */
  5118. const XML_Char *expected = XCS("\xc3\xbe\xc3\xbf L");
  5119. #endif
  5120. CharData storage;
  5121. CharData_Init(&storage);
  5122. test_data.storage = &storage;
  5123. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader2);
  5124. XML_SetUserData(g_parser, &test_data);
  5125. XML_SetCharacterDataHandler(g_parser, ext2_accumulate_characters);
  5126. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  5127. == XML_STATUS_ERROR)
  5128. xml_failure(g_parser);
  5129. CharData_CheckXMLChars(&storage, expected);
  5130. }
  5131. END_TEST
  5132. /* Parsing the full buffer rather than a byte at a time makes a
  5133. * difference to the encoding scanning code, so repeat the above tests
  5134. * without breaking them down by byte.
  5135. */
  5136. START_TEST(test_ext_entity_latin1_utf16le_bom2) {
  5137. const char *text = "<!DOCTYPE doc [\n"
  5138. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  5139. "]>\n"
  5140. "<doc>&en;</doc>";
  5141. ExtTest2 test_data
  5142. = {/* If UTF-16, 0xfeff is the BOM and 0x204c is black left bullet */
  5143. /* If Latin-1, 0xff = Y-diaeresis, 0xfe = lowercase thorn,
  5144. * 0x4c = L and 0x20 is a space
  5145. */
  5146. "\xff\xfe\x4c\x20", 4, XCS("iso-8859-1"), NULL, EE_PARSE_FULL_BUFFER};
  5147. #ifdef XML_UNICODE
  5148. const XML_Char *expected = XCS("\x00ff\x00feL ");
  5149. #else
  5150. /* In UTF-8, y-diaeresis is 0xc3 0xbf, lowercase thorn is 0xc3 0xbe */
  5151. const XML_Char *expected = XCS("\xc3\xbf\xc3\xbeL ");
  5152. #endif
  5153. CharData storage;
  5154. CharData_Init(&storage);
  5155. test_data.storage = &storage;
  5156. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader2);
  5157. XML_SetUserData(g_parser, &test_data);
  5158. XML_SetCharacterDataHandler(g_parser, ext2_accumulate_characters);
  5159. if (XML_Parse(g_parser, text, (int)strlen(text), XML_TRUE)
  5160. == XML_STATUS_ERROR)
  5161. xml_failure(g_parser);
  5162. CharData_CheckXMLChars(&storage, expected);
  5163. }
  5164. END_TEST
  5165. START_TEST(test_ext_entity_latin1_utf16be_bom2) {
  5166. const char *text = "<!DOCTYPE doc [\n"
  5167. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  5168. "]>\n"
  5169. "<doc>&en;</doc>";
  5170. ExtTest2 test_data
  5171. = {/* If UTF-16, 0xfeff is the BOM and 0x204c is black left bullet */
  5172. /* If Latin-1, 0xff = Y-diaeresis, 0xfe = lowercase thorn,
  5173. * 0x4c = L and 0x20 is a space
  5174. */
  5175. "\xfe\xff\x20\x4c", 4, XCS("iso-8859-1"), NULL, EE_PARSE_FULL_BUFFER};
  5176. #ifdef XML_UNICODE
  5177. const XML_Char *expected = XCS("\x00fe\x00ff L");
  5178. #else
  5179. /* In UTF-8, y-diaeresis is 0xc3 0xbf, lowercase thorn is 0xc3 0xbe */
  5180. const XML_Char *expected = "\xc3\xbe\xc3\xbf L";
  5181. #endif
  5182. CharData storage;
  5183. CharData_Init(&storage);
  5184. test_data.storage = &storage;
  5185. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader2);
  5186. XML_SetUserData(g_parser, &test_data);
  5187. XML_SetCharacterDataHandler(g_parser, ext2_accumulate_characters);
  5188. if (XML_Parse(g_parser, text, (int)strlen(text), XML_TRUE)
  5189. == XML_STATUS_ERROR)
  5190. xml_failure(g_parser);
  5191. CharData_CheckXMLChars(&storage, expected);
  5192. }
  5193. END_TEST
  5194. /* Test little-endian UTF-16 given an explicit big-endian encoding */
  5195. START_TEST(test_ext_entity_utf16_be) {
  5196. const char *text = "<!DOCTYPE doc [\n"
  5197. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  5198. "]>\n"
  5199. "<doc>&en;</doc>";
  5200. ExtTest2 test_data
  5201. = {"<\0e\0/\0>\0", 8, XCS("utf-16be"), NULL, EE_PARSE_NONE};
  5202. #ifdef XML_UNICODE
  5203. const XML_Char *expected = XCS("\x3c00\x6500\x2f00\x3e00");
  5204. #else
  5205. const XML_Char *expected = XCS("\xe3\xb0\x80" /* U+3C00 */
  5206. "\xe6\x94\x80" /* U+6500 */
  5207. "\xe2\xbc\x80" /* U+2F00 */
  5208. "\xe3\xb8\x80"); /* U+3E00 */
  5209. #endif
  5210. CharData storage;
  5211. CharData_Init(&storage);
  5212. test_data.storage = &storage;
  5213. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader2);
  5214. XML_SetUserData(g_parser, &test_data);
  5215. XML_SetCharacterDataHandler(g_parser, ext2_accumulate_characters);
  5216. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  5217. == XML_STATUS_ERROR)
  5218. xml_failure(g_parser);
  5219. CharData_CheckXMLChars(&storage, expected);
  5220. }
  5221. END_TEST
  5222. /* Test big-endian UTF-16 given an explicit little-endian encoding */
  5223. START_TEST(test_ext_entity_utf16_le) {
  5224. const char *text = "<!DOCTYPE doc [\n"
  5225. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  5226. "]>\n"
  5227. "<doc>&en;</doc>";
  5228. ExtTest2 test_data
  5229. = {"\0<\0e\0/\0>", 8, XCS("utf-16le"), NULL, EE_PARSE_NONE};
  5230. #ifdef XML_UNICODE
  5231. const XML_Char *expected = XCS("\x3c00\x6500\x2f00\x3e00");
  5232. #else
  5233. const XML_Char *expected = XCS("\xe3\xb0\x80" /* U+3C00 */
  5234. "\xe6\x94\x80" /* U+6500 */
  5235. "\xe2\xbc\x80" /* U+2F00 */
  5236. "\xe3\xb8\x80"); /* U+3E00 */
  5237. #endif
  5238. CharData storage;
  5239. CharData_Init(&storage);
  5240. test_data.storage = &storage;
  5241. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader2);
  5242. XML_SetUserData(g_parser, &test_data);
  5243. XML_SetCharacterDataHandler(g_parser, ext2_accumulate_characters);
  5244. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  5245. == XML_STATUS_ERROR)
  5246. xml_failure(g_parser);
  5247. CharData_CheckXMLChars(&storage, expected);
  5248. }
  5249. END_TEST
  5250. /* Test little-endian UTF-16 given no explicit encoding.
  5251. * The existing default encoding (UTF-8) is assumed to hold without a
  5252. * BOM to contradict it, so the entity value will in fact provoke an
  5253. * error because 0x00 is not a valid XML character. We parse the
  5254. * whole buffer in one go rather than feeding it in byte by byte to
  5255. * exercise different code paths in the initial scanning routines.
  5256. */
  5257. typedef struct ExtFaults2 {
  5258. const char *parse_text;
  5259. int parse_len;
  5260. const char *fail_text;
  5261. const XML_Char *encoding;
  5262. enum XML_Error error;
  5263. } ExtFaults2;
  5264. static int XMLCALL
  5265. external_entity_faulter2(XML_Parser parser, const XML_Char *context,
  5266. const XML_Char *base, const XML_Char *systemId,
  5267. const XML_Char *publicId) {
  5268. ExtFaults2 *test_data = (ExtFaults2 *)XML_GetUserData(parser);
  5269. XML_Parser extparser;
  5270. UNUSED_P(base);
  5271. UNUSED_P(systemId);
  5272. UNUSED_P(publicId);
  5273. extparser = XML_ExternalEntityParserCreate(parser, context, NULL);
  5274. if (extparser == NULL)
  5275. fail("Could not create external entity parser");
  5276. if (test_data->encoding != NULL) {
  5277. if (! XML_SetEncoding(extparser, test_data->encoding))
  5278. fail("XML_SetEncoding() ignored for external entity");
  5279. }
  5280. if (XML_Parse(extparser, test_data->parse_text, test_data->parse_len,
  5281. XML_TRUE)
  5282. != XML_STATUS_ERROR)
  5283. fail(test_data->fail_text);
  5284. if (XML_GetErrorCode(extparser) != test_data->error)
  5285. xml_failure(extparser);
  5286. XML_ParserFree(extparser);
  5287. return XML_STATUS_ERROR;
  5288. }
  5289. START_TEST(test_ext_entity_utf16_unknown) {
  5290. const char *text = "<!DOCTYPE doc [\n"
  5291. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  5292. "]>\n"
  5293. "<doc>&en;</doc>";
  5294. ExtFaults2 test_data
  5295. = {"a\0b\0c\0", 6, "Invalid character in entity not faulted", NULL,
  5296. XML_ERROR_INVALID_TOKEN};
  5297. XML_SetExternalEntityRefHandler(g_parser, external_entity_faulter2);
  5298. XML_SetUserData(g_parser, &test_data);
  5299. expect_failure(text, XML_ERROR_EXTERNAL_ENTITY_HANDLING,
  5300. "Invalid character should not have been accepted");
  5301. }
  5302. END_TEST
  5303. /* Test not-quite-UTF-8 BOM (0xEF 0xBB 0xBF) */
  5304. START_TEST(test_ext_entity_utf8_non_bom) {
  5305. const char *text = "<!DOCTYPE doc [\n"
  5306. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  5307. "]>\n"
  5308. "<doc>&en;</doc>";
  5309. ExtTest2 test_data
  5310. = {"\xef\xbb\x80", /* Arabic letter DAD medial form, U+FEC0 */
  5311. 3, NULL, NULL, EE_PARSE_NONE};
  5312. #ifdef XML_UNICODE
  5313. const XML_Char *expected = XCS("\xfec0");
  5314. #else
  5315. const XML_Char *expected = XCS("\xef\xbb\x80");
  5316. #endif
  5317. CharData storage;
  5318. CharData_Init(&storage);
  5319. test_data.storage = &storage;
  5320. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader2);
  5321. XML_SetUserData(g_parser, &test_data);
  5322. XML_SetCharacterDataHandler(g_parser, ext2_accumulate_characters);
  5323. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  5324. == XML_STATUS_ERROR)
  5325. xml_failure(g_parser);
  5326. CharData_CheckXMLChars(&storage, expected);
  5327. }
  5328. END_TEST
  5329. /* Test that UTF-8 in a CDATA section is correctly passed through */
  5330. START_TEST(test_utf8_in_cdata_section) {
  5331. const char *text = "<doc><![CDATA[one \xc3\xa9 two]]></doc>";
  5332. #ifdef XML_UNICODE
  5333. const XML_Char *expected = XCS("one \x00e9 two");
  5334. #else
  5335. const XML_Char *expected = XCS("one \xc3\xa9 two");
  5336. #endif
  5337. run_character_check(text, expected);
  5338. }
  5339. END_TEST
  5340. /* Test that little-endian UTF-16 in a CDATA section is handled */
  5341. START_TEST(test_utf8_in_cdata_section_2) {
  5342. const char *text = "<doc><![CDATA[\xc3\xa9]\xc3\xa9two]]></doc>";
  5343. #ifdef XML_UNICODE
  5344. const XML_Char *expected = XCS("\x00e9]\x00e9two");
  5345. #else
  5346. const XML_Char *expected = XCS("\xc3\xa9]\xc3\xa9two");
  5347. #endif
  5348. run_character_check(text, expected);
  5349. }
  5350. END_TEST
  5351. /* Test trailing spaces in elements are accepted */
  5352. static void XMLCALL
  5353. record_element_end_handler(void *userData, const XML_Char *name) {
  5354. CharData *storage = (CharData *)userData;
  5355. CharData_AppendXMLChars(storage, XCS("/"), 1);
  5356. CharData_AppendXMLChars(storage, name, -1);
  5357. }
  5358. START_TEST(test_trailing_spaces_in_elements) {
  5359. const char *text = "<doc >Hi</doc >";
  5360. const XML_Char *expected = XCS("doc/doc");
  5361. CharData storage;
  5362. CharData_Init(&storage);
  5363. XML_SetElementHandler(g_parser, record_element_start_handler,
  5364. record_element_end_handler);
  5365. XML_SetUserData(g_parser, &storage);
  5366. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  5367. == XML_STATUS_ERROR)
  5368. xml_failure(g_parser);
  5369. CharData_CheckXMLChars(&storage, expected);
  5370. }
  5371. END_TEST
  5372. START_TEST(test_utf16_attribute) {
  5373. const char text[] =
  5374. /* <d {KHO KHWAI}{CHO CHAN}='a'/>
  5375. * where {KHO KHWAI} = U+0E04 = 0xe0 0xb8 0x84 in UTF-8
  5376. * and {CHO CHAN} = U+0E08 = 0xe0 0xb8 0x88 in UTF-8
  5377. */
  5378. "<\0d\0 \0\x04\x0e\x08\x0e=\0'\0a\0'\0/\0>\0";
  5379. const XML_Char *expected = XCS("a");
  5380. CharData storage;
  5381. CharData_Init(&storage);
  5382. XML_SetStartElementHandler(g_parser, accumulate_attribute);
  5383. XML_SetUserData(g_parser, &storage);
  5384. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  5385. == XML_STATUS_ERROR)
  5386. xml_failure(g_parser);
  5387. CharData_CheckXMLChars(&storage, expected);
  5388. }
  5389. END_TEST
  5390. START_TEST(test_utf16_second_attr) {
  5391. /* <d a='1' {KHO KHWAI}{CHO CHAN}='2'/>
  5392. * where {KHO KHWAI} = U+0E04 = 0xe0 0xb8 0x84 in UTF-8
  5393. * and {CHO CHAN} = U+0E08 = 0xe0 0xb8 0x88 in UTF-8
  5394. */
  5395. const char text[] = "<\0d\0 \0a\0=\0'\0\x31\0'\0 \0"
  5396. "\x04\x0e\x08\x0e=\0'\0\x32\0'\0/\0>\0";
  5397. const XML_Char *expected = XCS("1");
  5398. CharData storage;
  5399. CharData_Init(&storage);
  5400. XML_SetStartElementHandler(g_parser, accumulate_attribute);
  5401. XML_SetUserData(g_parser, &storage);
  5402. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  5403. == XML_STATUS_ERROR)
  5404. xml_failure(g_parser);
  5405. CharData_CheckXMLChars(&storage, expected);
  5406. }
  5407. END_TEST
  5408. START_TEST(test_attr_after_solidus) {
  5409. const char *text = "<doc attr1='a' / attr2='b'>";
  5410. expect_failure(text, XML_ERROR_INVALID_TOKEN, "Misplaced / not faulted");
  5411. }
  5412. END_TEST
  5413. static void XMLCALL
  5414. accumulate_entity_decl(void *userData, const XML_Char *entityName,
  5415. int is_parameter_entity, const XML_Char *value,
  5416. int value_length, const XML_Char *base,
  5417. const XML_Char *systemId, const XML_Char *publicId,
  5418. const XML_Char *notationName) {
  5419. CharData *storage = (CharData *)userData;
  5420. UNUSED_P(is_parameter_entity);
  5421. UNUSED_P(base);
  5422. UNUSED_P(systemId);
  5423. UNUSED_P(publicId);
  5424. UNUSED_P(notationName);
  5425. CharData_AppendXMLChars(storage, entityName, -1);
  5426. CharData_AppendXMLChars(storage, XCS("="), 1);
  5427. CharData_AppendXMLChars(storage, value, value_length);
  5428. CharData_AppendXMLChars(storage, XCS("\n"), 1);
  5429. }
  5430. START_TEST(test_utf16_pe) {
  5431. /* <!DOCTYPE doc [
  5432. * <!ENTITY % {KHO KHWAI}{CHO CHAN} '<!ELEMENT doc (#PCDATA)>'>
  5433. * %{KHO KHWAI}{CHO CHAN};
  5434. * ]>
  5435. * <doc></doc>
  5436. *
  5437. * where {KHO KHWAI} = U+0E04 = 0xe0 0xb8 0x84 in UTF-8
  5438. * and {CHO CHAN} = U+0E08 = 0xe0 0xb8 0x88 in UTF-8
  5439. */
  5440. const char text[] = "\0<\0!\0D\0O\0C\0T\0Y\0P\0E\0 \0d\0o\0c\0 \0[\0\n"
  5441. "\0<\0!\0E\0N\0T\0I\0T\0Y\0 \0%\0 \x0e\x04\x0e\x08\0 "
  5442. "\0'\0<\0!\0E\0L\0E\0M\0E\0N\0T\0 "
  5443. "\0d\0o\0c\0 \0(\0#\0P\0C\0D\0A\0T\0A\0)\0>\0'\0>\0\n"
  5444. "\0%\x0e\x04\x0e\x08\0;\0\n"
  5445. "\0]\0>\0\n"
  5446. "\0<\0d\0o\0c\0>\0<\0/\0d\0o\0c\0>";
  5447. #ifdef XML_UNICODE
  5448. const XML_Char *expected = XCS("\x0e04\x0e08=<!ELEMENT doc (#PCDATA)>\n");
  5449. #else
  5450. const XML_Char *expected
  5451. = XCS("\xe0\xb8\x84\xe0\xb8\x88=<!ELEMENT doc (#PCDATA)>\n");
  5452. #endif
  5453. CharData storage;
  5454. CharData_Init(&storage);
  5455. XML_SetUserData(g_parser, &storage);
  5456. XML_SetEntityDeclHandler(g_parser, accumulate_entity_decl);
  5457. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  5458. == XML_STATUS_ERROR)
  5459. xml_failure(g_parser);
  5460. CharData_CheckXMLChars(&storage, expected);
  5461. }
  5462. END_TEST
  5463. /* Test that duff attribute description keywords are rejected */
  5464. START_TEST(test_bad_attr_desc_keyword) {
  5465. const char *text = "<!DOCTYPE doc [\n"
  5466. " <!ATTLIST doc attr CDATA #!IMPLIED>\n"
  5467. "]>\n"
  5468. "<doc />";
  5469. expect_failure(text, XML_ERROR_INVALID_TOKEN,
  5470. "Bad keyword !IMPLIED not faulted");
  5471. }
  5472. END_TEST
  5473. /* Test that an invalid attribute description keyword consisting of
  5474. * UTF-16 characters with their top bytes non-zero are correctly
  5475. * faulted
  5476. */
  5477. START_TEST(test_bad_attr_desc_keyword_utf16) {
  5478. /* <!DOCTYPE d [
  5479. * <!ATTLIST d a CDATA #{KHO KHWAI}{CHO CHAN}>
  5480. * ]><d/>
  5481. *
  5482. * where {KHO KHWAI} = U+0E04 = 0xe0 0xb8 0x84 in UTF-8
  5483. * and {CHO CHAN} = U+0E08 = 0xe0 0xb8 0x88 in UTF-8
  5484. */
  5485. const char text[]
  5486. = "\0<\0!\0D\0O\0C\0T\0Y\0P\0E\0 \0d\0 \0[\0\n"
  5487. "\0<\0!\0A\0T\0T\0L\0I\0S\0T\0 \0d\0 \0a\0 \0C\0D\0A\0T\0A\0 "
  5488. "\0#\x0e\x04\x0e\x08\0>\0\n"
  5489. "\0]\0>\0<\0d\0/\0>";
  5490. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  5491. != XML_STATUS_ERROR)
  5492. fail("Invalid UTF16 attribute keyword not faulted");
  5493. if (XML_GetErrorCode(g_parser) != XML_ERROR_SYNTAX)
  5494. xml_failure(g_parser);
  5495. }
  5496. END_TEST
  5497. /* Test that invalid syntax in a <!DOCTYPE> is rejected. Do this
  5498. * using prefix-encoding (see above) to trigger specific code paths
  5499. */
  5500. START_TEST(test_bad_doctype) {
  5501. const char *text = "<?xml version='1.0' encoding='prefix-conv'?>\n"
  5502. "<!DOCTYPE doc [ \x80\x44 ]><doc/>";
  5503. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  5504. expect_failure(text, XML_ERROR_SYNTAX,
  5505. "Invalid bytes in DOCTYPE not faulted");
  5506. }
  5507. END_TEST
  5508. START_TEST(test_bad_doctype_utf16) {
  5509. const char text[] =
  5510. /* <!DOCTYPE doc [ \x06f2 ]><doc/>
  5511. *
  5512. * U+06F2 = EXTENDED ARABIC-INDIC DIGIT TWO, a valid number
  5513. * (name character) but not a valid letter (name start character)
  5514. */
  5515. "\0<\0!\0D\0O\0C\0T\0Y\0P\0E\0 \0d\0o\0c\0 \0[\0 "
  5516. "\x06\xf2"
  5517. "\0 \0]\0>\0<\0d\0o\0c\0/\0>";
  5518. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  5519. != XML_STATUS_ERROR)
  5520. fail("Invalid bytes in DOCTYPE not faulted");
  5521. if (XML_GetErrorCode(g_parser) != XML_ERROR_SYNTAX)
  5522. xml_failure(g_parser);
  5523. }
  5524. END_TEST
  5525. START_TEST(test_bad_doctype_plus) {
  5526. const char *text = "<!DOCTYPE 1+ [ <!ENTITY foo 'bar'> ]>\n"
  5527. "<1+>&foo;</1+>";
  5528. expect_failure(text, XML_ERROR_INVALID_TOKEN,
  5529. "'+' in document name not faulted");
  5530. }
  5531. END_TEST
  5532. START_TEST(test_bad_doctype_star) {
  5533. const char *text = "<!DOCTYPE 1* [ <!ENTITY foo 'bar'> ]>\n"
  5534. "<1*>&foo;</1*>";
  5535. expect_failure(text, XML_ERROR_INVALID_TOKEN,
  5536. "'*' in document name not faulted");
  5537. }
  5538. END_TEST
  5539. START_TEST(test_bad_doctype_query) {
  5540. const char *text = "<!DOCTYPE 1? [ <!ENTITY foo 'bar'> ]>\n"
  5541. "<1?>&foo;</1?>";
  5542. expect_failure(text, XML_ERROR_INVALID_TOKEN,
  5543. "'?' in document name not faulted");
  5544. }
  5545. END_TEST
  5546. START_TEST(test_unknown_encoding_bad_ignore) {
  5547. const char *text = "<?xml version='1.0' encoding='prefix-conv'?>"
  5548. "<!DOCTYPE doc SYSTEM 'foo'>"
  5549. "<doc><e>&entity;</e></doc>";
  5550. ExtFaults fault = {"<![IGNORE[<!ELEMENT \xffG (#PCDATA)*>]]>",
  5551. "Invalid character not faulted", XCS("prefix-conv"),
  5552. XML_ERROR_INVALID_TOKEN};
  5553. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  5554. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  5555. XML_SetExternalEntityRefHandler(g_parser, external_entity_faulter);
  5556. XML_SetUserData(g_parser, &fault);
  5557. expect_failure(text, XML_ERROR_EXTERNAL_ENTITY_HANDLING,
  5558. "Bad IGNORE section with unknown encoding not failed");
  5559. }
  5560. END_TEST
  5561. START_TEST(test_entity_in_utf16_be_attr) {
  5562. const char text[] =
  5563. /* <e a='&#228; &#x00E4;'></e> */
  5564. "\0<\0e\0 \0a\0=\0'\0&\0#\0\x32\0\x32\0\x38\0;\0 "
  5565. "\0&\0#\0x\0\x30\0\x30\0E\0\x34\0;\0'\0>\0<\0/\0e\0>";
  5566. #ifdef XML_UNICODE
  5567. const XML_Char *expected = XCS("\x00e4 \x00e4");
  5568. #else
  5569. const XML_Char *expected = XCS("\xc3\xa4 \xc3\xa4");
  5570. #endif
  5571. CharData storage;
  5572. CharData_Init(&storage);
  5573. XML_SetUserData(g_parser, &storage);
  5574. XML_SetStartElementHandler(g_parser, accumulate_attribute);
  5575. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  5576. == XML_STATUS_ERROR)
  5577. xml_failure(g_parser);
  5578. CharData_CheckXMLChars(&storage, expected);
  5579. }
  5580. END_TEST
  5581. START_TEST(test_entity_in_utf16_le_attr) {
  5582. const char text[] =
  5583. /* <e a='&#228; &#x00E4;'></e> */
  5584. "<\0e\0 \0a\0=\0'\0&\0#\0\x32\0\x32\0\x38\0;\0 \0"
  5585. "&\0#\0x\0\x30\0\x30\0E\0\x34\0;\0'\0>\0<\0/\0e\0>\0";
  5586. #ifdef XML_UNICODE
  5587. const XML_Char *expected = XCS("\x00e4 \x00e4");
  5588. #else
  5589. const XML_Char *expected = XCS("\xc3\xa4 \xc3\xa4");
  5590. #endif
  5591. CharData storage;
  5592. CharData_Init(&storage);
  5593. XML_SetUserData(g_parser, &storage);
  5594. XML_SetStartElementHandler(g_parser, accumulate_attribute);
  5595. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  5596. == XML_STATUS_ERROR)
  5597. xml_failure(g_parser);
  5598. CharData_CheckXMLChars(&storage, expected);
  5599. }
  5600. END_TEST
  5601. START_TEST(test_entity_public_utf16_be) {
  5602. const char text[] =
  5603. /* <!DOCTYPE d [ */
  5604. "\0<\0!\0D\0O\0C\0T\0Y\0P\0E\0 \0d\0 \0[\0\n"
  5605. /* <!ENTITY % e PUBLIC 'foo' 'bar.ent'> */
  5606. "\0<\0!\0E\0N\0T\0I\0T\0Y\0 \0%\0 \0e\0 \0P\0U\0B\0L\0I\0C\0 "
  5607. "\0'\0f\0o\0o\0'\0 \0'\0b\0a\0r\0.\0e\0n\0t\0'\0>\0\n"
  5608. /* %e; */
  5609. "\0%\0e\0;\0\n"
  5610. /* ]> */
  5611. "\0]\0>\0\n"
  5612. /* <d>&j;</d> */
  5613. "\0<\0d\0>\0&\0j\0;\0<\0/\0d\0>";
  5614. ExtTest2 test_data = {/* <!ENTITY j 'baz'> */
  5615. "\0<\0!\0E\0N\0T\0I\0T\0Y\0 \0j\0 \0'\0b\0a\0z\0'\0>",
  5616. 34, NULL, NULL, EE_PARSE_NONE};
  5617. const XML_Char *expected = XCS("baz");
  5618. CharData storage;
  5619. CharData_Init(&storage);
  5620. test_data.storage = &storage;
  5621. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  5622. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader2);
  5623. XML_SetUserData(g_parser, &test_data);
  5624. XML_SetCharacterDataHandler(g_parser, ext2_accumulate_characters);
  5625. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  5626. == XML_STATUS_ERROR)
  5627. xml_failure(g_parser);
  5628. CharData_CheckXMLChars(&storage, expected);
  5629. }
  5630. END_TEST
  5631. START_TEST(test_entity_public_utf16_le) {
  5632. const char text[] =
  5633. /* <!DOCTYPE d [ */
  5634. "<\0!\0D\0O\0C\0T\0Y\0P\0E\0 \0d\0 \0[\0\n\0"
  5635. /* <!ENTITY % e PUBLIC 'foo' 'bar.ent'> */
  5636. "<\0!\0E\0N\0T\0I\0T\0Y\0 \0%\0 \0e\0 \0P\0U\0B\0L\0I\0C\0 \0"
  5637. "'\0f\0o\0o\0'\0 \0'\0b\0a\0r\0.\0e\0n\0t\0'\0>\0\n\0"
  5638. /* %e; */
  5639. "%\0e\0;\0\n\0"
  5640. /* ]> */
  5641. "]\0>\0\n\0"
  5642. /* <d>&j;</d> */
  5643. "<\0d\0>\0&\0j\0;\0<\0/\0d\0>\0";
  5644. ExtTest2 test_data = {/* <!ENTITY j 'baz'> */
  5645. "<\0!\0E\0N\0T\0I\0T\0Y\0 \0j\0 \0'\0b\0a\0z\0'\0>\0",
  5646. 34, NULL, NULL, EE_PARSE_NONE};
  5647. const XML_Char *expected = XCS("baz");
  5648. CharData storage;
  5649. CharData_Init(&storage);
  5650. test_data.storage = &storage;
  5651. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  5652. XML_SetExternalEntityRefHandler(g_parser, external_entity_loader2);
  5653. XML_SetUserData(g_parser, &test_data);
  5654. XML_SetCharacterDataHandler(g_parser, ext2_accumulate_characters);
  5655. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  5656. == XML_STATUS_ERROR)
  5657. xml_failure(g_parser);
  5658. CharData_CheckXMLChars(&storage, expected);
  5659. }
  5660. END_TEST
  5661. /* Test that a doctype with neither an internal nor external subset is
  5662. * faulted
  5663. */
  5664. START_TEST(test_short_doctype) {
  5665. const char *text = "<!DOCTYPE doc></doc>";
  5666. expect_failure(text, XML_ERROR_INVALID_TOKEN,
  5667. "DOCTYPE without subset not rejected");
  5668. }
  5669. END_TEST
  5670. START_TEST(test_short_doctype_2) {
  5671. const char *text = "<!DOCTYPE doc PUBLIC></doc>";
  5672. expect_failure(text, XML_ERROR_SYNTAX,
  5673. "DOCTYPE without Public ID not rejected");
  5674. }
  5675. END_TEST
  5676. START_TEST(test_short_doctype_3) {
  5677. const char *text = "<!DOCTYPE doc SYSTEM></doc>";
  5678. expect_failure(text, XML_ERROR_SYNTAX,
  5679. "DOCTYPE without System ID not rejected");
  5680. }
  5681. END_TEST
  5682. START_TEST(test_long_doctype) {
  5683. const char *text = "<!DOCTYPE doc PUBLIC 'foo' 'bar' 'baz'></doc>";
  5684. expect_failure(text, XML_ERROR_SYNTAX, "DOCTYPE with extra ID not rejected");
  5685. }
  5686. END_TEST
  5687. START_TEST(test_bad_entity) {
  5688. const char *text = "<!DOCTYPE doc [\n"
  5689. " <!ENTITY foo PUBLIC>\n"
  5690. "]>\n"
  5691. "<doc/>";
  5692. expect_failure(text, XML_ERROR_SYNTAX,
  5693. "ENTITY without Public ID is not rejected");
  5694. }
  5695. END_TEST
  5696. /* Test unquoted value is faulted */
  5697. START_TEST(test_bad_entity_2) {
  5698. const char *text = "<!DOCTYPE doc [\n"
  5699. " <!ENTITY % foo bar>\n"
  5700. "]>\n"
  5701. "<doc/>";
  5702. expect_failure(text, XML_ERROR_SYNTAX,
  5703. "ENTITY without Public ID is not rejected");
  5704. }
  5705. END_TEST
  5706. START_TEST(test_bad_entity_3) {
  5707. const char *text = "<!DOCTYPE doc [\n"
  5708. " <!ENTITY % foo PUBLIC>\n"
  5709. "]>\n"
  5710. "<doc/>";
  5711. expect_failure(text, XML_ERROR_SYNTAX,
  5712. "Parameter ENTITY without Public ID is not rejected");
  5713. }
  5714. END_TEST
  5715. START_TEST(test_bad_entity_4) {
  5716. const char *text = "<!DOCTYPE doc [\n"
  5717. " <!ENTITY % foo SYSTEM>\n"
  5718. "]>\n"
  5719. "<doc/>";
  5720. expect_failure(text, XML_ERROR_SYNTAX,
  5721. "Parameter ENTITY without Public ID is not rejected");
  5722. }
  5723. END_TEST
  5724. START_TEST(test_bad_notation) {
  5725. const char *text = "<!DOCTYPE doc [\n"
  5726. " <!NOTATION n SYSTEM>\n"
  5727. "]>\n"
  5728. "<doc/>";
  5729. expect_failure(text, XML_ERROR_SYNTAX,
  5730. "Notation without System ID is not rejected");
  5731. }
  5732. END_TEST
  5733. /* Test for issue #11, wrongly suppressed default handler */
  5734. typedef struct default_check {
  5735. const XML_Char *expected;
  5736. const int expectedLen;
  5737. XML_Bool seen;
  5738. } DefaultCheck;
  5739. static void XMLCALL
  5740. checking_default_handler(void *userData, const XML_Char *s, int len) {
  5741. DefaultCheck *data = (DefaultCheck *)userData;
  5742. int i;
  5743. for (i = 0; data[i].expected != NULL; i++) {
  5744. if (data[i].expectedLen == len
  5745. && ! memcmp(data[i].expected, s, len * sizeof(XML_Char))) {
  5746. data[i].seen = XML_TRUE;
  5747. break;
  5748. }
  5749. }
  5750. }
  5751. START_TEST(test_default_doctype_handler) {
  5752. const char *text = "<!DOCTYPE doc PUBLIC 'pubname' 'test.dtd' [\n"
  5753. " <!ENTITY foo 'bar'>\n"
  5754. "]>\n"
  5755. "<doc>&foo;</doc>";
  5756. DefaultCheck test_data[] = {{XCS("'pubname'"), 9, XML_FALSE},
  5757. {XCS("'test.dtd'"), 10, XML_FALSE},
  5758. {NULL, 0, XML_FALSE}};
  5759. int i;
  5760. XML_SetUserData(g_parser, &test_data);
  5761. XML_SetDefaultHandler(g_parser, checking_default_handler);
  5762. XML_SetEntityDeclHandler(g_parser, dummy_entity_decl_handler);
  5763. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  5764. == XML_STATUS_ERROR)
  5765. xml_failure(g_parser);
  5766. for (i = 0; test_data[i].expected != NULL; i++)
  5767. if (! test_data[i].seen)
  5768. fail("Default handler not run for public !DOCTYPE");
  5769. }
  5770. END_TEST
  5771. START_TEST(test_empty_element_abort) {
  5772. const char *text = "<abort/>";
  5773. XML_SetStartElementHandler(g_parser, start_element_suspender);
  5774. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  5775. != XML_STATUS_ERROR)
  5776. fail("Expected to error on abort");
  5777. }
  5778. END_TEST
  5779. /*
  5780. * Namespaces tests.
  5781. */
  5782. static void
  5783. namespace_setup(void) {
  5784. g_parser = XML_ParserCreateNS(NULL, XCS(' '));
  5785. if (g_parser == NULL)
  5786. fail("Parser not created.");
  5787. }
  5788. static void
  5789. namespace_teardown(void) {
  5790. basic_teardown();
  5791. }
  5792. /* Check that an element name and attribute name match the expected values.
  5793. The expected values are passed as an array reference of string pointers
  5794. provided as the userData argument; the first is the expected
  5795. element name, and the second is the expected attribute name.
  5796. */
  5797. static int triplet_start_flag = XML_FALSE;
  5798. static int triplet_end_flag = XML_FALSE;
  5799. static void XMLCALL
  5800. triplet_start_checker(void *userData, const XML_Char *name,
  5801. const XML_Char **atts) {
  5802. XML_Char **elemstr = (XML_Char **)userData;
  5803. char buffer[1024];
  5804. if (xcstrcmp(elemstr[0], name) != 0) {
  5805. sprintf(buffer, "unexpected start string: '%" XML_FMT_STR "'", name);
  5806. fail(buffer);
  5807. }
  5808. if (xcstrcmp(elemstr[1], atts[0]) != 0) {
  5809. sprintf(buffer, "unexpected attribute string: '%" XML_FMT_STR "'", atts[0]);
  5810. fail(buffer);
  5811. }
  5812. triplet_start_flag = XML_TRUE;
  5813. }
  5814. /* Check that the element name passed to the end-element handler matches
  5815. the expected value. The expected value is passed as the first element
  5816. in an array of strings passed as the userData argument.
  5817. */
  5818. static void XMLCALL
  5819. triplet_end_checker(void *userData, const XML_Char *name) {
  5820. XML_Char **elemstr = (XML_Char **)userData;
  5821. if (xcstrcmp(elemstr[0], name) != 0) {
  5822. char buffer[1024];
  5823. sprintf(buffer, "unexpected end string: '%" XML_FMT_STR "'", name);
  5824. fail(buffer);
  5825. }
  5826. triplet_end_flag = XML_TRUE;
  5827. }
  5828. START_TEST(test_return_ns_triplet) {
  5829. const char *text = "<foo:e xmlns:foo='http://example.org/' bar:a='12'\n"
  5830. " xmlns:bar='http://example.org/'>";
  5831. const char *epilog = "</foo:e>";
  5832. const XML_Char *elemstr[]
  5833. = {XCS("http://example.org/ e foo"), XCS("http://example.org/ a bar")};
  5834. XML_SetReturnNSTriplet(g_parser, XML_TRUE);
  5835. XML_SetUserData(g_parser, (void *)elemstr);
  5836. XML_SetElementHandler(g_parser, triplet_start_checker, triplet_end_checker);
  5837. XML_SetNamespaceDeclHandler(g_parser, dummy_start_namespace_decl_handler,
  5838. dummy_end_namespace_decl_handler);
  5839. triplet_start_flag = XML_FALSE;
  5840. triplet_end_flag = XML_FALSE;
  5841. dummy_handler_flags = 0;
  5842. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_FALSE)
  5843. == XML_STATUS_ERROR)
  5844. xml_failure(g_parser);
  5845. if (! triplet_start_flag)
  5846. fail("triplet_start_checker not invoked");
  5847. /* Check that unsetting "return triplets" fails while still parsing */
  5848. XML_SetReturnNSTriplet(g_parser, XML_FALSE);
  5849. if (_XML_Parse_SINGLE_BYTES(g_parser, epilog, (int)strlen(epilog), XML_TRUE)
  5850. == XML_STATUS_ERROR)
  5851. xml_failure(g_parser);
  5852. if (! triplet_end_flag)
  5853. fail("triplet_end_checker not invoked");
  5854. if (dummy_handler_flags
  5855. != (DUMMY_START_NS_DECL_HANDLER_FLAG | DUMMY_END_NS_DECL_HANDLER_FLAG))
  5856. fail("Namespace handlers not called");
  5857. }
  5858. END_TEST
  5859. static void XMLCALL
  5860. overwrite_start_checker(void *userData, const XML_Char *name,
  5861. const XML_Char **atts) {
  5862. CharData *storage = (CharData *)userData;
  5863. CharData_AppendXMLChars(storage, XCS("start "), 6);
  5864. CharData_AppendXMLChars(storage, name, -1);
  5865. while (*atts != NULL) {
  5866. CharData_AppendXMLChars(storage, XCS("\nattribute "), 11);
  5867. CharData_AppendXMLChars(storage, *atts, -1);
  5868. atts += 2;
  5869. }
  5870. CharData_AppendXMLChars(storage, XCS("\n"), 1);
  5871. }
  5872. static void XMLCALL
  5873. overwrite_end_checker(void *userData, const XML_Char *name) {
  5874. CharData *storage = (CharData *)userData;
  5875. CharData_AppendXMLChars(storage, XCS("end "), 4);
  5876. CharData_AppendXMLChars(storage, name, -1);
  5877. CharData_AppendXMLChars(storage, XCS("\n"), 1);
  5878. }
  5879. static void
  5880. run_ns_tagname_overwrite_test(const char *text, const XML_Char *result) {
  5881. CharData storage;
  5882. CharData_Init(&storage);
  5883. XML_SetUserData(g_parser, &storage);
  5884. XML_SetElementHandler(g_parser, overwrite_start_checker,
  5885. overwrite_end_checker);
  5886. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  5887. == XML_STATUS_ERROR)
  5888. xml_failure(g_parser);
  5889. CharData_CheckXMLChars(&storage, result);
  5890. }
  5891. /* Regression test for SF bug #566334. */
  5892. START_TEST(test_ns_tagname_overwrite) {
  5893. const char *text = "<n:e xmlns:n='http://example.org/'>\n"
  5894. " <n:f n:attr='foo'/>\n"
  5895. " <n:g n:attr2='bar'/>\n"
  5896. "</n:e>";
  5897. const XML_Char *result = XCS("start http://example.org/ e\n")
  5898. XCS("start http://example.org/ f\n")
  5899. XCS("attribute http://example.org/ attr\n")
  5900. XCS("end http://example.org/ f\n")
  5901. XCS("start http://example.org/ g\n")
  5902. XCS("attribute http://example.org/ attr2\n")
  5903. XCS("end http://example.org/ g\n")
  5904. XCS("end http://example.org/ e\n");
  5905. run_ns_tagname_overwrite_test(text, result);
  5906. }
  5907. END_TEST
  5908. /* Regression test for SF bug #566334. */
  5909. START_TEST(test_ns_tagname_overwrite_triplet) {
  5910. const char *text = "<n:e xmlns:n='http://example.org/'>\n"
  5911. " <n:f n:attr='foo'/>\n"
  5912. " <n:g n:attr2='bar'/>\n"
  5913. "</n:e>";
  5914. const XML_Char *result = XCS("start http://example.org/ e n\n")
  5915. XCS("start http://example.org/ f n\n")
  5916. XCS("attribute http://example.org/ attr n\n")
  5917. XCS("end http://example.org/ f n\n")
  5918. XCS("start http://example.org/ g n\n")
  5919. XCS("attribute http://example.org/ attr2 n\n")
  5920. XCS("end http://example.org/ g n\n")
  5921. XCS("end http://example.org/ e n\n");
  5922. XML_SetReturnNSTriplet(g_parser, XML_TRUE);
  5923. run_ns_tagname_overwrite_test(text, result);
  5924. }
  5925. END_TEST
  5926. /* Regression test for SF bug #620343. */
  5927. static void XMLCALL
  5928. start_element_fail(void *userData, const XML_Char *name,
  5929. const XML_Char **atts) {
  5930. UNUSED_P(userData);
  5931. UNUSED_P(name);
  5932. UNUSED_P(atts);
  5933. /* We should never get here. */
  5934. fail("should never reach start_element_fail()");
  5935. }
  5936. static void XMLCALL
  5937. start_ns_clearing_start_element(void *userData, const XML_Char *prefix,
  5938. const XML_Char *uri) {
  5939. UNUSED_P(prefix);
  5940. UNUSED_P(uri);
  5941. XML_SetStartElementHandler((XML_Parser)userData, NULL);
  5942. }
  5943. START_TEST(test_start_ns_clears_start_element) {
  5944. /* This needs to use separate start/end tags; using the empty tag
  5945. syntax doesn't cause the problematic path through Expat to be
  5946. taken.
  5947. */
  5948. const char *text = "<e xmlns='http://example.org/'></e>";
  5949. XML_SetStartElementHandler(g_parser, start_element_fail);
  5950. XML_SetStartNamespaceDeclHandler(g_parser, start_ns_clearing_start_element);
  5951. XML_SetEndNamespaceDeclHandler(g_parser, dummy_end_namespace_decl_handler);
  5952. XML_UseParserAsHandlerArg(g_parser);
  5953. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  5954. == XML_STATUS_ERROR)
  5955. xml_failure(g_parser);
  5956. }
  5957. END_TEST
  5958. /* Regression test for SF bug #616863. */
  5959. static int XMLCALL
  5960. external_entity_handler(XML_Parser parser, const XML_Char *context,
  5961. const XML_Char *base, const XML_Char *systemId,
  5962. const XML_Char *publicId) {
  5963. intptr_t callno = 1 + (intptr_t)XML_GetUserData(parser);
  5964. const char *text;
  5965. XML_Parser p2;
  5966. UNUSED_P(base);
  5967. UNUSED_P(systemId);
  5968. UNUSED_P(publicId);
  5969. if (callno == 1)
  5970. text = ("<!ELEMENT doc (e+)>\n"
  5971. "<!ATTLIST doc xmlns CDATA #IMPLIED>\n"
  5972. "<!ELEMENT e EMPTY>\n");
  5973. else
  5974. text = ("<?xml version='1.0' encoding='us-ascii'?>"
  5975. "<e/>");
  5976. XML_SetUserData(parser, (void *)callno);
  5977. p2 = XML_ExternalEntityParserCreate(parser, context, NULL);
  5978. if (_XML_Parse_SINGLE_BYTES(p2, text, (int)strlen(text), XML_TRUE)
  5979. == XML_STATUS_ERROR) {
  5980. xml_failure(p2);
  5981. return XML_STATUS_ERROR;
  5982. }
  5983. XML_ParserFree(p2);
  5984. return XML_STATUS_OK;
  5985. }
  5986. START_TEST(test_default_ns_from_ext_subset_and_ext_ge) {
  5987. const char *text = "<?xml version='1.0'?>\n"
  5988. "<!DOCTYPE doc SYSTEM 'http://example.org/doc.dtd' [\n"
  5989. " <!ENTITY en SYSTEM 'http://example.org/entity.ent'>\n"
  5990. "]>\n"
  5991. "<doc xmlns='http://example.org/ns1'>\n"
  5992. "&en;\n"
  5993. "</doc>";
  5994. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  5995. XML_SetExternalEntityRefHandler(g_parser, external_entity_handler);
  5996. /* We actually need to set this handler to tickle this bug. */
  5997. XML_SetStartElementHandler(g_parser, dummy_start_element);
  5998. XML_SetUserData(g_parser, NULL);
  5999. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  6000. == XML_STATUS_ERROR)
  6001. xml_failure(g_parser);
  6002. }
  6003. END_TEST
  6004. /* Regression test #1 for SF bug #673791. */
  6005. START_TEST(test_ns_prefix_with_empty_uri_1) {
  6006. const char *text = "<doc xmlns:prefix='http://example.org/'>\n"
  6007. " <e xmlns:prefix=''/>\n"
  6008. "</doc>";
  6009. expect_failure(text, XML_ERROR_UNDECLARING_PREFIX,
  6010. "Did not report re-setting namespace"
  6011. " URI with prefix to ''.");
  6012. }
  6013. END_TEST
  6014. /* Regression test #2 for SF bug #673791. */
  6015. START_TEST(test_ns_prefix_with_empty_uri_2) {
  6016. const char *text = "<?xml version='1.0'?>\n"
  6017. "<docelem xmlns:pre=''/>";
  6018. expect_failure(text, XML_ERROR_UNDECLARING_PREFIX,
  6019. "Did not report setting namespace URI with prefix to ''.");
  6020. }
  6021. END_TEST
  6022. /* Regression test #3 for SF bug #673791. */
  6023. START_TEST(test_ns_prefix_with_empty_uri_3) {
  6024. const char *text = "<!DOCTYPE doc [\n"
  6025. " <!ELEMENT doc EMPTY>\n"
  6026. " <!ATTLIST doc\n"
  6027. " xmlns:prefix CDATA ''>\n"
  6028. "]>\n"
  6029. "<doc/>";
  6030. expect_failure(text, XML_ERROR_UNDECLARING_PREFIX,
  6031. "Didn't report attr default setting NS w/ prefix to ''.");
  6032. }
  6033. END_TEST
  6034. /* Regression test #4 for SF bug #673791. */
  6035. START_TEST(test_ns_prefix_with_empty_uri_4) {
  6036. const char *text = "<!DOCTYPE doc [\n"
  6037. " <!ELEMENT prefix:doc EMPTY>\n"
  6038. " <!ATTLIST prefix:doc\n"
  6039. " xmlns:prefix CDATA 'http://example.org/'>\n"
  6040. "]>\n"
  6041. "<prefix:doc/>";
  6042. /* Packaged info expected by the end element handler;
  6043. the weird structuring lets us re-use the triplet_end_checker()
  6044. function also used for another test. */
  6045. const XML_Char *elemstr[] = {XCS("http://example.org/ doc prefix")};
  6046. XML_SetReturnNSTriplet(g_parser, XML_TRUE);
  6047. XML_SetUserData(g_parser, (void *)elemstr);
  6048. XML_SetEndElementHandler(g_parser, triplet_end_checker);
  6049. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  6050. == XML_STATUS_ERROR)
  6051. xml_failure(g_parser);
  6052. }
  6053. END_TEST
  6054. /* Test with non-xmlns prefix */
  6055. START_TEST(test_ns_unbound_prefix) {
  6056. const char *text = "<!DOCTYPE doc [\n"
  6057. " <!ELEMENT prefix:doc EMPTY>\n"
  6058. " <!ATTLIST prefix:doc\n"
  6059. " notxmlns:prefix CDATA 'http://example.org/'>\n"
  6060. "]>\n"
  6061. "<prefix:doc/>";
  6062. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  6063. != XML_STATUS_ERROR)
  6064. fail("Unbound prefix incorrectly passed");
  6065. if (XML_GetErrorCode(g_parser) != XML_ERROR_UNBOUND_PREFIX)
  6066. xml_failure(g_parser);
  6067. }
  6068. END_TEST
  6069. START_TEST(test_ns_default_with_empty_uri) {
  6070. const char *text = "<doc xmlns='http://example.org/'>\n"
  6071. " <e xmlns=''/>\n"
  6072. "</doc>";
  6073. /* Add some handlers to exercise extra code paths */
  6074. XML_SetStartNamespaceDeclHandler(g_parser,
  6075. dummy_start_namespace_decl_handler);
  6076. XML_SetEndNamespaceDeclHandler(g_parser, dummy_end_namespace_decl_handler);
  6077. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  6078. == XML_STATUS_ERROR)
  6079. xml_failure(g_parser);
  6080. }
  6081. END_TEST
  6082. /* Regression test for SF bug #692964: two prefixes for one namespace. */
  6083. START_TEST(test_ns_duplicate_attrs_diff_prefixes) {
  6084. const char *text = "<doc xmlns:a='http://example.org/a'\n"
  6085. " xmlns:b='http://example.org/a'\n"
  6086. " a:a='v' b:a='v' />";
  6087. expect_failure(text, XML_ERROR_DUPLICATE_ATTRIBUTE,
  6088. "did not report multiple attributes with same URI+name");
  6089. }
  6090. END_TEST
  6091. START_TEST(test_ns_duplicate_hashes) {
  6092. /* The hash of an attribute is calculated as the hash of its URI
  6093. * concatenated with a space followed by its name (after the
  6094. * colon). We wish to generate attributes with the same hash
  6095. * value modulo the attribute table size so that we can check that
  6096. * the attribute hash table works correctly. The attribute hash
  6097. * table size will be the smallest power of two greater than the
  6098. * number of attributes, but at least eight. There is
  6099. * unfortunately no programmatic way of getting the hash or the
  6100. * table size at user level, but the test code coverage percentage
  6101. * will drop if the hashes cease to point to the same row.
  6102. *
  6103. * The cunning plan is to have few enough attributes to have a
  6104. * reliable table size of 8, and have the single letter attribute
  6105. * names be 8 characters apart, producing a hash which will be the
  6106. * same modulo 8.
  6107. */
  6108. const char *text = "<doc xmlns:a='http://example.org/a'\n"
  6109. " a:a='v' a:i='w' />";
  6110. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  6111. == XML_STATUS_ERROR)
  6112. xml_failure(g_parser);
  6113. }
  6114. END_TEST
  6115. /* Regression test for SF bug #695401: unbound prefix. */
  6116. START_TEST(test_ns_unbound_prefix_on_attribute) {
  6117. const char *text = "<doc a:attr=''/>";
  6118. expect_failure(text, XML_ERROR_UNBOUND_PREFIX,
  6119. "did not report unbound prefix on attribute");
  6120. }
  6121. END_TEST
  6122. /* Regression test for SF bug #695401: unbound prefix. */
  6123. START_TEST(test_ns_unbound_prefix_on_element) {
  6124. const char *text = "<a:doc/>";
  6125. expect_failure(text, XML_ERROR_UNBOUND_PREFIX,
  6126. "did not report unbound prefix on element");
  6127. }
  6128. END_TEST
  6129. /* Test that the parsing status is correctly reset by XML_ParserReset().
  6130. * We usE test_return_ns_triplet() for our example parse to improve
  6131. * coverage of tidying up code executed.
  6132. */
  6133. START_TEST(test_ns_parser_reset) {
  6134. XML_ParsingStatus status;
  6135. XML_GetParsingStatus(g_parser, &status);
  6136. if (status.parsing != XML_INITIALIZED)
  6137. fail("parsing status doesn't start INITIALIZED");
  6138. test_return_ns_triplet();
  6139. XML_GetParsingStatus(g_parser, &status);
  6140. if (status.parsing != XML_FINISHED)
  6141. fail("parsing status doesn't end FINISHED");
  6142. XML_ParserReset(g_parser, NULL);
  6143. XML_GetParsingStatus(g_parser, &status);
  6144. if (status.parsing != XML_INITIALIZED)
  6145. fail("parsing status doesn't reset to INITIALIZED");
  6146. }
  6147. END_TEST
  6148. /* Test that long element names with namespaces are handled correctly */
  6149. START_TEST(test_ns_long_element) {
  6150. const char *text
  6151. = "<foo:thisisalongenoughelementnametotriggerareallocation\n"
  6152. " xmlns:foo='http://example.org/' bar:a='12'\n"
  6153. " xmlns:bar='http://example.org/'>"
  6154. "</foo:thisisalongenoughelementnametotriggerareallocation>";
  6155. const XML_Char *elemstr[]
  6156. = {XCS("http://example.org/")
  6157. XCS(" thisisalongenoughelementnametotriggerareallocation foo"),
  6158. XCS("http://example.org/ a bar")};
  6159. XML_SetReturnNSTriplet(g_parser, XML_TRUE);
  6160. XML_SetUserData(g_parser, (void *)elemstr);
  6161. XML_SetElementHandler(g_parser, triplet_start_checker, triplet_end_checker);
  6162. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  6163. == XML_STATUS_ERROR)
  6164. xml_failure(g_parser);
  6165. }
  6166. END_TEST
  6167. /* Test mixed population of prefixed and unprefixed attributes */
  6168. START_TEST(test_ns_mixed_prefix_atts) {
  6169. const char *text = "<e a='12' bar:b='13'\n"
  6170. " xmlns:bar='http://example.org/'>"
  6171. "</e>";
  6172. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  6173. == XML_STATUS_ERROR)
  6174. xml_failure(g_parser);
  6175. }
  6176. END_TEST
  6177. /* Test having a long namespaced element name inside a short one.
  6178. * This exercises some internal buffer reallocation that is shared
  6179. * across elements with the same namespace URI.
  6180. */
  6181. START_TEST(test_ns_extend_uri_buffer) {
  6182. const char *text = "<foo:e xmlns:foo='http://example.org/'>"
  6183. " <foo:thisisalongenoughnametotriggerallocationaction"
  6184. " foo:a='12' />"
  6185. "</foo:e>";
  6186. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  6187. == XML_STATUS_ERROR)
  6188. xml_failure(g_parser);
  6189. }
  6190. END_TEST
  6191. /* Test that xmlns is correctly rejected as an attribute in the xmlns
  6192. * namespace, but not in other namespaces
  6193. */
  6194. START_TEST(test_ns_reserved_attributes) {
  6195. const char *text1
  6196. = "<foo:e xmlns:foo='http://example.org/' xmlns:xmlns='12' />";
  6197. const char *text2
  6198. = "<foo:e xmlns:foo='http://example.org/' foo:xmlns='12' />";
  6199. expect_failure(text1, XML_ERROR_RESERVED_PREFIX_XMLNS,
  6200. "xmlns not rejected as an attribute");
  6201. XML_ParserReset(g_parser, NULL);
  6202. if (_XML_Parse_SINGLE_BYTES(g_parser, text2, (int)strlen(text2), XML_TRUE)
  6203. == XML_STATUS_ERROR)
  6204. xml_failure(g_parser);
  6205. }
  6206. END_TEST
  6207. /* Test more reserved attributes */
  6208. START_TEST(test_ns_reserved_attributes_2) {
  6209. const char *text1 = "<foo:e xmlns:foo='http://example.org/'"
  6210. " xmlns:xml='http://example.org/' />";
  6211. const char *text2
  6212. = "<foo:e xmlns:foo='http://www.w3.org/XML/1998/namespace' />";
  6213. const char *text3 = "<foo:e xmlns:foo='http://www.w3.org/2000/xmlns/' />";
  6214. expect_failure(text1, XML_ERROR_RESERVED_PREFIX_XML,
  6215. "xml not rejected as an attribute");
  6216. XML_ParserReset(g_parser, NULL);
  6217. expect_failure(text2, XML_ERROR_RESERVED_NAMESPACE_URI,
  6218. "Use of w3.org URL not faulted");
  6219. XML_ParserReset(g_parser, NULL);
  6220. expect_failure(text3, XML_ERROR_RESERVED_NAMESPACE_URI,
  6221. "Use of w3.org xmlns URL not faulted");
  6222. }
  6223. END_TEST
  6224. /* Test string pool handling of namespace names of 2048 characters */
  6225. /* Exercises a particular string pool growth path */
  6226. START_TEST(test_ns_extremely_long_prefix) {
  6227. /* C99 compilers are only required to support 4095-character
  6228. * strings, so the following needs to be split in two to be safe
  6229. * for all compilers.
  6230. */
  6231. const char *text1
  6232. = "<doc "
  6233. /* 64 character on each line */
  6234. /* ...gives a total length of 2048 */
  6235. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6236. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6237. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6238. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6239. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6240. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6241. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6242. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6243. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6244. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6245. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6246. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6247. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6248. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6249. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6250. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6251. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6252. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6253. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6254. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6255. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6256. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6257. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6258. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6259. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6260. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6261. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6262. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6263. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6264. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6265. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6266. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6267. ":a='12'";
  6268. const char *text2
  6269. = " xmlns:"
  6270. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6271. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6272. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6273. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6274. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6275. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6276. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6277. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6278. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6279. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6280. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6281. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6282. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6283. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6284. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6285. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6286. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6287. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6288. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6289. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6290. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6291. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6292. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6293. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6294. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6295. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6296. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6297. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6298. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6299. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6300. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6301. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6302. "='foo'\n>"
  6303. "</doc>";
  6304. if (_XML_Parse_SINGLE_BYTES(g_parser, text1, (int)strlen(text1), XML_FALSE)
  6305. == XML_STATUS_ERROR)
  6306. xml_failure(g_parser);
  6307. if (_XML_Parse_SINGLE_BYTES(g_parser, text2, (int)strlen(text2), XML_TRUE)
  6308. == XML_STATUS_ERROR)
  6309. xml_failure(g_parser);
  6310. }
  6311. END_TEST
  6312. /* Test unknown encoding handlers in namespace setup */
  6313. START_TEST(test_ns_unknown_encoding_success) {
  6314. const char *text = "<?xml version='1.0' encoding='prefix-conv'?>\n"
  6315. "<foo:e xmlns:foo='http://example.org/'>Hi</foo:e>";
  6316. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  6317. run_character_check(text, XCS("Hi"));
  6318. }
  6319. END_TEST
  6320. /* Test that too many colons are rejected */
  6321. START_TEST(test_ns_double_colon) {
  6322. const char *text = "<foo:e xmlns:foo='http://example.org/' foo:a:b='bar' />";
  6323. const enum XML_Status status
  6324. = _XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE);
  6325. #ifdef XML_NS
  6326. if ((status == XML_STATUS_OK)
  6327. || (XML_GetErrorCode(g_parser) != XML_ERROR_INVALID_TOKEN)) {
  6328. fail("Double colon in attribute name not faulted"
  6329. " (despite active namespace support)");
  6330. }
  6331. #else
  6332. if (status != XML_STATUS_OK) {
  6333. fail("Double colon in attribute name faulted"
  6334. " (despite inactive namespace support");
  6335. }
  6336. #endif
  6337. }
  6338. END_TEST
  6339. START_TEST(test_ns_double_colon_element) {
  6340. const char *text = "<foo:bar:e xmlns:foo='http://example.org/' />";
  6341. const enum XML_Status status
  6342. = _XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE);
  6343. #ifdef XML_NS
  6344. if ((status == XML_STATUS_OK)
  6345. || (XML_GetErrorCode(g_parser) != XML_ERROR_INVALID_TOKEN)) {
  6346. fail("Double colon in element name not faulted"
  6347. " (despite active namespace support)");
  6348. }
  6349. #else
  6350. if (status != XML_STATUS_OK) {
  6351. fail("Double colon in element name faulted"
  6352. " (despite inactive namespace support");
  6353. }
  6354. #endif
  6355. }
  6356. END_TEST
  6357. /* Test that non-name characters after a colon are rejected */
  6358. START_TEST(test_ns_bad_attr_leafname) {
  6359. const char *text = "<foo:e xmlns:foo='http://example.org/' foo:?ar='baz' />";
  6360. expect_failure(text, XML_ERROR_INVALID_TOKEN,
  6361. "Invalid character in leafname not faulted");
  6362. }
  6363. END_TEST
  6364. START_TEST(test_ns_bad_element_leafname) {
  6365. const char *text = "<foo:?oc xmlns:foo='http://example.org/' />";
  6366. expect_failure(text, XML_ERROR_INVALID_TOKEN,
  6367. "Invalid character in element leafname not faulted");
  6368. }
  6369. END_TEST
  6370. /* Test high-byte-set UTF-16 characters are valid in a leafname */
  6371. START_TEST(test_ns_utf16_leafname) {
  6372. const char text[] =
  6373. /* <n:e xmlns:n='URI' n:{KHO KHWAI}='a' />
  6374. * where {KHO KHWAI} = U+0E04 = 0xe0 0xb8 0x84 in UTF-8
  6375. */
  6376. "<\0n\0:\0e\0 \0x\0m\0l\0n\0s\0:\0n\0=\0'\0U\0R\0I\0'\0 \0"
  6377. "n\0:\0\x04\x0e=\0'\0a\0'\0 \0/\0>\0";
  6378. const XML_Char *expected = XCS("a");
  6379. CharData storage;
  6380. CharData_Init(&storage);
  6381. XML_SetStartElementHandler(g_parser, accumulate_attribute);
  6382. XML_SetUserData(g_parser, &storage);
  6383. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  6384. == XML_STATUS_ERROR)
  6385. xml_failure(g_parser);
  6386. CharData_CheckXMLChars(&storage, expected);
  6387. }
  6388. END_TEST
  6389. START_TEST(test_ns_utf16_element_leafname) {
  6390. const char text[] =
  6391. /* <n:{KHO KHWAI} xmlns:n='URI'/>
  6392. * where {KHO KHWAI} = U+0E04 = 0xe0 0xb8 0x84 in UTF-8
  6393. */
  6394. "\0<\0n\0:\x0e\x04\0 \0x\0m\0l\0n\0s\0:\0n\0=\0'\0U\0R\0I\0'\0/\0>";
  6395. #ifdef XML_UNICODE
  6396. const XML_Char *expected = XCS("URI \x0e04");
  6397. #else
  6398. const XML_Char *expected = XCS("URI \xe0\xb8\x84");
  6399. #endif
  6400. CharData storage;
  6401. CharData_Init(&storage);
  6402. XML_SetStartElementHandler(g_parser, start_element_event_handler);
  6403. XML_SetUserData(g_parser, &storage);
  6404. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  6405. == XML_STATUS_ERROR)
  6406. xml_failure(g_parser);
  6407. CharData_CheckXMLChars(&storage, expected);
  6408. }
  6409. END_TEST
  6410. START_TEST(test_ns_utf16_doctype) {
  6411. const char text[] =
  6412. /* <!DOCTYPE foo:{KHO KHWAI} [ <!ENTITY bar 'baz'> ]>\n
  6413. * where {KHO KHWAI} = U+0E04 = 0xe0 0xb8 0x84 in UTF-8
  6414. */
  6415. "\0<\0!\0D\0O\0C\0T\0Y\0P\0E\0 \0f\0o\0o\0:\x0e\x04\0 "
  6416. "\0[\0 \0<\0!\0E\0N\0T\0I\0T\0Y\0 \0b\0a\0r\0 \0'\0b\0a\0z\0'\0>\0 "
  6417. "\0]\0>\0\n"
  6418. /* <foo:{KHO KHWAI} xmlns:foo='URI'>&bar;</foo:{KHO KHWAI}> */
  6419. "\0<\0f\0o\0o\0:\x0e\x04\0 "
  6420. "\0x\0m\0l\0n\0s\0:\0f\0o\0o\0=\0'\0U\0R\0I\0'\0>"
  6421. "\0&\0b\0a\0r\0;"
  6422. "\0<\0/\0f\0o\0o\0:\x0e\x04\0>";
  6423. #ifdef XML_UNICODE
  6424. const XML_Char *expected = XCS("URI \x0e04");
  6425. #else
  6426. const XML_Char *expected = XCS("URI \xe0\xb8\x84");
  6427. #endif
  6428. CharData storage;
  6429. CharData_Init(&storage);
  6430. XML_SetUserData(g_parser, &storage);
  6431. XML_SetStartElementHandler(g_parser, start_element_event_handler);
  6432. XML_SetUnknownEncodingHandler(g_parser, MiscEncodingHandler, NULL);
  6433. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  6434. == XML_STATUS_ERROR)
  6435. xml_failure(g_parser);
  6436. CharData_CheckXMLChars(&storage, expected);
  6437. }
  6438. END_TEST
  6439. START_TEST(test_ns_invalid_doctype) {
  6440. const char *text = "<!DOCTYPE foo:!bad [ <!ENTITY bar 'baz' ]>\n"
  6441. "<foo:!bad>&bar;</foo:!bad>";
  6442. expect_failure(text, XML_ERROR_INVALID_TOKEN,
  6443. "Invalid character in document local name not faulted");
  6444. }
  6445. END_TEST
  6446. START_TEST(test_ns_double_colon_doctype) {
  6447. const char *text = "<!DOCTYPE foo:a:doc [ <!ENTITY bar 'baz' ]>\n"
  6448. "<foo:a:doc>&bar;</foo:a:doc>";
  6449. expect_failure(text, XML_ERROR_SYNTAX,
  6450. "Double colon in document name not faulted");
  6451. }
  6452. END_TEST
  6453. /* Control variable; the number of times duff_allocator() will successfully
  6454. * allocate */
  6455. #define ALLOC_ALWAYS_SUCCEED (-1)
  6456. #define REALLOC_ALWAYS_SUCCEED (-1)
  6457. static intptr_t allocation_count = ALLOC_ALWAYS_SUCCEED;
  6458. static intptr_t reallocation_count = REALLOC_ALWAYS_SUCCEED;
  6459. /* Crocked allocator for allocation failure tests */
  6460. static void *
  6461. duff_allocator(size_t size) {
  6462. if (allocation_count == 0)
  6463. return NULL;
  6464. if (allocation_count != ALLOC_ALWAYS_SUCCEED)
  6465. allocation_count--;
  6466. return malloc(size);
  6467. }
  6468. /* Crocked reallocator for allocation failure tests */
  6469. static void *
  6470. duff_reallocator(void *ptr, size_t size) {
  6471. if (reallocation_count == 0)
  6472. return NULL;
  6473. if (reallocation_count != REALLOC_ALWAYS_SUCCEED)
  6474. reallocation_count--;
  6475. return realloc(ptr, size);
  6476. }
  6477. /* Test that a failure to allocate the parser structure fails gracefully */
  6478. START_TEST(test_misc_alloc_create_parser) {
  6479. XML_Memory_Handling_Suite memsuite = {duff_allocator, realloc, free};
  6480. unsigned int i;
  6481. const unsigned int max_alloc_count = 10;
  6482. /* Something this simple shouldn't need more than 10 allocations */
  6483. for (i = 0; i < max_alloc_count; i++) {
  6484. allocation_count = i;
  6485. g_parser = XML_ParserCreate_MM(NULL, &memsuite, NULL);
  6486. if (g_parser != NULL)
  6487. break;
  6488. }
  6489. if (i == 0)
  6490. fail("Parser unexpectedly ignored failing allocator");
  6491. else if (i == max_alloc_count)
  6492. fail("Parser not created with max allocation count");
  6493. }
  6494. END_TEST
  6495. /* Test memory allocation failures for a parser with an encoding */
  6496. START_TEST(test_misc_alloc_create_parser_with_encoding) {
  6497. XML_Memory_Handling_Suite memsuite = {duff_allocator, realloc, free};
  6498. unsigned int i;
  6499. const unsigned int max_alloc_count = 10;
  6500. /* Try several levels of allocation */
  6501. for (i = 0; i < max_alloc_count; i++) {
  6502. allocation_count = i;
  6503. g_parser = XML_ParserCreate_MM(XCS("us-ascii"), &memsuite, NULL);
  6504. if (g_parser != NULL)
  6505. break;
  6506. }
  6507. if (i == 0)
  6508. fail("Parser ignored failing allocator");
  6509. else if (i == max_alloc_count)
  6510. fail("Parser not created with max allocation count");
  6511. }
  6512. END_TEST
  6513. /* Test that freeing a NULL parser doesn't cause an explosion.
  6514. * (Not actually tested anywhere else)
  6515. */
  6516. START_TEST(test_misc_null_parser) {
  6517. XML_ParserFree(NULL);
  6518. }
  6519. END_TEST
  6520. /* Test that XML_ErrorString rejects out-of-range codes */
  6521. START_TEST(test_misc_error_string) {
  6522. if (XML_ErrorString((enum XML_Error) - 1) != NULL)
  6523. fail("Negative error code not rejected");
  6524. if (XML_ErrorString((enum XML_Error)100) != NULL)
  6525. fail("Large error code not rejected");
  6526. }
  6527. END_TEST
  6528. /* Test the version information is consistent */
  6529. /* Since we are working in XML_LChars (potentially 16-bits), we
  6530. * can't use the standard C library functions for character
  6531. * manipulation and have to roll our own.
  6532. */
  6533. static int
  6534. parse_version(const XML_LChar *version_text,
  6535. XML_Expat_Version *version_struct) {
  6536. if (! version_text)
  6537. return XML_FALSE;
  6538. while (*version_text != 0x00) {
  6539. if (*version_text >= ASCII_0 && *version_text <= ASCII_9)
  6540. break;
  6541. version_text++;
  6542. }
  6543. if (*version_text == 0x00)
  6544. return XML_FALSE;
  6545. /* version_struct->major = strtoul(version_text, 10, &version_text) */
  6546. version_struct->major = 0;
  6547. while (*version_text >= ASCII_0 && *version_text <= ASCII_9) {
  6548. version_struct->major
  6549. = 10 * version_struct->major + (*version_text++ - ASCII_0);
  6550. }
  6551. if (*version_text++ != ASCII_PERIOD)
  6552. return XML_FALSE;
  6553. /* Now for the minor version number */
  6554. version_struct->minor = 0;
  6555. while (*version_text >= ASCII_0 && *version_text <= ASCII_9) {
  6556. version_struct->minor
  6557. = 10 * version_struct->minor + (*version_text++ - ASCII_0);
  6558. }
  6559. if (*version_text++ != ASCII_PERIOD)
  6560. return XML_FALSE;
  6561. /* Finally the micro version number */
  6562. version_struct->micro = 0;
  6563. while (*version_text >= ASCII_0 && *version_text <= ASCII_9) {
  6564. version_struct->micro
  6565. = 10 * version_struct->micro + (*version_text++ - ASCII_0);
  6566. }
  6567. if (*version_text != 0x00)
  6568. return XML_FALSE;
  6569. return XML_TRUE;
  6570. }
  6571. static int
  6572. versions_equal(const XML_Expat_Version *first,
  6573. const XML_Expat_Version *second) {
  6574. return (first->major == second->major && first->minor == second->minor
  6575. && first->micro == second->micro);
  6576. }
  6577. START_TEST(test_misc_version) {
  6578. XML_Expat_Version read_version = XML_ExpatVersionInfo();
  6579. /* Silence compiler warning with the following assignment */
  6580. XML_Expat_Version parsed_version = {0, 0, 0};
  6581. const XML_LChar *version_text = XML_ExpatVersion();
  6582. if (version_text == NULL)
  6583. fail("Could not obtain version text");
  6584. assert(version_text != NULL);
  6585. if (! parse_version(version_text, &parsed_version))
  6586. fail("Unable to parse version text");
  6587. if (! versions_equal(&read_version, &parsed_version))
  6588. fail("Version mismatch");
  6589. #if ! defined(XML_UNICODE) || defined(XML_UNICODE_WCHAR_T)
  6590. if (xcstrcmp(version_text, XCS("expat_2.4.3"))) /* needs bump on releases */
  6591. fail("XML_*_VERSION in expat.h out of sync?\n");
  6592. #else
  6593. /* If we have XML_UNICODE defined but not XML_UNICODE_WCHAR_T
  6594. * then XML_LChar is defined as char, for some reason.
  6595. */
  6596. if (strcmp(version_text, "expat_2.2.5")) /* needs bump on releases */
  6597. fail("XML_*_VERSION in expat.h out of sync?\n");
  6598. #endif /* ! defined(XML_UNICODE) || defined(XML_UNICODE_WCHAR_T) */
  6599. }
  6600. END_TEST
  6601. /* Test feature information */
  6602. START_TEST(test_misc_features) {
  6603. const XML_Feature *features = XML_GetFeatureList();
  6604. /* Prevent problems with double-freeing parsers */
  6605. g_parser = NULL;
  6606. if (features == NULL) {
  6607. fail("Failed to get feature information");
  6608. } else {
  6609. /* Loop through the features checking what we can */
  6610. while (features->feature != XML_FEATURE_END) {
  6611. switch (features->feature) {
  6612. case XML_FEATURE_SIZEOF_XML_CHAR:
  6613. if (features->value != sizeof(XML_Char))
  6614. fail("Incorrect size of XML_Char");
  6615. break;
  6616. case XML_FEATURE_SIZEOF_XML_LCHAR:
  6617. if (features->value != sizeof(XML_LChar))
  6618. fail("Incorrect size of XML_LChar");
  6619. break;
  6620. default:
  6621. break;
  6622. }
  6623. features++;
  6624. }
  6625. }
  6626. }
  6627. END_TEST
  6628. /* Regression test for GitHub Issue #17: memory leak parsing attribute
  6629. * values with mixed bound and unbound namespaces.
  6630. */
  6631. START_TEST(test_misc_attribute_leak) {
  6632. const char *text = "<D xmlns:L=\"D\" l:a='' L:a=''/>";
  6633. XML_Memory_Handling_Suite memsuite
  6634. = {tracking_malloc, tracking_realloc, tracking_free};
  6635. g_parser = XML_ParserCreate_MM(XCS("UTF-8"), &memsuite, XCS("\n"));
  6636. expect_failure(text, XML_ERROR_UNBOUND_PREFIX, "Unbound prefixes not found");
  6637. XML_ParserFree(g_parser);
  6638. /* Prevent the teardown trying to double free */
  6639. g_parser = NULL;
  6640. if (! tracking_report())
  6641. fail("Memory leak found");
  6642. }
  6643. END_TEST
  6644. /* Test parser created for UTF-16LE is successful */
  6645. START_TEST(test_misc_utf16le) {
  6646. const char text[] =
  6647. /* <?xml version='1.0'?><q>Hi</q> */
  6648. "<\0?\0x\0m\0l\0 \0"
  6649. "v\0e\0r\0s\0i\0o\0n\0=\0'\0\x31\0.\0\x30\0'\0?\0>\0"
  6650. "<\0q\0>\0H\0i\0<\0/\0q\0>\0";
  6651. const XML_Char *expected = XCS("Hi");
  6652. CharData storage;
  6653. g_parser = XML_ParserCreate(XCS("UTF-16LE"));
  6654. if (g_parser == NULL)
  6655. fail("Parser not created");
  6656. CharData_Init(&storage);
  6657. XML_SetUserData(g_parser, &storage);
  6658. XML_SetCharacterDataHandler(g_parser, accumulate_characters);
  6659. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)sizeof(text) - 1, XML_TRUE)
  6660. == XML_STATUS_ERROR)
  6661. xml_failure(g_parser);
  6662. CharData_CheckXMLChars(&storage, expected);
  6663. }
  6664. END_TEST
  6665. typedef struct {
  6666. XML_Parser parser;
  6667. int deep;
  6668. } DataIssue240;
  6669. static void
  6670. start_element_issue_240(void *userData, const XML_Char *name,
  6671. const XML_Char **atts) {
  6672. DataIssue240 *mydata = (DataIssue240 *)userData;
  6673. UNUSED_P(name);
  6674. UNUSED_P(atts);
  6675. mydata->deep++;
  6676. }
  6677. static void
  6678. end_element_issue_240(void *userData, const XML_Char *name) {
  6679. DataIssue240 *mydata = (DataIssue240 *)userData;
  6680. UNUSED_P(name);
  6681. mydata->deep--;
  6682. if (mydata->deep == 0) {
  6683. XML_StopParser(mydata->parser, 0);
  6684. }
  6685. }
  6686. START_TEST(test_misc_stop_during_end_handler_issue_240_1) {
  6687. XML_Parser parser;
  6688. DataIssue240 *mydata;
  6689. enum XML_Status result;
  6690. const char *const doc1 = "<doc><e1/><e><foo/></e></doc>";
  6691. parser = XML_ParserCreate(NULL);
  6692. XML_SetElementHandler(parser, start_element_issue_240, end_element_issue_240);
  6693. mydata = (DataIssue240 *)malloc(sizeof(DataIssue240));
  6694. mydata->parser = parser;
  6695. mydata->deep = 0;
  6696. XML_SetUserData(parser, mydata);
  6697. result = XML_Parse(parser, doc1, (int)strlen(doc1), 1);
  6698. XML_ParserFree(parser);
  6699. free(mydata);
  6700. if (result != XML_STATUS_ERROR)
  6701. fail("Stopping the parser did not work as expected");
  6702. }
  6703. END_TEST
  6704. START_TEST(test_misc_stop_during_end_handler_issue_240_2) {
  6705. XML_Parser parser;
  6706. DataIssue240 *mydata;
  6707. enum XML_Status result;
  6708. const char *const doc2 = "<doc><elem/></doc>";
  6709. parser = XML_ParserCreate(NULL);
  6710. XML_SetElementHandler(parser, start_element_issue_240, end_element_issue_240);
  6711. mydata = (DataIssue240 *)malloc(sizeof(DataIssue240));
  6712. mydata->parser = parser;
  6713. mydata->deep = 0;
  6714. XML_SetUserData(parser, mydata);
  6715. result = XML_Parse(parser, doc2, (int)strlen(doc2), 1);
  6716. XML_ParserFree(parser);
  6717. free(mydata);
  6718. if (result != XML_STATUS_ERROR)
  6719. fail("Stopping the parser did not work as expected");
  6720. }
  6721. END_TEST
  6722. START_TEST(test_misc_deny_internal_entity_closing_doctype_issue_317) {
  6723. const char *const inputOne = "<!DOCTYPE d [\n"
  6724. "<!ENTITY % e ']><d/>'>\n"
  6725. "\n"
  6726. "%e;";
  6727. const char *const inputTwo = "<!DOCTYPE d [\n"
  6728. "<!ENTITY % e1 ']><d/>'><!ENTITY % e2 '&e1;'>\n"
  6729. "\n"
  6730. "%e2;";
  6731. const char *const inputThree = "<!DOCTYPE d [\n"
  6732. "<!ENTITY % e ']><d'>\n"
  6733. "\n"
  6734. "%e;";
  6735. const char *const inputIssue317 = "<!DOCTYPE doc [\n"
  6736. "<!ENTITY % foo ']>\n"
  6737. "<doc>Hell<oc (#PCDATA)*>'>\n"
  6738. "%foo;\n"
  6739. "]>\n"
  6740. "<doc>Hello, world</dVc>";
  6741. const char *const inputs[] = {inputOne, inputTwo, inputThree, inputIssue317};
  6742. size_t inputIndex = 0;
  6743. for (; inputIndex < sizeof(inputs) / sizeof(inputs[0]); inputIndex++) {
  6744. XML_Parser parser;
  6745. enum XML_Status parseResult;
  6746. int setParamEntityResult;
  6747. XML_Size lineNumber;
  6748. XML_Size columnNumber;
  6749. const char *const input = inputs[inputIndex];
  6750. parser = XML_ParserCreate(NULL);
  6751. setParamEntityResult
  6752. = XML_SetParamEntityParsing(parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  6753. if (setParamEntityResult != 1)
  6754. fail("Failed to set XML_PARAM_ENTITY_PARSING_ALWAYS.");
  6755. parseResult = XML_Parse(parser, input, (int)strlen(input), 0);
  6756. if (parseResult != XML_STATUS_ERROR) {
  6757. parseResult = XML_Parse(parser, "", 0, 1);
  6758. if (parseResult != XML_STATUS_ERROR) {
  6759. fail("Parsing was expected to fail but succeeded.");
  6760. }
  6761. }
  6762. if (XML_GetErrorCode(parser) != XML_ERROR_INVALID_TOKEN)
  6763. fail("Error code does not match XML_ERROR_INVALID_TOKEN");
  6764. lineNumber = XML_GetCurrentLineNumber(parser);
  6765. if (lineNumber != 4)
  6766. fail("XML_GetCurrentLineNumber does not work as expected.");
  6767. columnNumber = XML_GetCurrentColumnNumber(parser);
  6768. if (columnNumber != 0)
  6769. fail("XML_GetCurrentColumnNumber does not work as expected.");
  6770. XML_ParserFree(parser);
  6771. }
  6772. }
  6773. END_TEST
  6774. static void
  6775. alloc_setup(void) {
  6776. XML_Memory_Handling_Suite memsuite = {duff_allocator, duff_reallocator, free};
  6777. /* Ensure the parser creation will go through */
  6778. allocation_count = ALLOC_ALWAYS_SUCCEED;
  6779. reallocation_count = REALLOC_ALWAYS_SUCCEED;
  6780. g_parser = XML_ParserCreate_MM(NULL, &memsuite, NULL);
  6781. if (g_parser == NULL)
  6782. fail("Parser not created");
  6783. }
  6784. static void
  6785. alloc_teardown(void) {
  6786. basic_teardown();
  6787. }
  6788. /* Test the effects of allocation failures on xml declaration processing */
  6789. START_TEST(test_alloc_parse_xdecl) {
  6790. const char *text = "<?xml version='1.0' encoding='utf-8'?>\n"
  6791. "<doc>Hello, world</doc>";
  6792. int i;
  6793. const int max_alloc_count = 15;
  6794. for (i = 0; i < max_alloc_count; i++) {
  6795. allocation_count = i;
  6796. XML_SetXmlDeclHandler(g_parser, dummy_xdecl_handler);
  6797. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  6798. != XML_STATUS_ERROR)
  6799. break;
  6800. /* Resetting the parser is insufficient, because some memory
  6801. * allocations are cached within the parser. Instead we use
  6802. * the teardown and setup routines to ensure that we have the
  6803. * right sort of parser back in our hands.
  6804. */
  6805. alloc_teardown();
  6806. alloc_setup();
  6807. }
  6808. if (i == 0)
  6809. fail("Parse succeeded despite failing allocator");
  6810. if (i == max_alloc_count)
  6811. fail("Parse failed with max allocations");
  6812. }
  6813. END_TEST
  6814. /* As above, but with an encoding big enough to cause storing the
  6815. * version information to expand the string pool being used.
  6816. */
  6817. static int XMLCALL
  6818. long_encoding_handler(void *userData, const XML_Char *encoding,
  6819. XML_Encoding *info) {
  6820. int i;
  6821. UNUSED_P(userData);
  6822. UNUSED_P(encoding);
  6823. for (i = 0; i < 256; i++)
  6824. info->map[i] = i;
  6825. info->data = NULL;
  6826. info->convert = NULL;
  6827. info->release = NULL;
  6828. return XML_STATUS_OK;
  6829. }
  6830. START_TEST(test_alloc_parse_xdecl_2) {
  6831. const char *text
  6832. = "<?xml version='1.0' encoding='"
  6833. /* Each line is 64 characters */
  6834. "ThisIsAStupidlyLongEncodingNameIntendedToTriggerPoolGrowth123456"
  6835. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6836. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6837. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6838. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6839. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6840. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6841. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6842. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6843. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6844. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6845. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6846. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6847. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6848. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6849. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMN"
  6850. "'?>"
  6851. "<doc>Hello, world</doc>";
  6852. int i;
  6853. const int max_alloc_count = 20;
  6854. for (i = 0; i < max_alloc_count; i++) {
  6855. allocation_count = i;
  6856. XML_SetXmlDeclHandler(g_parser, dummy_xdecl_handler);
  6857. XML_SetUnknownEncodingHandler(g_parser, long_encoding_handler, NULL);
  6858. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  6859. != XML_STATUS_ERROR)
  6860. break;
  6861. /* See comment in test_alloc_parse_xdecl() */
  6862. alloc_teardown();
  6863. alloc_setup();
  6864. }
  6865. if (i == 0)
  6866. fail("Parse succeeded despite failing allocator");
  6867. if (i == max_alloc_count)
  6868. fail("Parse failed with max allocations");
  6869. }
  6870. END_TEST
  6871. /* Test the effects of allocation failures on a straightforward parse */
  6872. START_TEST(test_alloc_parse_pi) {
  6873. const char *text = "<?xml version='1.0' encoding='utf-8'?>\n"
  6874. "<?pi unknown?>\n"
  6875. "<doc>"
  6876. "Hello, world"
  6877. "</doc>";
  6878. int i;
  6879. const int max_alloc_count = 15;
  6880. for (i = 0; i < max_alloc_count; i++) {
  6881. allocation_count = i;
  6882. XML_SetProcessingInstructionHandler(g_parser, dummy_pi_handler);
  6883. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  6884. != XML_STATUS_ERROR)
  6885. break;
  6886. /* See comment in test_alloc_parse_xdecl() */
  6887. alloc_teardown();
  6888. alloc_setup();
  6889. }
  6890. if (i == 0)
  6891. fail("Parse succeeded despite failing allocator");
  6892. if (i == max_alloc_count)
  6893. fail("Parse failed with max allocations");
  6894. }
  6895. END_TEST
  6896. START_TEST(test_alloc_parse_pi_2) {
  6897. const char *text = "<?xml version='1.0' encoding='utf-8'?>\n"
  6898. "<doc>"
  6899. "Hello, world"
  6900. "<?pi unknown?>\n"
  6901. "</doc>";
  6902. int i;
  6903. const int max_alloc_count = 15;
  6904. for (i = 0; i < max_alloc_count; i++) {
  6905. allocation_count = i;
  6906. XML_SetProcessingInstructionHandler(g_parser, dummy_pi_handler);
  6907. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  6908. != XML_STATUS_ERROR)
  6909. break;
  6910. /* See comment in test_alloc_parse_xdecl() */
  6911. alloc_teardown();
  6912. alloc_setup();
  6913. }
  6914. if (i == 0)
  6915. fail("Parse succeeded despite failing allocator");
  6916. if (i == max_alloc_count)
  6917. fail("Parse failed with max allocations");
  6918. }
  6919. END_TEST
  6920. START_TEST(test_alloc_parse_pi_3) {
  6921. const char *text
  6922. = "<?"
  6923. /* 64 characters per line */
  6924. "This processing instruction should be long enough to ensure that"
  6925. "it triggers the growth of an internal string pool when the "
  6926. "allocator fails at a cruicial moment FGHIJKLMNOPABCDEFGHIJKLMNOP"
  6927. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6928. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6929. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6930. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6931. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6932. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6933. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6934. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6935. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6936. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6937. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6938. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6939. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  6940. "Q?><doc/>";
  6941. int i;
  6942. const int max_alloc_count = 20;
  6943. for (i = 0; i < max_alloc_count; i++) {
  6944. allocation_count = i;
  6945. XML_SetProcessingInstructionHandler(g_parser, dummy_pi_handler);
  6946. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  6947. != XML_STATUS_ERROR)
  6948. break;
  6949. /* See comment in test_alloc_parse_xdecl() */
  6950. alloc_teardown();
  6951. alloc_setup();
  6952. }
  6953. if (i == 0)
  6954. fail("Parse succeeded despite failing allocator");
  6955. if (i == max_alloc_count)
  6956. fail("Parse failed with max allocations");
  6957. }
  6958. END_TEST
  6959. START_TEST(test_alloc_parse_comment) {
  6960. const char *text = "<?xml version='1.0' encoding='utf-8'?>\n"
  6961. "<!-- Test parsing this comment -->"
  6962. "<doc>Hi</doc>";
  6963. int i;
  6964. const int max_alloc_count = 15;
  6965. for (i = 0; i < max_alloc_count; i++) {
  6966. allocation_count = i;
  6967. XML_SetCommentHandler(g_parser, dummy_comment_handler);
  6968. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  6969. != XML_STATUS_ERROR)
  6970. break;
  6971. /* See comment in test_alloc_parse_xdecl() */
  6972. alloc_teardown();
  6973. alloc_setup();
  6974. }
  6975. if (i == 0)
  6976. fail("Parse succeeded despite failing allocator");
  6977. if (i == max_alloc_count)
  6978. fail("Parse failed with max allocations");
  6979. }
  6980. END_TEST
  6981. START_TEST(test_alloc_parse_comment_2) {
  6982. const char *text = "<?xml version='1.0' encoding='utf-8'?>\n"
  6983. "<doc>"
  6984. "Hello, world"
  6985. "<!-- Parse this comment too -->"
  6986. "</doc>";
  6987. int i;
  6988. const int max_alloc_count = 15;
  6989. for (i = 0; i < max_alloc_count; i++) {
  6990. allocation_count = i;
  6991. XML_SetCommentHandler(g_parser, dummy_comment_handler);
  6992. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  6993. != XML_STATUS_ERROR)
  6994. break;
  6995. /* See comment in test_alloc_parse_xdecl() */
  6996. alloc_teardown();
  6997. alloc_setup();
  6998. }
  6999. if (i == 0)
  7000. fail("Parse succeeded despite failing allocator");
  7001. if (i == max_alloc_count)
  7002. fail("Parse failed with max allocations");
  7003. }
  7004. END_TEST
  7005. static int XMLCALL
  7006. external_entity_duff_loader(XML_Parser parser, const XML_Char *context,
  7007. const XML_Char *base, const XML_Char *systemId,
  7008. const XML_Char *publicId) {
  7009. XML_Parser new_parser;
  7010. unsigned int i;
  7011. const unsigned int max_alloc_count = 10;
  7012. UNUSED_P(base);
  7013. UNUSED_P(systemId);
  7014. UNUSED_P(publicId);
  7015. /* Try a few different allocation levels */
  7016. for (i = 0; i < max_alloc_count; i++) {
  7017. allocation_count = i;
  7018. new_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  7019. if (new_parser != NULL) {
  7020. XML_ParserFree(new_parser);
  7021. break;
  7022. }
  7023. }
  7024. if (i == 0)
  7025. fail("External parser creation ignored failing allocator");
  7026. else if (i == max_alloc_count)
  7027. fail("Extern parser not created with max allocation count");
  7028. /* Make sure other random allocation doesn't now fail */
  7029. allocation_count = ALLOC_ALWAYS_SUCCEED;
  7030. /* Make sure the failure code path is executed too */
  7031. return XML_STATUS_ERROR;
  7032. }
  7033. /* Test that external parser creation running out of memory is
  7034. * correctly reported. Based on the external entity test cases.
  7035. */
  7036. START_TEST(test_alloc_create_external_parser) {
  7037. const char *text = "<?xml version='1.0' encoding='us-ascii'?>\n"
  7038. "<!DOCTYPE doc SYSTEM 'foo'>\n"
  7039. "<doc>&entity;</doc>";
  7040. char foo_text[] = "<!ELEMENT doc (#PCDATA)*>";
  7041. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  7042. XML_SetUserData(g_parser, foo_text);
  7043. XML_SetExternalEntityRefHandler(g_parser, external_entity_duff_loader);
  7044. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  7045. != XML_STATUS_ERROR) {
  7046. fail("External parser allocator returned success incorrectly");
  7047. }
  7048. }
  7049. END_TEST
  7050. /* More external parser memory allocation testing */
  7051. START_TEST(test_alloc_run_external_parser) {
  7052. const char *text = "<?xml version='1.0' encoding='us-ascii'?>\n"
  7053. "<!DOCTYPE doc SYSTEM 'foo'>\n"
  7054. "<doc>&entity;</doc>";
  7055. char foo_text[] = "<!ELEMENT doc (#PCDATA)*>";
  7056. unsigned int i;
  7057. const unsigned int max_alloc_count = 15;
  7058. for (i = 0; i < max_alloc_count; i++) {
  7059. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  7060. XML_SetUserData(g_parser, foo_text);
  7061. XML_SetExternalEntityRefHandler(g_parser, external_entity_null_loader);
  7062. allocation_count = i;
  7063. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  7064. != XML_STATUS_ERROR)
  7065. break;
  7066. /* See comment in test_alloc_parse_xdecl() */
  7067. alloc_teardown();
  7068. alloc_setup();
  7069. }
  7070. if (i == 0)
  7071. fail("Parsing ignored failing allocator");
  7072. else if (i == max_alloc_count)
  7073. fail("Parsing failed with allocation count 10");
  7074. }
  7075. END_TEST
  7076. static int XMLCALL
  7077. external_entity_dbl_handler(XML_Parser parser, const XML_Char *context,
  7078. const XML_Char *base, const XML_Char *systemId,
  7079. const XML_Char *publicId) {
  7080. intptr_t callno = (intptr_t)XML_GetUserData(parser);
  7081. const char *text;
  7082. XML_Parser new_parser;
  7083. int i;
  7084. const int max_alloc_count = 20;
  7085. UNUSED_P(base);
  7086. UNUSED_P(systemId);
  7087. UNUSED_P(publicId);
  7088. if (callno == 0) {
  7089. /* First time through, check how many calls to malloc occur */
  7090. text = ("<!ELEMENT doc (e+)>\n"
  7091. "<!ATTLIST doc xmlns CDATA #IMPLIED>\n"
  7092. "<!ELEMENT e EMPTY>\n");
  7093. allocation_count = 10000;
  7094. new_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  7095. if (new_parser == NULL) {
  7096. fail("Unable to allocate first external parser");
  7097. return XML_STATUS_ERROR;
  7098. }
  7099. /* Stash the number of calls in the user data */
  7100. XML_SetUserData(parser, (void *)(intptr_t)(10000 - allocation_count));
  7101. } else {
  7102. text = ("<?xml version='1.0' encoding='us-ascii'?>"
  7103. "<e/>");
  7104. /* Try at varying levels to exercise more code paths */
  7105. for (i = 0; i < max_alloc_count; i++) {
  7106. allocation_count = callno + i;
  7107. new_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  7108. if (new_parser != NULL)
  7109. break;
  7110. }
  7111. if (i == 0) {
  7112. fail("Second external parser unexpectedly created");
  7113. XML_ParserFree(new_parser);
  7114. return XML_STATUS_ERROR;
  7115. } else if (i == max_alloc_count) {
  7116. fail("Second external parser not created");
  7117. return XML_STATUS_ERROR;
  7118. }
  7119. }
  7120. allocation_count = ALLOC_ALWAYS_SUCCEED;
  7121. if (_XML_Parse_SINGLE_BYTES(new_parser, text, (int)strlen(text), XML_TRUE)
  7122. == XML_STATUS_ERROR) {
  7123. xml_failure(new_parser);
  7124. return XML_STATUS_ERROR;
  7125. }
  7126. XML_ParserFree(new_parser);
  7127. return XML_STATUS_OK;
  7128. }
  7129. /* Test that running out of memory in dtdCopy is correctly reported.
  7130. * Based on test_default_ns_from_ext_subset_and_ext_ge()
  7131. */
  7132. START_TEST(test_alloc_dtd_copy_default_atts) {
  7133. const char *text = "<?xml version='1.0'?>\n"
  7134. "<!DOCTYPE doc SYSTEM 'http://example.org/doc.dtd' [\n"
  7135. " <!ENTITY en SYSTEM 'http://example.org/entity.ent'>\n"
  7136. "]>\n"
  7137. "<doc xmlns='http://example.org/ns1'>\n"
  7138. "&en;\n"
  7139. "</doc>";
  7140. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  7141. XML_SetExternalEntityRefHandler(g_parser, external_entity_dbl_handler);
  7142. XML_SetUserData(g_parser, NULL);
  7143. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  7144. == XML_STATUS_ERROR)
  7145. xml_failure(g_parser);
  7146. }
  7147. END_TEST
  7148. static int XMLCALL
  7149. external_entity_dbl_handler_2(XML_Parser parser, const XML_Char *context,
  7150. const XML_Char *base, const XML_Char *systemId,
  7151. const XML_Char *publicId) {
  7152. intptr_t callno = (intptr_t)XML_GetUserData(parser);
  7153. const char *text;
  7154. XML_Parser new_parser;
  7155. enum XML_Status rv;
  7156. UNUSED_P(base);
  7157. UNUSED_P(systemId);
  7158. UNUSED_P(publicId);
  7159. if (callno == 0) {
  7160. /* Try different allocation levels for whole exercise */
  7161. text = ("<!ELEMENT doc (e+)>\n"
  7162. "<!ATTLIST doc xmlns CDATA #IMPLIED>\n"
  7163. "<!ELEMENT e EMPTY>\n");
  7164. XML_SetUserData(parser, (void *)(intptr_t)1);
  7165. new_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  7166. if (new_parser == NULL)
  7167. return XML_STATUS_ERROR;
  7168. rv = _XML_Parse_SINGLE_BYTES(new_parser, text, (int)strlen(text), XML_TRUE);
  7169. } else {
  7170. /* Just run through once */
  7171. text = ("<?xml version='1.0' encoding='us-ascii'?>"
  7172. "<e/>");
  7173. new_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  7174. if (new_parser == NULL)
  7175. return XML_STATUS_ERROR;
  7176. rv = _XML_Parse_SINGLE_BYTES(new_parser, text, (int)strlen(text), XML_TRUE);
  7177. }
  7178. XML_ParserFree(new_parser);
  7179. if (rv == XML_STATUS_ERROR)
  7180. return XML_STATUS_ERROR;
  7181. return XML_STATUS_OK;
  7182. }
  7183. /* Test more external entity allocation failure paths */
  7184. START_TEST(test_alloc_external_entity) {
  7185. const char *text = "<?xml version='1.0'?>\n"
  7186. "<!DOCTYPE doc SYSTEM 'http://example.org/doc.dtd' [\n"
  7187. " <!ENTITY en SYSTEM 'http://example.org/entity.ent'>\n"
  7188. "]>\n"
  7189. "<doc xmlns='http://example.org/ns1'>\n"
  7190. "&en;\n"
  7191. "</doc>";
  7192. int i;
  7193. const int alloc_test_max_repeats = 50;
  7194. for (i = 0; i < alloc_test_max_repeats; i++) {
  7195. allocation_count = -1;
  7196. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  7197. XML_SetExternalEntityRefHandler(g_parser, external_entity_dbl_handler_2);
  7198. XML_SetUserData(g_parser, NULL);
  7199. allocation_count = i;
  7200. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  7201. == XML_STATUS_OK)
  7202. break;
  7203. /* See comment in test_alloc_parse_xdecl() */
  7204. alloc_teardown();
  7205. alloc_setup();
  7206. }
  7207. allocation_count = -1;
  7208. if (i == 0)
  7209. fail("External entity parsed despite duff allocator");
  7210. if (i == alloc_test_max_repeats)
  7211. fail("External entity not parsed at max allocation count");
  7212. }
  7213. END_TEST
  7214. /* Test more allocation failure paths */
  7215. static int XMLCALL
  7216. external_entity_alloc_set_encoding(XML_Parser parser, const XML_Char *context,
  7217. const XML_Char *base,
  7218. const XML_Char *systemId,
  7219. const XML_Char *publicId) {
  7220. /* As for external_entity_loader() */
  7221. const char *text = "<?xml encoding='iso-8859-3'?>"
  7222. "\xC3\xA9";
  7223. XML_Parser ext_parser;
  7224. enum XML_Status status;
  7225. UNUSED_P(base);
  7226. UNUSED_P(systemId);
  7227. UNUSED_P(publicId);
  7228. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  7229. if (ext_parser == NULL)
  7230. return XML_STATUS_ERROR;
  7231. if (! XML_SetEncoding(ext_parser, XCS("utf-8"))) {
  7232. XML_ParserFree(ext_parser);
  7233. return XML_STATUS_ERROR;
  7234. }
  7235. status
  7236. = _XML_Parse_SINGLE_BYTES(ext_parser, text, (int)strlen(text), XML_TRUE);
  7237. XML_ParserFree(ext_parser);
  7238. if (status == XML_STATUS_ERROR)
  7239. return XML_STATUS_ERROR;
  7240. return XML_STATUS_OK;
  7241. }
  7242. START_TEST(test_alloc_ext_entity_set_encoding) {
  7243. const char *text = "<!DOCTYPE doc [\n"
  7244. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  7245. "]>\n"
  7246. "<doc>&en;</doc>";
  7247. int i;
  7248. const int max_allocation_count = 30;
  7249. for (i = 0; i < max_allocation_count; i++) {
  7250. XML_SetExternalEntityRefHandler(g_parser,
  7251. external_entity_alloc_set_encoding);
  7252. allocation_count = i;
  7253. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  7254. == XML_STATUS_OK)
  7255. break;
  7256. allocation_count = -1;
  7257. /* See comment in test_alloc_parse_xdecl() */
  7258. alloc_teardown();
  7259. alloc_setup();
  7260. }
  7261. if (i == 0)
  7262. fail("Encoding check succeeded despite failing allocator");
  7263. if (i == max_allocation_count)
  7264. fail("Encoding failed at max allocation count");
  7265. }
  7266. END_TEST
  7267. static int XMLCALL
  7268. unknown_released_encoding_handler(void *data, const XML_Char *encoding,
  7269. XML_Encoding *info) {
  7270. UNUSED_P(data);
  7271. if (! xcstrcmp(encoding, XCS("unsupported-encoding"))) {
  7272. int i;
  7273. for (i = 0; i < 256; i++)
  7274. info->map[i] = i;
  7275. info->data = NULL;
  7276. info->convert = NULL;
  7277. info->release = dummy_release;
  7278. return XML_STATUS_OK;
  7279. }
  7280. return XML_STATUS_ERROR;
  7281. }
  7282. /* Test the effects of allocation failure in internal entities.
  7283. * Based on test_unknown_encoding_internal_entity
  7284. */
  7285. START_TEST(test_alloc_internal_entity) {
  7286. const char *text = "<?xml version='1.0' encoding='unsupported-encoding'?>\n"
  7287. "<!DOCTYPE test [<!ENTITY foo 'bar'>]>\n"
  7288. "<test a='&foo;'/>";
  7289. unsigned int i;
  7290. const unsigned int max_alloc_count = 20;
  7291. for (i = 0; i < max_alloc_count; i++) {
  7292. allocation_count = i;
  7293. XML_SetUnknownEncodingHandler(g_parser, unknown_released_encoding_handler,
  7294. NULL);
  7295. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  7296. != XML_STATUS_ERROR)
  7297. break;
  7298. /* See comment in test_alloc_parse_xdecl() */
  7299. alloc_teardown();
  7300. alloc_setup();
  7301. }
  7302. if (i == 0)
  7303. fail("Internal entity worked despite failing allocations");
  7304. else if (i == max_alloc_count)
  7305. fail("Internal entity failed at max allocation count");
  7306. }
  7307. END_TEST
  7308. /* Test the robustness against allocation failure of element handling
  7309. * Based on test_dtd_default_handling().
  7310. */
  7311. START_TEST(test_alloc_dtd_default_handling) {
  7312. const char *text = "<!DOCTYPE doc [\n"
  7313. "<!ENTITY e SYSTEM 'http://example.org/e'>\n"
  7314. "<!NOTATION n SYSTEM 'http://example.org/n'>\n"
  7315. "<!ENTITY e1 SYSTEM 'http://example.org/e' NDATA n>\n"
  7316. "<!ELEMENT doc (#PCDATA)>\n"
  7317. "<!ATTLIST doc a CDATA #IMPLIED>\n"
  7318. "<?pi in dtd?>\n"
  7319. "<!--comment in dtd-->\n"
  7320. "]>\n"
  7321. "<doc><![CDATA[text in doc]]></doc>";
  7322. const XML_Char *expected = XCS("\n\n\n\n\n\n\n\n\n<doc>text in doc</doc>");
  7323. CharData storage;
  7324. int i;
  7325. const int max_alloc_count = 25;
  7326. for (i = 0; i < max_alloc_count; i++) {
  7327. allocation_count = i;
  7328. dummy_handler_flags = 0;
  7329. XML_SetDefaultHandler(g_parser, accumulate_characters);
  7330. XML_SetDoctypeDeclHandler(g_parser, dummy_start_doctype_handler,
  7331. dummy_end_doctype_handler);
  7332. XML_SetEntityDeclHandler(g_parser, dummy_entity_decl_handler);
  7333. XML_SetNotationDeclHandler(g_parser, dummy_notation_decl_handler);
  7334. XML_SetElementDeclHandler(g_parser, dummy_element_decl_handler);
  7335. XML_SetAttlistDeclHandler(g_parser, dummy_attlist_decl_handler);
  7336. XML_SetProcessingInstructionHandler(g_parser, dummy_pi_handler);
  7337. XML_SetCommentHandler(g_parser, dummy_comment_handler);
  7338. XML_SetCdataSectionHandler(g_parser, dummy_start_cdata_handler,
  7339. dummy_end_cdata_handler);
  7340. XML_SetUnparsedEntityDeclHandler(g_parser,
  7341. dummy_unparsed_entity_decl_handler);
  7342. CharData_Init(&storage);
  7343. XML_SetUserData(g_parser, &storage);
  7344. XML_SetCharacterDataHandler(g_parser, accumulate_characters);
  7345. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  7346. != XML_STATUS_ERROR)
  7347. break;
  7348. /* See comment in test_alloc_parse_xdecl() */
  7349. alloc_teardown();
  7350. alloc_setup();
  7351. }
  7352. if (i == 0)
  7353. fail("Default DTD parsed despite allocation failures");
  7354. if (i == max_alloc_count)
  7355. fail("Default DTD not parsed with maximum alloc count");
  7356. CharData_CheckXMLChars(&storage, expected);
  7357. if (dummy_handler_flags
  7358. != (DUMMY_START_DOCTYPE_HANDLER_FLAG | DUMMY_END_DOCTYPE_HANDLER_FLAG
  7359. | DUMMY_ENTITY_DECL_HANDLER_FLAG | DUMMY_NOTATION_DECL_HANDLER_FLAG
  7360. | DUMMY_ELEMENT_DECL_HANDLER_FLAG | DUMMY_ATTLIST_DECL_HANDLER_FLAG
  7361. | DUMMY_COMMENT_HANDLER_FLAG | DUMMY_PI_HANDLER_FLAG
  7362. | DUMMY_START_CDATA_HANDLER_FLAG | DUMMY_END_CDATA_HANDLER_FLAG
  7363. | DUMMY_UNPARSED_ENTITY_DECL_HANDLER_FLAG))
  7364. fail("Not all handlers were called");
  7365. }
  7366. END_TEST
  7367. /* Test robustness of XML_SetEncoding() with a failing allocator */
  7368. START_TEST(test_alloc_explicit_encoding) {
  7369. int i;
  7370. const int max_alloc_count = 5;
  7371. for (i = 0; i < max_alloc_count; i++) {
  7372. allocation_count = i;
  7373. if (XML_SetEncoding(g_parser, XCS("us-ascii")) == XML_STATUS_OK)
  7374. break;
  7375. }
  7376. if (i == 0)
  7377. fail("Encoding set despite failing allocator");
  7378. else if (i == max_alloc_count)
  7379. fail("Encoding not set at max allocation count");
  7380. }
  7381. END_TEST
  7382. /* Test robustness of XML_SetBase against a failing allocator */
  7383. START_TEST(test_alloc_set_base) {
  7384. const XML_Char *new_base = XCS("/local/file/name.xml");
  7385. int i;
  7386. const int max_alloc_count = 5;
  7387. for (i = 0; i < max_alloc_count; i++) {
  7388. allocation_count = i;
  7389. if (XML_SetBase(g_parser, new_base) == XML_STATUS_OK)
  7390. break;
  7391. }
  7392. if (i == 0)
  7393. fail("Base set despite failing allocator");
  7394. else if (i == max_alloc_count)
  7395. fail("Base not set with max allocation count");
  7396. }
  7397. END_TEST
  7398. /* Test buffer extension in the face of a duff reallocator */
  7399. START_TEST(test_alloc_realloc_buffer) {
  7400. const char *text = get_buffer_test_text;
  7401. void *buffer;
  7402. int i;
  7403. const int max_realloc_count = 10;
  7404. /* Get a smallish buffer */
  7405. for (i = 0; i < max_realloc_count; i++) {
  7406. reallocation_count = i;
  7407. buffer = XML_GetBuffer(g_parser, 1536);
  7408. if (buffer == NULL)
  7409. fail("1.5K buffer reallocation failed");
  7410. assert(buffer != NULL);
  7411. memcpy(buffer, text, strlen(text));
  7412. if (XML_ParseBuffer(g_parser, (int)strlen(text), XML_FALSE)
  7413. == XML_STATUS_OK)
  7414. break;
  7415. /* See comment in test_alloc_parse_xdecl() */
  7416. alloc_teardown();
  7417. alloc_setup();
  7418. }
  7419. reallocation_count = -1;
  7420. if (i == 0)
  7421. fail("Parse succeeded with no reallocation");
  7422. else if (i == max_realloc_count)
  7423. fail("Parse failed with max reallocation count");
  7424. }
  7425. END_TEST
  7426. /* Same test for external entity parsers */
  7427. static int XMLCALL
  7428. external_entity_reallocator(XML_Parser parser, const XML_Char *context,
  7429. const XML_Char *base, const XML_Char *systemId,
  7430. const XML_Char *publicId) {
  7431. const char *text = get_buffer_test_text;
  7432. XML_Parser ext_parser;
  7433. void *buffer;
  7434. enum XML_Status status;
  7435. UNUSED_P(base);
  7436. UNUSED_P(systemId);
  7437. UNUSED_P(publicId);
  7438. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  7439. if (ext_parser == NULL)
  7440. fail("Could not create external entity parser");
  7441. reallocation_count = (intptr_t)XML_GetUserData(parser);
  7442. buffer = XML_GetBuffer(ext_parser, 1536);
  7443. if (buffer == NULL)
  7444. fail("Buffer allocation failed");
  7445. assert(buffer != NULL);
  7446. memcpy(buffer, text, strlen(text));
  7447. status = XML_ParseBuffer(ext_parser, (int)strlen(text), XML_FALSE);
  7448. reallocation_count = -1;
  7449. XML_ParserFree(ext_parser);
  7450. return (status == XML_STATUS_OK) ? XML_STATUS_OK : XML_STATUS_ERROR;
  7451. }
  7452. START_TEST(test_alloc_ext_entity_realloc_buffer) {
  7453. const char *text = "<!DOCTYPE doc [\n"
  7454. " <!ENTITY en SYSTEM 'http://example.org/dummy.ent'>\n"
  7455. "]>\n"
  7456. "<doc>&en;</doc>";
  7457. int i;
  7458. const int max_realloc_count = 10;
  7459. for (i = 0; i < max_realloc_count; i++) {
  7460. XML_SetExternalEntityRefHandler(g_parser, external_entity_reallocator);
  7461. XML_SetUserData(g_parser, (void *)(intptr_t)i);
  7462. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  7463. == XML_STATUS_OK)
  7464. break;
  7465. /* See comment in test_alloc_parse_xdecl() */
  7466. alloc_teardown();
  7467. alloc_setup();
  7468. }
  7469. if (i == 0)
  7470. fail("Succeeded with no reallocations");
  7471. if (i == max_realloc_count)
  7472. fail("Failed with max reallocations");
  7473. }
  7474. END_TEST
  7475. /* Test elements with many attributes are handled correctly */
  7476. START_TEST(test_alloc_realloc_many_attributes) {
  7477. const char *text = "<!DOCTYPE doc [\n"
  7478. "<!ATTLIST doc za CDATA 'default'>\n"
  7479. "<!ATTLIST doc zb CDATA 'def2'>\n"
  7480. "<!ATTLIST doc zc CDATA 'def3'>\n"
  7481. "]>\n"
  7482. "<doc a='1'"
  7483. " b='2'"
  7484. " c='3'"
  7485. " d='4'"
  7486. " e='5'"
  7487. " f='6'"
  7488. " g='7'"
  7489. " h='8'"
  7490. " i='9'"
  7491. " j='10'"
  7492. " k='11'"
  7493. " l='12'"
  7494. " m='13'"
  7495. " n='14'"
  7496. " p='15'"
  7497. " q='16'"
  7498. " r='17'"
  7499. " s='18'>"
  7500. "</doc>";
  7501. int i;
  7502. const int max_realloc_count = 10;
  7503. for (i = 0; i < max_realloc_count; i++) {
  7504. reallocation_count = i;
  7505. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  7506. != XML_STATUS_ERROR)
  7507. break;
  7508. /* See comment in test_alloc_parse_xdecl() */
  7509. alloc_teardown();
  7510. alloc_setup();
  7511. }
  7512. if (i == 0)
  7513. fail("Parse succeeded despite no reallocations");
  7514. if (i == max_realloc_count)
  7515. fail("Parse failed at max reallocations");
  7516. }
  7517. END_TEST
  7518. /* Test handling of a public entity with failing allocator */
  7519. START_TEST(test_alloc_public_entity_value) {
  7520. const char *text = "<!DOCTYPE doc SYSTEM 'http://example.org/'>\n"
  7521. "<doc></doc>\n";
  7522. char dtd_text[]
  7523. = "<!ELEMENT doc EMPTY>\n"
  7524. "<!ENTITY % e1 PUBLIC 'foo' 'bar.ent'>\n"
  7525. "<!ENTITY % "
  7526. /* Each line is 64 characters */
  7527. "ThisIsAStupidlyLongParameterNameIntendedToTriggerPoolGrowth12345"
  7528. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7529. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7530. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7531. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7532. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7533. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7534. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7535. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7536. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7537. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7538. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7539. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7540. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7541. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7542. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7543. " '%e1;'>\n"
  7544. "%e1;\n";
  7545. int i;
  7546. const int max_alloc_count = 50;
  7547. for (i = 0; i < max_alloc_count; i++) {
  7548. allocation_count = i;
  7549. dummy_handler_flags = 0;
  7550. XML_SetUserData(g_parser, dtd_text);
  7551. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  7552. XML_SetExternalEntityRefHandler(g_parser, external_entity_public);
  7553. /* Provoke a particular code path */
  7554. XML_SetEntityDeclHandler(g_parser, dummy_entity_decl_handler);
  7555. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  7556. != XML_STATUS_ERROR)
  7557. break;
  7558. /* See comment in test_alloc_parse_xdecl() */
  7559. alloc_teardown();
  7560. alloc_setup();
  7561. }
  7562. if (i == 0)
  7563. fail("Parsing worked despite failing allocation");
  7564. if (i == max_alloc_count)
  7565. fail("Parsing failed at max allocation count");
  7566. if (dummy_handler_flags != DUMMY_ENTITY_DECL_HANDLER_FLAG)
  7567. fail("Entity declaration handler not called");
  7568. }
  7569. END_TEST
  7570. START_TEST(test_alloc_realloc_subst_public_entity_value) {
  7571. const char *text = "<!DOCTYPE doc SYSTEM 'http://example.org/'>\n"
  7572. "<doc></doc>\n";
  7573. char dtd_text[]
  7574. = "<!ELEMENT doc EMPTY>\n"
  7575. "<!ENTITY % "
  7576. /* Each line is 64 characters */
  7577. "ThisIsAStupidlyLongParameterNameIntendedToTriggerPoolGrowth12345"
  7578. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7579. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7580. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7581. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7582. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7583. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7584. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7585. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7586. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7587. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7588. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7589. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7590. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7591. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7592. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7593. " PUBLIC 'foo' 'bar.ent'>\n"
  7594. "%ThisIsAStupidlyLongParameterNameIntendedToTriggerPoolGrowth12345"
  7595. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7596. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7597. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7598. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7599. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7600. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7601. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7602. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7603. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7604. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7605. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7606. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7607. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7608. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7609. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP;";
  7610. int i;
  7611. const int max_realloc_count = 10;
  7612. for (i = 0; i < max_realloc_count; i++) {
  7613. reallocation_count = i;
  7614. XML_SetUserData(g_parser, dtd_text);
  7615. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  7616. XML_SetExternalEntityRefHandler(g_parser, external_entity_public);
  7617. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  7618. != XML_STATUS_ERROR)
  7619. break;
  7620. /* See comment in test_alloc_parse_xdecl() */
  7621. alloc_teardown();
  7622. alloc_setup();
  7623. }
  7624. if (i == 0)
  7625. fail("Parsing worked despite failing reallocation");
  7626. if (i == max_realloc_count)
  7627. fail("Parsing failed at max reallocation count");
  7628. }
  7629. END_TEST
  7630. START_TEST(test_alloc_parse_public_doctype) {
  7631. const char *text
  7632. = "<?xml version='1.0' encoding='utf-8'?>\n"
  7633. "<!DOCTYPE doc PUBLIC '"
  7634. /* 64 characters per line */
  7635. "http://example.com/a/long/enough/name/to/trigger/pool/growth/zz/"
  7636. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  7637. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  7638. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  7639. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  7640. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  7641. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  7642. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  7643. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  7644. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  7645. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  7646. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  7647. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  7648. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  7649. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  7650. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  7651. "' 'test'>\n"
  7652. "<doc></doc>";
  7653. int i;
  7654. const int max_alloc_count = 25;
  7655. for (i = 0; i < max_alloc_count; i++) {
  7656. allocation_count = i;
  7657. dummy_handler_flags = 0;
  7658. XML_SetDoctypeDeclHandler(g_parser, dummy_start_doctype_decl_handler,
  7659. dummy_end_doctype_decl_handler);
  7660. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  7661. != XML_STATUS_ERROR)
  7662. break;
  7663. /* See comment in test_alloc_parse_xdecl() */
  7664. alloc_teardown();
  7665. alloc_setup();
  7666. }
  7667. if (i == 0)
  7668. fail("Parse succeeded despite failing allocator");
  7669. if (i == max_alloc_count)
  7670. fail("Parse failed at maximum allocation count");
  7671. if (dummy_handler_flags
  7672. != (DUMMY_START_DOCTYPE_DECL_HANDLER_FLAG
  7673. | DUMMY_END_DOCTYPE_DECL_HANDLER_FLAG))
  7674. fail("Doctype handler functions not called");
  7675. }
  7676. END_TEST
  7677. START_TEST(test_alloc_parse_public_doctype_long_name) {
  7678. const char *text
  7679. = "<?xml version='1.0' encoding='utf-8'?>\n"
  7680. "<!DOCTYPE doc PUBLIC 'http://example.com/foo' '"
  7681. /* 64 characters per line */
  7682. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNOP"
  7683. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNOP"
  7684. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNOP"
  7685. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNOP"
  7686. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNOP"
  7687. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNOP"
  7688. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNOP"
  7689. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNOP"
  7690. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNOP"
  7691. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNOP"
  7692. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNOP"
  7693. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNOP"
  7694. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNOP"
  7695. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNOP"
  7696. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNOP"
  7697. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNOP"
  7698. "'>\n"
  7699. "<doc></doc>";
  7700. int i;
  7701. const int max_alloc_count = 25;
  7702. for (i = 0; i < max_alloc_count; i++) {
  7703. allocation_count = i;
  7704. XML_SetDoctypeDeclHandler(g_parser, dummy_start_doctype_decl_handler,
  7705. dummy_end_doctype_decl_handler);
  7706. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  7707. != XML_STATUS_ERROR)
  7708. break;
  7709. /* See comment in test_alloc_parse_xdecl() */
  7710. alloc_teardown();
  7711. alloc_setup();
  7712. }
  7713. if (i == 0)
  7714. fail("Parse succeeded despite failing allocator");
  7715. if (i == max_alloc_count)
  7716. fail("Parse failed at maximum allocation count");
  7717. }
  7718. END_TEST
  7719. static int XMLCALL
  7720. external_entity_alloc(XML_Parser parser, const XML_Char *context,
  7721. const XML_Char *base, const XML_Char *systemId,
  7722. const XML_Char *publicId) {
  7723. const char *text = (const char *)XML_GetUserData(parser);
  7724. XML_Parser ext_parser;
  7725. int parse_res;
  7726. UNUSED_P(base);
  7727. UNUSED_P(systemId);
  7728. UNUSED_P(publicId);
  7729. ext_parser = XML_ExternalEntityParserCreate(parser, context, NULL);
  7730. if (ext_parser == NULL)
  7731. return XML_STATUS_ERROR;
  7732. parse_res
  7733. = _XML_Parse_SINGLE_BYTES(ext_parser, text, (int)strlen(text), XML_TRUE);
  7734. XML_ParserFree(ext_parser);
  7735. return parse_res;
  7736. }
  7737. /* Test foreign DTD handling */
  7738. START_TEST(test_alloc_set_foreign_dtd) {
  7739. const char *text1 = "<?xml version='1.0' encoding='us-ascii'?>\n"
  7740. "<doc>&entity;</doc>";
  7741. char text2[] = "<!ELEMENT doc (#PCDATA)*>";
  7742. int i;
  7743. const int max_alloc_count = 25;
  7744. for (i = 0; i < max_alloc_count; i++) {
  7745. allocation_count = i;
  7746. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  7747. XML_SetUserData(g_parser, &text2);
  7748. XML_SetExternalEntityRefHandler(g_parser, external_entity_alloc);
  7749. if (XML_UseForeignDTD(g_parser, XML_TRUE) != XML_ERROR_NONE)
  7750. fail("Could not set foreign DTD");
  7751. if (_XML_Parse_SINGLE_BYTES(g_parser, text1, (int)strlen(text1), XML_TRUE)
  7752. != XML_STATUS_ERROR)
  7753. break;
  7754. /* See comment in test_alloc_parse_xdecl() */
  7755. alloc_teardown();
  7756. alloc_setup();
  7757. }
  7758. if (i == 0)
  7759. fail("Parse succeeded despite failing allocator");
  7760. if (i == max_alloc_count)
  7761. fail("Parse failed at maximum allocation count");
  7762. }
  7763. END_TEST
  7764. /* Test based on ibm/valid/P32/ibm32v04.xml */
  7765. START_TEST(test_alloc_attribute_enum_value) {
  7766. const char *text = "<?xml version='1.0' standalone='no'?>\n"
  7767. "<!DOCTYPE animal SYSTEM 'test.dtd'>\n"
  7768. "<animal>This is a \n <a/> \n\nyellow tiger</animal>";
  7769. char dtd_text[] = "<!ELEMENT animal (#PCDATA|a)*>\n"
  7770. "<!ELEMENT a EMPTY>\n"
  7771. "<!ATTLIST animal xml:space (default|preserve) 'preserve'>";
  7772. int i;
  7773. const int max_alloc_count = 30;
  7774. for (i = 0; i < max_alloc_count; i++) {
  7775. allocation_count = i;
  7776. XML_SetExternalEntityRefHandler(g_parser, external_entity_alloc);
  7777. XML_SetUserData(g_parser, dtd_text);
  7778. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  7779. /* An attribute list handler provokes a different code path */
  7780. XML_SetAttlistDeclHandler(g_parser, dummy_attlist_decl_handler);
  7781. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  7782. != XML_STATUS_ERROR)
  7783. break;
  7784. /* See comment in test_alloc_parse_xdecl() */
  7785. alloc_teardown();
  7786. alloc_setup();
  7787. }
  7788. if (i == 0)
  7789. fail("Parse succeeded despite failing allocator");
  7790. if (i == max_alloc_count)
  7791. fail("Parse failed at maximum allocation count");
  7792. }
  7793. END_TEST
  7794. /* Test attribute enums sufficient to overflow the string pool */
  7795. START_TEST(test_alloc_realloc_attribute_enum_value) {
  7796. const char *text = "<?xml version='1.0' standalone='no'?>\n"
  7797. "<!DOCTYPE animal SYSTEM 'test.dtd'>\n"
  7798. "<animal>This is a yellow tiger</animal>";
  7799. /* We wish to define a collection of attribute enums that will
  7800. * cause the string pool storing them to have to expand. This
  7801. * means more than 1024 bytes, including the parentheses and
  7802. * separator bars.
  7803. */
  7804. char dtd_text[]
  7805. = "<!ELEMENT animal (#PCDATA)*>\n"
  7806. "<!ATTLIST animal thing "
  7807. "(default"
  7808. /* Each line is 64 characters */
  7809. "|ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7810. "|BBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7811. "|CBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7812. "|DBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7813. "|EBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7814. "|FBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7815. "|GBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7816. "|HBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7817. "|IBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7818. "|JBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7819. "|KBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7820. "|LBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7821. "|MBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7822. "|NBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7823. "|OBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7824. "|PBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO)"
  7825. " 'default'>";
  7826. int i;
  7827. const int max_realloc_count = 10;
  7828. for (i = 0; i < max_realloc_count; i++) {
  7829. reallocation_count = i;
  7830. XML_SetExternalEntityRefHandler(g_parser, external_entity_alloc);
  7831. XML_SetUserData(g_parser, dtd_text);
  7832. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  7833. /* An attribute list handler provokes a different code path */
  7834. XML_SetAttlistDeclHandler(g_parser, dummy_attlist_decl_handler);
  7835. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  7836. != XML_STATUS_ERROR)
  7837. break;
  7838. /* See comment in test_alloc_parse_xdecl() */
  7839. alloc_teardown();
  7840. alloc_setup();
  7841. }
  7842. if (i == 0)
  7843. fail("Parse succeeded despite failing reallocator");
  7844. if (i == max_realloc_count)
  7845. fail("Parse failed at maximum reallocation count");
  7846. }
  7847. END_TEST
  7848. /* Test attribute enums in a #IMPLIED attribute forcing pool growth */
  7849. START_TEST(test_alloc_realloc_implied_attribute) {
  7850. /* Forcing this particular code path is a balancing act. The
  7851. * addition of the closing parenthesis and terminal NUL must be
  7852. * what pushes the string of enums over the 1024-byte limit,
  7853. * otherwise a different code path will pick up the realloc.
  7854. */
  7855. const char *text
  7856. = "<!DOCTYPE doc [\n"
  7857. "<!ELEMENT doc EMPTY>\n"
  7858. "<!ATTLIST doc a "
  7859. /* Each line is 64 characters */
  7860. "(ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7861. "|BBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7862. "|CBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7863. "|DBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7864. "|EBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7865. "|FBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7866. "|GBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7867. "|HBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7868. "|IBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7869. "|JBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7870. "|KBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7871. "|LBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7872. "|MBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7873. "|NBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7874. "|OBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7875. "|PBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMN)"
  7876. " #IMPLIED>\n"
  7877. "]><doc/>";
  7878. int i;
  7879. const int max_realloc_count = 10;
  7880. for (i = 0; i < max_realloc_count; i++) {
  7881. reallocation_count = i;
  7882. XML_SetAttlistDeclHandler(g_parser, dummy_attlist_decl_handler);
  7883. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  7884. != XML_STATUS_ERROR)
  7885. break;
  7886. /* See comment in test_alloc_parse_xdecl() */
  7887. alloc_teardown();
  7888. alloc_setup();
  7889. }
  7890. if (i == 0)
  7891. fail("Parse succeeded despite failing reallocator");
  7892. if (i == max_realloc_count)
  7893. fail("Parse failed at maximum reallocation count");
  7894. }
  7895. END_TEST
  7896. /* Test attribute enums in a defaulted attribute forcing pool growth */
  7897. START_TEST(test_alloc_realloc_default_attribute) {
  7898. /* Forcing this particular code path is a balancing act. The
  7899. * addition of the closing parenthesis and terminal NUL must be
  7900. * what pushes the string of enums over the 1024-byte limit,
  7901. * otherwise a different code path will pick up the realloc.
  7902. */
  7903. const char *text
  7904. = "<!DOCTYPE doc [\n"
  7905. "<!ELEMENT doc EMPTY>\n"
  7906. "<!ATTLIST doc a "
  7907. /* Each line is 64 characters */
  7908. "(ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7909. "|BBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7910. "|CBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7911. "|DBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7912. "|EBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7913. "|FBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7914. "|GBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7915. "|HBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7916. "|IBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7917. "|JBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7918. "|KBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7919. "|LBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7920. "|MBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7921. "|NBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7922. "|OBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO"
  7923. "|PBCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMN)"
  7924. " 'ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNO'"
  7925. ">\n]><doc/>";
  7926. int i;
  7927. const int max_realloc_count = 10;
  7928. for (i = 0; i < max_realloc_count; i++) {
  7929. reallocation_count = i;
  7930. XML_SetAttlistDeclHandler(g_parser, dummy_attlist_decl_handler);
  7931. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  7932. != XML_STATUS_ERROR)
  7933. break;
  7934. /* See comment in test_alloc_parse_xdecl() */
  7935. alloc_teardown();
  7936. alloc_setup();
  7937. }
  7938. if (i == 0)
  7939. fail("Parse succeeded despite failing reallocator");
  7940. if (i == max_realloc_count)
  7941. fail("Parse failed at maximum reallocation count");
  7942. }
  7943. END_TEST
  7944. /* Test long notation name with dodgy allocator */
  7945. START_TEST(test_alloc_notation) {
  7946. const char *text
  7947. = "<!DOCTYPE doc [\n"
  7948. "<!NOTATION "
  7949. /* Each line is 64 characters */
  7950. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7951. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7952. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7953. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7954. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7955. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7956. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7957. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7958. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7959. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7960. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7961. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7962. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7963. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7964. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7965. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7966. " SYSTEM 'http://example.org/n'>\n"
  7967. "<!ENTITY e SYSTEM 'http://example.org/e' NDATA "
  7968. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7969. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7970. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7971. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7972. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7973. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7974. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7975. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7976. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7977. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7978. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7979. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7980. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7981. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7982. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7983. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  7984. ">\n"
  7985. "<!ELEMENT doc EMPTY>\n"
  7986. "]>\n<doc/>";
  7987. int i;
  7988. const int max_alloc_count = 20;
  7989. for (i = 0; i < max_alloc_count; i++) {
  7990. allocation_count = i;
  7991. dummy_handler_flags = 0;
  7992. XML_SetNotationDeclHandler(g_parser, dummy_notation_decl_handler);
  7993. XML_SetEntityDeclHandler(g_parser, dummy_entity_decl_handler);
  7994. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  7995. != XML_STATUS_ERROR)
  7996. break;
  7997. /* See comment in test_alloc_parse_xdecl() */
  7998. alloc_teardown();
  7999. alloc_setup();
  8000. }
  8001. if (i == 0)
  8002. fail("Parse succeeded despite allocation failures");
  8003. if (i == max_alloc_count)
  8004. fail("Parse failed at maximum allocation count");
  8005. if (dummy_handler_flags
  8006. != (DUMMY_ENTITY_DECL_HANDLER_FLAG | DUMMY_NOTATION_DECL_HANDLER_FLAG))
  8007. fail("Entity declaration handler not called");
  8008. }
  8009. END_TEST
  8010. /* Test public notation with dodgy allocator */
  8011. START_TEST(test_alloc_public_notation) {
  8012. const char *text
  8013. = "<!DOCTYPE doc [\n"
  8014. "<!NOTATION note PUBLIC '"
  8015. /* 64 characters per line */
  8016. "http://example.com/a/long/enough/name/to/trigger/pool/growth/zz/"
  8017. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8018. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8019. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8020. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8021. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8022. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8023. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8024. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8025. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8026. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8027. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8028. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8029. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8030. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8031. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8032. "' 'foo'>\n"
  8033. "<!ENTITY e SYSTEM 'http://example.com/e' NDATA note>\n"
  8034. "<!ELEMENT doc EMPTY>\n"
  8035. "]>\n<doc/>";
  8036. int i;
  8037. const int max_alloc_count = 20;
  8038. for (i = 0; i < max_alloc_count; i++) {
  8039. allocation_count = i;
  8040. dummy_handler_flags = 0;
  8041. XML_SetNotationDeclHandler(g_parser, dummy_notation_decl_handler);
  8042. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8043. != XML_STATUS_ERROR)
  8044. break;
  8045. /* See comment in test_alloc_parse_xdecl() */
  8046. alloc_teardown();
  8047. alloc_setup();
  8048. }
  8049. if (i == 0)
  8050. fail("Parse succeeded despite allocation failures");
  8051. if (i == max_alloc_count)
  8052. fail("Parse failed at maximum allocation count");
  8053. if (dummy_handler_flags != DUMMY_NOTATION_DECL_HANDLER_FLAG)
  8054. fail("Notation handler not called");
  8055. }
  8056. END_TEST
  8057. /* Test public notation with dodgy allocator */
  8058. START_TEST(test_alloc_system_notation) {
  8059. const char *text
  8060. = "<!DOCTYPE doc [\n"
  8061. "<!NOTATION note SYSTEM '"
  8062. /* 64 characters per line */
  8063. "http://example.com/a/long/enough/name/to/trigger/pool/growth/zz/"
  8064. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8065. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8066. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8067. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8068. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8069. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8070. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8071. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8072. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8073. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8074. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8075. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8076. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8077. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8078. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  8079. "'>\n"
  8080. "<!ENTITY e SYSTEM 'http://example.com/e' NDATA note>\n"
  8081. "<!ELEMENT doc EMPTY>\n"
  8082. "]>\n<doc/>";
  8083. int i;
  8084. const int max_alloc_count = 20;
  8085. for (i = 0; i < max_alloc_count; i++) {
  8086. allocation_count = i;
  8087. dummy_handler_flags = 0;
  8088. XML_SetNotationDeclHandler(g_parser, dummy_notation_decl_handler);
  8089. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8090. != XML_STATUS_ERROR)
  8091. break;
  8092. /* See comment in test_alloc_parse_xdecl() */
  8093. alloc_teardown();
  8094. alloc_setup();
  8095. }
  8096. if (i == 0)
  8097. fail("Parse succeeded despite allocation failures");
  8098. if (i == max_alloc_count)
  8099. fail("Parse failed at maximum allocation count");
  8100. if (dummy_handler_flags != DUMMY_NOTATION_DECL_HANDLER_FLAG)
  8101. fail("Notation handler not called");
  8102. }
  8103. END_TEST
  8104. START_TEST(test_alloc_nested_groups) {
  8105. const char *text
  8106. = "<!DOCTYPE doc [\n"
  8107. "<!ELEMENT doc "
  8108. /* Sixteen elements per line */
  8109. "(e,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,"
  8110. "(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?"
  8111. "))))))))))))))))))))))))))))))))>\n"
  8112. "<!ELEMENT e EMPTY>"
  8113. "]>\n"
  8114. "<doc><e/></doc>";
  8115. CharData storage;
  8116. int i;
  8117. const int max_alloc_count = 20;
  8118. for (i = 0; i < max_alloc_count; i++) {
  8119. allocation_count = i;
  8120. CharData_Init(&storage);
  8121. XML_SetElementDeclHandler(g_parser, dummy_element_decl_handler);
  8122. XML_SetStartElementHandler(g_parser, record_element_start_handler);
  8123. XML_SetUserData(g_parser, &storage);
  8124. dummy_handler_flags = 0;
  8125. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8126. != XML_STATUS_ERROR)
  8127. break;
  8128. /* See comment in test_alloc_parse_xdecl() */
  8129. alloc_teardown();
  8130. alloc_setup();
  8131. }
  8132. if (i == 0)
  8133. fail("Parse succeeded despite failing reallocator");
  8134. if (i == max_alloc_count)
  8135. fail("Parse failed at maximum reallocation count");
  8136. CharData_CheckXMLChars(&storage, XCS("doce"));
  8137. if (dummy_handler_flags != DUMMY_ELEMENT_DECL_HANDLER_FLAG)
  8138. fail("Element handler not fired");
  8139. }
  8140. END_TEST
  8141. START_TEST(test_alloc_realloc_nested_groups) {
  8142. const char *text
  8143. = "<!DOCTYPE doc [\n"
  8144. "<!ELEMENT doc "
  8145. /* Sixteen elements per line */
  8146. "(e,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,"
  8147. "(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?,(e?"
  8148. "))))))))))))))))))))))))))))))))>\n"
  8149. "<!ELEMENT e EMPTY>"
  8150. "]>\n"
  8151. "<doc><e/></doc>";
  8152. CharData storage;
  8153. int i;
  8154. const int max_realloc_count = 10;
  8155. for (i = 0; i < max_realloc_count; i++) {
  8156. reallocation_count = i;
  8157. CharData_Init(&storage);
  8158. XML_SetElementDeclHandler(g_parser, dummy_element_decl_handler);
  8159. XML_SetStartElementHandler(g_parser, record_element_start_handler);
  8160. XML_SetUserData(g_parser, &storage);
  8161. dummy_handler_flags = 0;
  8162. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8163. != XML_STATUS_ERROR)
  8164. break;
  8165. /* See comment in test_alloc_parse_xdecl() */
  8166. alloc_teardown();
  8167. alloc_setup();
  8168. }
  8169. if (i == 0)
  8170. fail("Parse succeeded despite failing reallocator");
  8171. if (i == max_realloc_count)
  8172. fail("Parse failed at maximum reallocation count");
  8173. CharData_CheckXMLChars(&storage, XCS("doce"));
  8174. if (dummy_handler_flags != DUMMY_ELEMENT_DECL_HANDLER_FLAG)
  8175. fail("Element handler not fired");
  8176. }
  8177. END_TEST
  8178. START_TEST(test_alloc_large_group) {
  8179. const char *text = "<!DOCTYPE doc [\n"
  8180. "<!ELEMENT doc ("
  8181. "a1|a2|a3|a4|a5|a6|a7|a8|"
  8182. "b1|b2|b3|b4|b5|b6|b7|b8|"
  8183. "c1|c2|c3|c4|c5|c6|c7|c8|"
  8184. "d1|d2|d3|d4|d5|d6|d7|d8|"
  8185. "e1"
  8186. ")+>\n"
  8187. "]>\n"
  8188. "<doc>\n"
  8189. "<a1/>\n"
  8190. "</doc>\n";
  8191. int i;
  8192. const int max_alloc_count = 50;
  8193. for (i = 0; i < max_alloc_count; i++) {
  8194. allocation_count = i;
  8195. XML_SetElementDeclHandler(g_parser, dummy_element_decl_handler);
  8196. dummy_handler_flags = 0;
  8197. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8198. != XML_STATUS_ERROR)
  8199. break;
  8200. /* See comment in test_alloc_parse_xdecl() */
  8201. alloc_teardown();
  8202. alloc_setup();
  8203. }
  8204. if (i == 0)
  8205. fail("Parse succeeded despite failing allocator");
  8206. if (i == max_alloc_count)
  8207. fail("Parse failed at maximum allocation count");
  8208. if (dummy_handler_flags != DUMMY_ELEMENT_DECL_HANDLER_FLAG)
  8209. fail("Element handler flag not raised");
  8210. }
  8211. END_TEST
  8212. START_TEST(test_alloc_realloc_group_choice) {
  8213. const char *text = "<!DOCTYPE doc [\n"
  8214. "<!ELEMENT doc ("
  8215. "a1|a2|a3|a4|a5|a6|a7|a8|"
  8216. "b1|b2|b3|b4|b5|b6|b7|b8|"
  8217. "c1|c2|c3|c4|c5|c6|c7|c8|"
  8218. "d1|d2|d3|d4|d5|d6|d7|d8|"
  8219. "e1"
  8220. ")+>\n"
  8221. "]>\n"
  8222. "<doc>\n"
  8223. "<a1/>\n"
  8224. "<b2 attr='foo'>This is a foo</b2>\n"
  8225. "<c3></c3>\n"
  8226. "</doc>\n";
  8227. int i;
  8228. const int max_realloc_count = 10;
  8229. for (i = 0; i < max_realloc_count; i++) {
  8230. reallocation_count = i;
  8231. XML_SetElementDeclHandler(g_parser, dummy_element_decl_handler);
  8232. dummy_handler_flags = 0;
  8233. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8234. != XML_STATUS_ERROR)
  8235. break;
  8236. /* See comment in test_alloc_parse_xdecl() */
  8237. alloc_teardown();
  8238. alloc_setup();
  8239. }
  8240. if (i == 0)
  8241. fail("Parse succeeded despite failing reallocator");
  8242. if (i == max_realloc_count)
  8243. fail("Parse failed at maximum reallocation count");
  8244. if (dummy_handler_flags != DUMMY_ELEMENT_DECL_HANDLER_FLAG)
  8245. fail("Element handler flag not raised");
  8246. }
  8247. END_TEST
  8248. START_TEST(test_alloc_pi_in_epilog) {
  8249. const char *text = "<doc></doc>\n"
  8250. "<?pi in epilog?>";
  8251. int i;
  8252. const int max_alloc_count = 15;
  8253. for (i = 0; i < max_alloc_count; i++) {
  8254. allocation_count = i;
  8255. XML_SetProcessingInstructionHandler(g_parser, dummy_pi_handler);
  8256. dummy_handler_flags = 0;
  8257. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8258. != XML_STATUS_ERROR)
  8259. break;
  8260. /* See comment in test_alloc_parse_xdecl() */
  8261. alloc_teardown();
  8262. alloc_setup();
  8263. }
  8264. if (i == 0)
  8265. fail("Parse completed despite failing allocator");
  8266. if (i == max_alloc_count)
  8267. fail("Parse failed at maximum allocation count");
  8268. if (dummy_handler_flags != DUMMY_PI_HANDLER_FLAG)
  8269. fail("Processing instruction handler not invoked");
  8270. }
  8271. END_TEST
  8272. START_TEST(test_alloc_comment_in_epilog) {
  8273. const char *text = "<doc></doc>\n"
  8274. "<!-- comment in epilog -->";
  8275. int i;
  8276. const int max_alloc_count = 15;
  8277. for (i = 0; i < max_alloc_count; i++) {
  8278. allocation_count = i;
  8279. XML_SetCommentHandler(g_parser, dummy_comment_handler);
  8280. dummy_handler_flags = 0;
  8281. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8282. != XML_STATUS_ERROR)
  8283. break;
  8284. /* See comment in test_alloc_parse_xdecl() */
  8285. alloc_teardown();
  8286. alloc_setup();
  8287. }
  8288. if (i == 0)
  8289. fail("Parse completed despite failing allocator");
  8290. if (i == max_alloc_count)
  8291. fail("Parse failed at maximum allocation count");
  8292. if (dummy_handler_flags != DUMMY_COMMENT_HANDLER_FLAG)
  8293. fail("Processing instruction handler not invoked");
  8294. }
  8295. END_TEST
  8296. START_TEST(test_alloc_realloc_long_attribute_value) {
  8297. const char *text
  8298. = "<!DOCTYPE doc [<!ENTITY foo '"
  8299. /* Each line is 64 characters */
  8300. "This entity will be substituted as an attribute value, and is "
  8301. "calculated to be exactly long enough that the terminating NUL "
  8302. "that the library adds internally will trigger the string pool to"
  8303. "grow. GHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8304. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8305. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8306. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8307. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8308. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8309. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8310. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8311. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8312. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8313. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8314. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8315. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8316. "'>]>\n"
  8317. "<doc a='&foo;'></doc>";
  8318. int i;
  8319. const int max_realloc_count = 10;
  8320. for (i = 0; i < max_realloc_count; i++) {
  8321. reallocation_count = i;
  8322. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8323. != XML_STATUS_ERROR)
  8324. break;
  8325. /* See comment in test_alloc_parse_xdecl() */
  8326. alloc_teardown();
  8327. alloc_setup();
  8328. }
  8329. if (i == 0)
  8330. fail("Parse succeeded despite failing reallocator");
  8331. if (i == max_realloc_count)
  8332. fail("Parse failed at maximum reallocation count");
  8333. }
  8334. END_TEST
  8335. START_TEST(test_alloc_attribute_whitespace) {
  8336. const char *text = "<doc a=' '></doc>";
  8337. int i;
  8338. const int max_alloc_count = 15;
  8339. for (i = 0; i < max_alloc_count; i++) {
  8340. allocation_count = i;
  8341. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8342. != XML_STATUS_ERROR)
  8343. break;
  8344. /* See comment in test_alloc_parse_xdecl() */
  8345. alloc_teardown();
  8346. alloc_setup();
  8347. }
  8348. if (i == 0)
  8349. fail("Parse succeeded despite failing allocator");
  8350. if (i == max_alloc_count)
  8351. fail("Parse failed at maximum allocation count");
  8352. }
  8353. END_TEST
  8354. START_TEST(test_alloc_attribute_predefined_entity) {
  8355. const char *text = "<doc a='&amp;'></doc>";
  8356. int i;
  8357. const int max_alloc_count = 15;
  8358. for (i = 0; i < max_alloc_count; i++) {
  8359. allocation_count = i;
  8360. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8361. != XML_STATUS_ERROR)
  8362. break;
  8363. /* See comment in test_alloc_parse_xdecl() */
  8364. alloc_teardown();
  8365. alloc_setup();
  8366. }
  8367. if (i == 0)
  8368. fail("Parse succeeded despite failing allocator");
  8369. if (i == max_alloc_count)
  8370. fail("Parse failed at maximum allocation count");
  8371. }
  8372. END_TEST
  8373. /* Test that a character reference at the end of a suitably long
  8374. * default value for an attribute can trigger pool growth, and recovers
  8375. * if the allocator fails on it.
  8376. */
  8377. START_TEST(test_alloc_long_attr_default_with_char_ref) {
  8378. const char *text
  8379. = "<!DOCTYPE doc [<!ATTLIST doc a CDATA '"
  8380. /* 64 characters per line */
  8381. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8382. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8383. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8384. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8385. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8386. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8387. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8388. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8389. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8390. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8391. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8392. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8393. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8394. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8395. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8396. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHI"
  8397. "&#x31;'>]>\n"
  8398. "<doc/>";
  8399. int i;
  8400. const int max_alloc_count = 20;
  8401. for (i = 0; i < max_alloc_count; i++) {
  8402. allocation_count = i;
  8403. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8404. != XML_STATUS_ERROR)
  8405. break;
  8406. /* See comment in test_alloc_parse_xdecl() */
  8407. alloc_teardown();
  8408. alloc_setup();
  8409. }
  8410. if (i == 0)
  8411. fail("Parse succeeded despite failing allocator");
  8412. if (i == max_alloc_count)
  8413. fail("Parse failed at maximum allocation count");
  8414. }
  8415. END_TEST
  8416. /* Test that a long character reference substitution triggers a pool
  8417. * expansion correctly for an attribute value.
  8418. */
  8419. START_TEST(test_alloc_long_attr_value) {
  8420. const char *text
  8421. = "<!DOCTYPE test [<!ENTITY foo '\n"
  8422. /* 64 characters per line */
  8423. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8424. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8425. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8426. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8427. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8428. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8429. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8430. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8431. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8432. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8433. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8434. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8435. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8436. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8437. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8438. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8439. "'>]>\n"
  8440. "<test a='&foo;'/>";
  8441. int i;
  8442. const int max_alloc_count = 25;
  8443. for (i = 0; i < max_alloc_count; i++) {
  8444. allocation_count = i;
  8445. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8446. != XML_STATUS_ERROR)
  8447. break;
  8448. /* See comment in test_alloc_parse_xdecl() */
  8449. alloc_teardown();
  8450. alloc_setup();
  8451. }
  8452. if (i == 0)
  8453. fail("Parse succeeded despite failing allocator");
  8454. if (i == max_alloc_count)
  8455. fail("Parse failed at maximum allocation count");
  8456. }
  8457. END_TEST
  8458. /* Test that an error in a nested parameter entity substitution is
  8459. * handled correctly. It seems unlikely that the code path being
  8460. * exercised can be reached purely by carefully crafted XML, but an
  8461. * allocation error in the right place will definitely do it.
  8462. */
  8463. START_TEST(test_alloc_nested_entities) {
  8464. const char *text = "<!DOCTYPE doc SYSTEM 'http://example.org/one.ent'>\n"
  8465. "<doc />";
  8466. ExtFaults test_data
  8467. = {"<!ENTITY % pe1 '"
  8468. /* 64 characters per line */
  8469. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8470. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8471. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8472. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8473. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8474. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8475. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8476. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8477. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8478. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8479. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8480. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8481. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8482. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8483. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8484. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8485. "'>\n"
  8486. "<!ENTITY % pe2 '%pe1;'>\n"
  8487. "%pe2;",
  8488. "Memory Fail not faulted", NULL, XML_ERROR_NO_MEMORY};
  8489. /* Causes an allocation error in a nested storeEntityValue() */
  8490. allocation_count = 12;
  8491. XML_SetUserData(g_parser, &test_data);
  8492. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  8493. XML_SetExternalEntityRefHandler(g_parser, external_entity_faulter);
  8494. expect_failure(text, XML_ERROR_EXTERNAL_ENTITY_HANDLING,
  8495. "Entity allocation failure not noted");
  8496. }
  8497. END_TEST
  8498. START_TEST(test_alloc_realloc_param_entity_newline) {
  8499. const char *text = "<!DOCTYPE doc SYSTEM 'http://example.org/'>\n"
  8500. "<doc/>";
  8501. char dtd_text[]
  8502. = "<!ENTITY % pe '<!ATTLIST doc att CDATA \""
  8503. /* 64 characters per line */
  8504. "This default value is carefully crafted so that the carriage "
  8505. "return right at the end of the entity string causes an internal "
  8506. "string pool to have to grow. This allows us to test the alloc "
  8507. "failure path from that point. OPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8508. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8509. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8510. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8511. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8512. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8513. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8514. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8515. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8516. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8517. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8518. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8519. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDE"
  8520. "\">\n'>"
  8521. "%pe;\n";
  8522. int i;
  8523. const int max_realloc_count = 5;
  8524. for (i = 0; i < max_realloc_count; i++) {
  8525. reallocation_count = i;
  8526. XML_SetUserData(g_parser, dtd_text);
  8527. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  8528. XML_SetExternalEntityRefHandler(g_parser, external_entity_alloc);
  8529. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8530. != XML_STATUS_ERROR)
  8531. break;
  8532. /* See comment in test_alloc_parse_xdecl() */
  8533. alloc_teardown();
  8534. alloc_setup();
  8535. }
  8536. if (i == 0)
  8537. fail("Parse succeeded despite failing reallocator");
  8538. if (i == max_realloc_count)
  8539. fail("Parse failed at maximum reallocation count");
  8540. }
  8541. END_TEST
  8542. START_TEST(test_alloc_realloc_ce_extends_pe) {
  8543. const char *text = "<!DOCTYPE doc SYSTEM 'http://example.org/'>\n"
  8544. "<doc/>";
  8545. char dtd_text[]
  8546. = "<!ENTITY % pe '<!ATTLIST doc att CDATA \""
  8547. /* 64 characters per line */
  8548. "This default value is carefully crafted so that the character "
  8549. "entity at the end causes an internal string pool to have to "
  8550. "grow. This allows us to test the allocation failure path from "
  8551. "that point onwards. EFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8552. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8553. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8554. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8555. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8556. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8557. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8558. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8559. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8560. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8561. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8562. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  8563. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFG&#x51;"
  8564. "\">\n'>"
  8565. "%pe;\n";
  8566. int i;
  8567. const int max_realloc_count = 5;
  8568. for (i = 0; i < max_realloc_count; i++) {
  8569. reallocation_count = i;
  8570. XML_SetUserData(g_parser, dtd_text);
  8571. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  8572. XML_SetExternalEntityRefHandler(g_parser, external_entity_alloc);
  8573. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8574. != XML_STATUS_ERROR)
  8575. break;
  8576. /* See comment in test_alloc_parse_xdecl() */
  8577. alloc_teardown();
  8578. alloc_setup();
  8579. }
  8580. if (i == 0)
  8581. fail("Parse succeeded despite failing reallocator");
  8582. if (i == max_realloc_count)
  8583. fail("Parse failed at maximum reallocation count");
  8584. }
  8585. END_TEST
  8586. START_TEST(test_alloc_realloc_attributes) {
  8587. const char *text = "<!DOCTYPE doc [\n"
  8588. " <!ATTLIST doc\n"
  8589. " a1 (a|b|c) 'a'\n"
  8590. " a2 (foo|bar) #IMPLIED\n"
  8591. " a3 NMTOKEN #IMPLIED\n"
  8592. " a4 NMTOKENS #IMPLIED\n"
  8593. " a5 ID #IMPLIED\n"
  8594. " a6 IDREF #IMPLIED\n"
  8595. " a7 IDREFS #IMPLIED\n"
  8596. " a8 ENTITY #IMPLIED\n"
  8597. " a9 ENTITIES #IMPLIED\n"
  8598. " a10 CDATA #IMPLIED\n"
  8599. " >]>\n"
  8600. "<doc>wombat</doc>\n";
  8601. int i;
  8602. const int max_realloc_count = 5;
  8603. for (i = 0; i < max_realloc_count; i++) {
  8604. reallocation_count = i;
  8605. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8606. != XML_STATUS_ERROR)
  8607. break;
  8608. /* See comment in test_alloc_parse_xdecl() */
  8609. alloc_teardown();
  8610. alloc_setup();
  8611. }
  8612. if (i == 0)
  8613. fail("Parse succeeded despite failing reallocator");
  8614. if (i == max_realloc_count)
  8615. fail("Parse failed at maximum reallocation count");
  8616. }
  8617. END_TEST
  8618. START_TEST(test_alloc_long_doc_name) {
  8619. const char *text =
  8620. /* 64 characters per line */
  8621. "<LongRootElementNameThatWillCauseTheNextAllocationToExpandTheStr"
  8622. "ingPoolForTheDTDQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8623. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8624. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8625. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8626. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8627. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8628. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8629. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8630. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8631. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8632. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8633. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8634. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8635. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8636. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8637. " a='1'/>";
  8638. int i;
  8639. const int max_alloc_count = 20;
  8640. for (i = 0; i < max_alloc_count; i++) {
  8641. allocation_count = i;
  8642. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8643. != XML_STATUS_ERROR)
  8644. break;
  8645. /* See comment in test_alloc_parse_xdecl() */
  8646. alloc_teardown();
  8647. alloc_setup();
  8648. }
  8649. if (i == 0)
  8650. fail("Parsing worked despite failing reallocations");
  8651. else if (i == max_alloc_count)
  8652. fail("Parsing failed even at max reallocation count");
  8653. }
  8654. END_TEST
  8655. START_TEST(test_alloc_long_base) {
  8656. const char *text = "<!DOCTYPE doc [\n"
  8657. " <!ENTITY e SYSTEM 'foo'>\n"
  8658. "]>\n"
  8659. "<doc>&e;</doc>";
  8660. char entity_text[] = "Hello world";
  8661. const XML_Char *base =
  8662. /* 64 characters per line */
  8663. /* clang-format off */
  8664. XCS("LongBaseURI/that/will/overflow/an/internal/buffer/and/cause/it/t")
  8665. XCS("o/have/to/grow/PQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/")
  8666. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/")
  8667. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/")
  8668. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/")
  8669. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/")
  8670. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/")
  8671. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/")
  8672. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/")
  8673. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/")
  8674. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/")
  8675. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/")
  8676. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/")
  8677. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/")
  8678. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/")
  8679. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/");
  8680. /* clang-format on */
  8681. int i;
  8682. const int max_alloc_count = 25;
  8683. for (i = 0; i < max_alloc_count; i++) {
  8684. allocation_count = i;
  8685. XML_SetUserData(g_parser, entity_text);
  8686. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  8687. XML_SetExternalEntityRefHandler(g_parser, external_entity_alloc);
  8688. if (XML_SetBase(g_parser, base) == XML_STATUS_ERROR) {
  8689. XML_ParserReset(g_parser, NULL);
  8690. continue;
  8691. }
  8692. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8693. != XML_STATUS_ERROR)
  8694. break;
  8695. /* See comment in test_alloc_parse_xdecl() */
  8696. alloc_teardown();
  8697. alloc_setup();
  8698. }
  8699. if (i == 0)
  8700. fail("Parsing worked despite failing allocations");
  8701. else if (i == max_alloc_count)
  8702. fail("Parsing failed even at max allocation count");
  8703. }
  8704. END_TEST
  8705. START_TEST(test_alloc_long_public_id) {
  8706. const char *text
  8707. = "<!DOCTYPE doc [\n"
  8708. " <!ENTITY e PUBLIC '"
  8709. /* 64 characters per line */
  8710. "LongPublicIDThatShouldResultInAnInternalStringPoolGrowingAtASpec"
  8711. "ificMomentKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8712. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8713. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8714. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8715. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8716. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8717. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8718. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8719. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8720. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8721. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8722. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8723. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8724. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8725. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8726. "' 'bar'>\n"
  8727. "]>\n"
  8728. "<doc>&e;</doc>";
  8729. char entity_text[] = "Hello world";
  8730. int i;
  8731. const int max_alloc_count = 40;
  8732. for (i = 0; i < max_alloc_count; i++) {
  8733. allocation_count = i;
  8734. XML_SetUserData(g_parser, entity_text);
  8735. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  8736. XML_SetExternalEntityRefHandler(g_parser, external_entity_alloc);
  8737. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8738. != XML_STATUS_ERROR)
  8739. break;
  8740. /* See comment in test_alloc_parse_xdecl() */
  8741. alloc_teardown();
  8742. alloc_setup();
  8743. }
  8744. if (i == 0)
  8745. fail("Parsing worked despite failing allocations");
  8746. else if (i == max_alloc_count)
  8747. fail("Parsing failed even at max allocation count");
  8748. }
  8749. END_TEST
  8750. START_TEST(test_alloc_long_entity_value) {
  8751. const char *text
  8752. = "<!DOCTYPE doc [\n"
  8753. " <!ENTITY e1 '"
  8754. /* 64 characters per line */
  8755. "Long entity value that should provoke a string pool to grow whil"
  8756. "e setting up to parse the external entity below. xyz0123456789AB"
  8757. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8758. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8759. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8760. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8761. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8762. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8763. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8764. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8765. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8766. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8767. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8768. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8769. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8770. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8771. "'>\n"
  8772. " <!ENTITY e2 SYSTEM 'bar'>\n"
  8773. "]>\n"
  8774. "<doc>&e2;</doc>";
  8775. char entity_text[] = "Hello world";
  8776. int i;
  8777. const int max_alloc_count = 40;
  8778. for (i = 0; i < max_alloc_count; i++) {
  8779. allocation_count = i;
  8780. XML_SetUserData(g_parser, entity_text);
  8781. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  8782. XML_SetExternalEntityRefHandler(g_parser, external_entity_alloc);
  8783. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8784. != XML_STATUS_ERROR)
  8785. break;
  8786. /* See comment in test_alloc_parse_xdecl() */
  8787. alloc_teardown();
  8788. alloc_setup();
  8789. }
  8790. if (i == 0)
  8791. fail("Parsing worked despite failing allocations");
  8792. else if (i == max_alloc_count)
  8793. fail("Parsing failed even at max allocation count");
  8794. }
  8795. END_TEST
  8796. START_TEST(test_alloc_long_notation) {
  8797. const char *text
  8798. = "<!DOCTYPE doc [\n"
  8799. " <!NOTATION note SYSTEM '"
  8800. /* 64 characters per line */
  8801. "ALongNotationNameThatShouldProvokeStringPoolGrowthWhileCallingAn"
  8802. "ExternalEntityParserUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8803. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8804. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8805. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8806. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8807. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8808. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8809. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8810. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8811. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8812. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8813. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8814. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8815. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8816. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8817. "'>\n"
  8818. " <!ENTITY e1 SYSTEM 'foo' NDATA "
  8819. /* 64 characters per line */
  8820. "ALongNotationNameThatShouldProvokeStringPoolGrowthWhileCallingAn"
  8821. "ExternalEntityParserUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8822. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8823. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8824. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8825. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8826. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8827. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8828. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8829. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8830. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8831. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8832. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8833. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8834. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8835. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AB"
  8836. ">\n"
  8837. " <!ENTITY e2 SYSTEM 'bar'>\n"
  8838. "]>\n"
  8839. "<doc>&e2;</doc>";
  8840. ExtOption options[]
  8841. = {{XCS("foo"), "Entity Foo"}, {XCS("bar"), "Entity Bar"}, {NULL, NULL}};
  8842. int i;
  8843. const int max_alloc_count = 40;
  8844. for (i = 0; i < max_alloc_count; i++) {
  8845. allocation_count = i;
  8846. XML_SetUserData(g_parser, options);
  8847. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  8848. XML_SetExternalEntityRefHandler(g_parser, external_entity_optioner);
  8849. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8850. != XML_STATUS_ERROR)
  8851. break;
  8852. /* See comment in test_alloc_parse_xdecl() */
  8853. alloc_teardown();
  8854. alloc_setup();
  8855. }
  8856. if (i == 0)
  8857. fail("Parsing worked despite failing allocations");
  8858. else if (i == max_alloc_count)
  8859. fail("Parsing failed even at max allocation count");
  8860. }
  8861. END_TEST
  8862. static void
  8863. nsalloc_setup(void) {
  8864. XML_Memory_Handling_Suite memsuite = {duff_allocator, duff_reallocator, free};
  8865. XML_Char ns_sep[2] = {' ', '\0'};
  8866. /* Ensure the parser creation will go through */
  8867. allocation_count = ALLOC_ALWAYS_SUCCEED;
  8868. reallocation_count = REALLOC_ALWAYS_SUCCEED;
  8869. g_parser = XML_ParserCreate_MM(NULL, &memsuite, ns_sep);
  8870. if (g_parser == NULL)
  8871. fail("Parser not created");
  8872. }
  8873. static void
  8874. nsalloc_teardown(void) {
  8875. basic_teardown();
  8876. }
  8877. /* Test the effects of allocation failure in simple namespace parsing.
  8878. * Based on test_ns_default_with_empty_uri()
  8879. */
  8880. START_TEST(test_nsalloc_xmlns) {
  8881. const char *text = "<doc xmlns='http://example.org/'>\n"
  8882. " <e xmlns=''/>\n"
  8883. "</doc>";
  8884. unsigned int i;
  8885. const unsigned int max_alloc_count = 30;
  8886. for (i = 0; i < max_alloc_count; i++) {
  8887. allocation_count = i;
  8888. /* Exercise more code paths with a default handler */
  8889. XML_SetDefaultHandler(g_parser, dummy_default_handler);
  8890. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  8891. != XML_STATUS_ERROR)
  8892. break;
  8893. /* Resetting the parser is insufficient, because some memory
  8894. * allocations are cached within the parser. Instead we use
  8895. * the teardown and setup routines to ensure that we have the
  8896. * right sort of parser back in our hands.
  8897. */
  8898. nsalloc_teardown();
  8899. nsalloc_setup();
  8900. }
  8901. if (i == 0)
  8902. fail("Parsing worked despite failing allocations");
  8903. else if (i == max_alloc_count)
  8904. fail("Parsing failed even at maximum allocation count");
  8905. }
  8906. END_TEST
  8907. /* Test XML_ParseBuffer interface with namespace and a dicky allocator */
  8908. START_TEST(test_nsalloc_parse_buffer) {
  8909. const char *text = "<doc>Hello</doc>";
  8910. void *buffer;
  8911. /* Try a parse before the start of the world */
  8912. /* (Exercises new code path) */
  8913. if (XML_ParseBuffer(g_parser, 0, XML_FALSE) != XML_STATUS_ERROR)
  8914. fail("Pre-init XML_ParseBuffer not faulted");
  8915. if (XML_GetErrorCode(g_parser) != XML_ERROR_NO_BUFFER)
  8916. fail("Pre-init XML_ParseBuffer faulted for wrong reason");
  8917. buffer = XML_GetBuffer(g_parser, 1 /* any small number greater than 0 */);
  8918. if (buffer == NULL)
  8919. fail("Could not acquire parse buffer");
  8920. allocation_count = 0;
  8921. if (XML_ParseBuffer(g_parser, 0, XML_FALSE) != XML_STATUS_ERROR)
  8922. fail("Pre-init XML_ParseBuffer not faulted");
  8923. if (XML_GetErrorCode(g_parser) != XML_ERROR_NO_MEMORY)
  8924. fail("Pre-init XML_ParseBuffer faulted for wrong reason");
  8925. /* Now with actual memory allocation */
  8926. allocation_count = ALLOC_ALWAYS_SUCCEED;
  8927. if (XML_ParseBuffer(g_parser, 0, XML_FALSE) != XML_STATUS_OK)
  8928. xml_failure(g_parser);
  8929. /* Check that resuming an unsuspended parser is faulted */
  8930. if (XML_ResumeParser(g_parser) != XML_STATUS_ERROR)
  8931. fail("Resuming unsuspended parser not faulted");
  8932. if (XML_GetErrorCode(g_parser) != XML_ERROR_NOT_SUSPENDED)
  8933. xml_failure(g_parser);
  8934. /* Get the parser into suspended state */
  8935. XML_SetCharacterDataHandler(g_parser, clearing_aborting_character_handler);
  8936. resumable = XML_TRUE;
  8937. buffer = XML_GetBuffer(g_parser, (int)strlen(text));
  8938. if (buffer == NULL)
  8939. fail("Could not acquire parse buffer");
  8940. assert(buffer != NULL);
  8941. memcpy(buffer, text, strlen(text));
  8942. if (XML_ParseBuffer(g_parser, (int)strlen(text), XML_TRUE)
  8943. != XML_STATUS_SUSPENDED)
  8944. xml_failure(g_parser);
  8945. if (XML_GetErrorCode(g_parser) != XML_ERROR_NONE)
  8946. xml_failure(g_parser);
  8947. if (XML_ParseBuffer(g_parser, (int)strlen(text), XML_TRUE)
  8948. != XML_STATUS_ERROR)
  8949. fail("Suspended XML_ParseBuffer not faulted");
  8950. if (XML_GetErrorCode(g_parser) != XML_ERROR_SUSPENDED)
  8951. xml_failure(g_parser);
  8952. if (XML_GetBuffer(g_parser, (int)strlen(text)) != NULL)
  8953. fail("Suspended XML_GetBuffer not faulted");
  8954. /* Get it going again and complete the world */
  8955. XML_SetCharacterDataHandler(g_parser, NULL);
  8956. if (XML_ResumeParser(g_parser) != XML_STATUS_OK)
  8957. xml_failure(g_parser);
  8958. if (XML_ParseBuffer(g_parser, (int)strlen(text), XML_TRUE)
  8959. != XML_STATUS_ERROR)
  8960. fail("Post-finishing XML_ParseBuffer not faulted");
  8961. if (XML_GetErrorCode(g_parser) != XML_ERROR_FINISHED)
  8962. xml_failure(g_parser);
  8963. if (XML_GetBuffer(g_parser, (int)strlen(text)) != NULL)
  8964. fail("Post-finishing XML_GetBuffer not faulted");
  8965. }
  8966. END_TEST
  8967. /* Check handling of long prefix names (pool growth) */
  8968. START_TEST(test_nsalloc_long_prefix) {
  8969. const char *text
  8970. = "<"
  8971. /* 64 characters per line */
  8972. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8973. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8974. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8975. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8976. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8977. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8978. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8979. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8980. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8981. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8982. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8983. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8984. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8985. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8986. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8987. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8988. ":foo xmlns:"
  8989. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8990. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8991. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8992. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8993. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8994. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8995. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8996. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8997. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8998. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  8999. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9000. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9001. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9002. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9003. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9004. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9005. "='http://example.org/'>"
  9006. "</"
  9007. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9008. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9009. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9010. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9011. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9012. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9013. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9014. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9015. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9016. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9017. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9018. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9019. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9020. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9021. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9022. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9023. ":foo>";
  9024. int i;
  9025. const int max_alloc_count = 40;
  9026. for (i = 0; i < max_alloc_count; i++) {
  9027. allocation_count = i;
  9028. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  9029. != XML_STATUS_ERROR)
  9030. break;
  9031. /* See comment in test_nsalloc_xmlns() */
  9032. nsalloc_teardown();
  9033. nsalloc_setup();
  9034. }
  9035. if (i == 0)
  9036. fail("Parsing worked despite failing allocations");
  9037. else if (i == max_alloc_count)
  9038. fail("Parsing failed even at max allocation count");
  9039. }
  9040. END_TEST
  9041. /* Check handling of long uri names (pool growth) */
  9042. START_TEST(test_nsalloc_long_uri) {
  9043. const char *text
  9044. = "<foo:e xmlns:foo='http://example.org/"
  9045. /* 64 characters per line */
  9046. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9047. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9048. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9049. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9050. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9051. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9052. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9053. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9054. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9055. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9056. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9057. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9058. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9059. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9060. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9061. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9062. "' bar:a='12'\n"
  9063. "xmlns:bar='http://example.org/"
  9064. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9065. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9066. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9067. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9068. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9069. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9070. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9071. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9072. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9073. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9074. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9075. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9076. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9077. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9078. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9079. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789A/"
  9080. "'>"
  9081. "</foo:e>";
  9082. int i;
  9083. const int max_alloc_count = 40;
  9084. for (i = 0; i < max_alloc_count; i++) {
  9085. allocation_count = i;
  9086. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  9087. != XML_STATUS_ERROR)
  9088. break;
  9089. /* See comment in test_nsalloc_xmlns() */
  9090. nsalloc_teardown();
  9091. nsalloc_setup();
  9092. }
  9093. if (i == 0)
  9094. fail("Parsing worked despite failing allocations");
  9095. else if (i == max_alloc_count)
  9096. fail("Parsing failed even at max allocation count");
  9097. }
  9098. END_TEST
  9099. /* Test handling of long attribute names with prefixes */
  9100. START_TEST(test_nsalloc_long_attr) {
  9101. const char *text
  9102. = "<foo:e xmlns:foo='http://example.org/' bar:"
  9103. /* 64 characters per line */
  9104. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9105. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9106. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9107. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9108. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9109. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9110. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9111. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9112. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9113. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9114. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9115. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9116. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9117. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9118. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9119. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9120. "='12'\n"
  9121. "xmlns:bar='http://example.org/'>"
  9122. "</foo:e>";
  9123. int i;
  9124. const int max_alloc_count = 40;
  9125. for (i = 0; i < max_alloc_count; i++) {
  9126. allocation_count = i;
  9127. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  9128. != XML_STATUS_ERROR)
  9129. break;
  9130. /* See comment in test_nsalloc_xmlns() */
  9131. nsalloc_teardown();
  9132. nsalloc_setup();
  9133. }
  9134. if (i == 0)
  9135. fail("Parsing worked despite failing allocations");
  9136. else if (i == max_alloc_count)
  9137. fail("Parsing failed even at max allocation count");
  9138. }
  9139. END_TEST
  9140. /* Test handling of an attribute name with a long namespace prefix */
  9141. START_TEST(test_nsalloc_long_attr_prefix) {
  9142. const char *text
  9143. = "<foo:e xmlns:foo='http://example.org/' "
  9144. /* 64 characters per line */
  9145. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9146. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9147. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9148. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9149. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9150. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9151. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9152. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9153. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9154. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9155. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9156. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9157. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9158. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9159. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9160. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9161. ":a='12'\n"
  9162. "xmlns:"
  9163. /* 64 characters per line */
  9164. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9165. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9166. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9167. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9168. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9169. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9170. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9171. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9172. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9173. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9174. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9175. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9176. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9177. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9178. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9179. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9180. "='http://example.org/'>"
  9181. "</foo:e>";
  9182. const XML_Char *elemstr[] = {
  9183. /* clang-format off */
  9184. XCS("http://example.org/ e foo"),
  9185. XCS("http://example.org/ a ")
  9186. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ")
  9187. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ")
  9188. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ")
  9189. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ")
  9190. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ")
  9191. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ")
  9192. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ")
  9193. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ")
  9194. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ")
  9195. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ")
  9196. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ")
  9197. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ")
  9198. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ")
  9199. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ")
  9200. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ")
  9201. XCS("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ")
  9202. /* clang-format on */
  9203. };
  9204. int i;
  9205. const int max_alloc_count = 40;
  9206. for (i = 0; i < max_alloc_count; i++) {
  9207. allocation_count = i;
  9208. XML_SetReturnNSTriplet(g_parser, XML_TRUE);
  9209. XML_SetUserData(g_parser, (void *)elemstr);
  9210. XML_SetElementHandler(g_parser, triplet_start_checker, triplet_end_checker);
  9211. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  9212. != XML_STATUS_ERROR)
  9213. break;
  9214. /* See comment in test_nsalloc_xmlns() */
  9215. nsalloc_teardown();
  9216. nsalloc_setup();
  9217. }
  9218. if (i == 0)
  9219. fail("Parsing worked despite failing allocations");
  9220. else if (i == max_alloc_count)
  9221. fail("Parsing failed even at max allocation count");
  9222. }
  9223. END_TEST
  9224. /* Test attribute handling in the face of a dodgy reallocator */
  9225. START_TEST(test_nsalloc_realloc_attributes) {
  9226. const char *text = "<foo:e xmlns:foo='http://example.org/' bar:a='12'\n"
  9227. " xmlns:bar='http://example.org/'>"
  9228. "</foo:e>";
  9229. int i;
  9230. const int max_realloc_count = 10;
  9231. for (i = 0; i < max_realloc_count; i++) {
  9232. reallocation_count = i;
  9233. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  9234. != XML_STATUS_ERROR)
  9235. break;
  9236. /* See comment in test_nsalloc_xmlns() */
  9237. nsalloc_teardown();
  9238. nsalloc_setup();
  9239. }
  9240. if (i == 0)
  9241. fail("Parsing worked despite failing reallocations");
  9242. else if (i == max_realloc_count)
  9243. fail("Parsing failed at max reallocation count");
  9244. }
  9245. END_TEST
  9246. /* Test long element names with namespaces under a failing allocator */
  9247. START_TEST(test_nsalloc_long_element) {
  9248. const char *text
  9249. = "<foo:thisisalongenoughelementnametotriggerareallocation\n"
  9250. " xmlns:foo='http://example.org/' bar:a='12'\n"
  9251. " xmlns:bar='http://example.org/'>"
  9252. "</foo:thisisalongenoughelementnametotriggerareallocation>";
  9253. const XML_Char *elemstr[]
  9254. = {XCS("http://example.org/")
  9255. XCS(" thisisalongenoughelementnametotriggerareallocation foo"),
  9256. XCS("http://example.org/ a bar")};
  9257. int i;
  9258. const int max_alloc_count = 30;
  9259. for (i = 0; i < max_alloc_count; i++) {
  9260. allocation_count = i;
  9261. XML_SetReturnNSTriplet(g_parser, XML_TRUE);
  9262. XML_SetUserData(g_parser, (void *)elemstr);
  9263. XML_SetElementHandler(g_parser, triplet_start_checker, triplet_end_checker);
  9264. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  9265. != XML_STATUS_ERROR)
  9266. break;
  9267. /* See comment in test_nsalloc_xmlns() */
  9268. nsalloc_teardown();
  9269. nsalloc_setup();
  9270. }
  9271. if (i == 0)
  9272. fail("Parsing worked despite failing reallocations");
  9273. else if (i == max_alloc_count)
  9274. fail("Parsing failed at max reallocation count");
  9275. }
  9276. END_TEST
  9277. /* Test the effects of reallocation failure when reassigning a
  9278. * binding.
  9279. *
  9280. * XML_ParserReset does not free the BINDING structures used by a
  9281. * parser, but instead adds them to an internal free list to be reused
  9282. * as necessary. Likewise the URI buffers allocated for the binding
  9283. * aren't freed, but kept attached to their existing binding. If the
  9284. * new binding has a longer URI, it will need reallocation. This test
  9285. * provokes that reallocation, and tests the control path if it fails.
  9286. */
  9287. START_TEST(test_nsalloc_realloc_binding_uri) {
  9288. const char *first = "<doc xmlns='http://example.org/'>\n"
  9289. " <e xmlns='' />\n"
  9290. "</doc>";
  9291. const char *second
  9292. = "<doc xmlns='http://example.org/long/enough/URI/to/reallocate/'>\n"
  9293. " <e xmlns='' />\n"
  9294. "</doc>";
  9295. unsigned i;
  9296. const unsigned max_realloc_count = 10;
  9297. /* First, do a full parse that will leave bindings around */
  9298. if (_XML_Parse_SINGLE_BYTES(g_parser, first, (int)strlen(first), XML_TRUE)
  9299. == XML_STATUS_ERROR)
  9300. xml_failure(g_parser);
  9301. /* Now repeat with a longer URI and a duff reallocator */
  9302. for (i = 0; i < max_realloc_count; i++) {
  9303. XML_ParserReset(g_parser, NULL);
  9304. reallocation_count = i;
  9305. if (_XML_Parse_SINGLE_BYTES(g_parser, second, (int)strlen(second), XML_TRUE)
  9306. != XML_STATUS_ERROR)
  9307. break;
  9308. }
  9309. if (i == 0)
  9310. fail("Parsing worked despite failing reallocation");
  9311. else if (i == max_realloc_count)
  9312. fail("Parsing failed at max reallocation count");
  9313. }
  9314. END_TEST
  9315. /* Check handling of long prefix names (pool growth) */
  9316. START_TEST(test_nsalloc_realloc_long_prefix) {
  9317. const char *text
  9318. = "<"
  9319. /* 64 characters per line */
  9320. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9321. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9322. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9323. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9324. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9325. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9326. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9327. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9328. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9329. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9330. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9331. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9332. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9333. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9334. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9335. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9336. ":foo xmlns:"
  9337. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9338. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9339. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9340. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9341. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9342. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9343. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9344. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9345. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9346. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9347. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9348. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9349. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9350. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9351. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9352. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9353. "='http://example.org/'>"
  9354. "</"
  9355. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9356. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9357. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9358. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9359. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9360. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9361. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9362. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9363. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9364. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9365. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9366. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9367. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9368. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9369. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9370. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9371. ":foo>";
  9372. int i;
  9373. const int max_realloc_count = 12;
  9374. for (i = 0; i < max_realloc_count; i++) {
  9375. reallocation_count = i;
  9376. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  9377. != XML_STATUS_ERROR)
  9378. break;
  9379. /* See comment in test_nsalloc_xmlns() */
  9380. nsalloc_teardown();
  9381. nsalloc_setup();
  9382. }
  9383. if (i == 0)
  9384. fail("Parsing worked despite failing reallocations");
  9385. else if (i == max_realloc_count)
  9386. fail("Parsing failed even at max reallocation count");
  9387. }
  9388. END_TEST
  9389. /* Check handling of even long prefix names (different code path) */
  9390. START_TEST(test_nsalloc_realloc_longer_prefix) {
  9391. const char *text
  9392. = "<"
  9393. /* 64 characters per line */
  9394. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9395. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9396. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9397. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9398. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9399. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9400. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9401. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9402. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9403. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9404. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9405. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9406. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9407. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9408. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9409. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9410. "Q:foo xmlns:"
  9411. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9412. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9413. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9414. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9415. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9416. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9417. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9418. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9419. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9420. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9421. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9422. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9423. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9424. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9425. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9426. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9427. "Q='http://example.org/'>"
  9428. "</"
  9429. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9430. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9431. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9432. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9433. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9434. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9435. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9436. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9437. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9438. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9439. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9440. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9441. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9442. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9443. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9444. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9445. "Q:foo>";
  9446. int i;
  9447. const int max_realloc_count = 12;
  9448. for (i = 0; i < max_realloc_count; i++) {
  9449. reallocation_count = i;
  9450. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  9451. != XML_STATUS_ERROR)
  9452. break;
  9453. /* See comment in test_nsalloc_xmlns() */
  9454. nsalloc_teardown();
  9455. nsalloc_setup();
  9456. }
  9457. if (i == 0)
  9458. fail("Parsing worked despite failing reallocations");
  9459. else if (i == max_realloc_count)
  9460. fail("Parsing failed even at max reallocation count");
  9461. }
  9462. END_TEST
  9463. START_TEST(test_nsalloc_long_namespace) {
  9464. const char *text1
  9465. = "<"
  9466. /* 64 characters per line */
  9467. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9468. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9469. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9470. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9471. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9472. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9473. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9474. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9475. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9476. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9477. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9478. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9479. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9480. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9481. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9482. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9483. ":e xmlns:"
  9484. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9485. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9486. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9487. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9488. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9489. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9490. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9491. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9492. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9493. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9494. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9495. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9496. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9497. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9498. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9499. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9500. "='http://example.org/'>\n";
  9501. const char *text2
  9502. = "<"
  9503. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9504. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9505. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9506. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9507. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9508. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9509. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9510. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9511. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9512. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9513. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9514. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9515. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9516. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9517. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9518. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9519. ":f "
  9520. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9521. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9522. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9523. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9524. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9525. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9526. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9527. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9528. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9529. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9530. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9531. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9532. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9533. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9534. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9535. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9536. ":attr='foo'/>\n"
  9537. "</"
  9538. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9539. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9540. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9541. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9542. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9543. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9544. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9545. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9546. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9547. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9548. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9549. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9550. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9551. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9552. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9553. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9554. ":e>";
  9555. int i;
  9556. const int max_alloc_count = 40;
  9557. for (i = 0; i < max_alloc_count; i++) {
  9558. allocation_count = i;
  9559. if (_XML_Parse_SINGLE_BYTES(g_parser, text1, (int)strlen(text1), XML_FALSE)
  9560. != XML_STATUS_ERROR
  9561. && _XML_Parse_SINGLE_BYTES(g_parser, text2, (int)strlen(text2),
  9562. XML_TRUE)
  9563. != XML_STATUS_ERROR)
  9564. break;
  9565. /* See comment in test_nsalloc_xmlns() */
  9566. nsalloc_teardown();
  9567. nsalloc_setup();
  9568. }
  9569. if (i == 0)
  9570. fail("Parsing worked despite failing allocations");
  9571. else if (i == max_alloc_count)
  9572. fail("Parsing failed even at max allocation count");
  9573. }
  9574. END_TEST
  9575. /* Using a slightly shorter namespace name provokes allocations in
  9576. * slightly different places in the code.
  9577. */
  9578. START_TEST(test_nsalloc_less_long_namespace) {
  9579. const char *text
  9580. = "<"
  9581. /* 64 characters per line */
  9582. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9583. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9584. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9585. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9586. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9587. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9588. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9589. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz012345678"
  9590. ":e xmlns:"
  9591. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9592. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9593. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9594. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9595. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9596. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9597. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9598. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz012345678"
  9599. "='http://example.org/'>\n"
  9600. "<"
  9601. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9602. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9603. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9604. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9605. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9606. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9607. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9608. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz012345678"
  9609. ":f "
  9610. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9611. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9612. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9613. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9614. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9615. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9616. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9617. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz012345678"
  9618. ":att='foo'/>\n"
  9619. "</"
  9620. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9621. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9622. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9623. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9624. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9625. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9626. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789AZ"
  9627. "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz012345678"
  9628. ":e>";
  9629. int i;
  9630. const int max_alloc_count = 40;
  9631. for (i = 0; i < max_alloc_count; i++) {
  9632. allocation_count = i;
  9633. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  9634. != XML_STATUS_ERROR)
  9635. break;
  9636. /* See comment in test_nsalloc_xmlns() */
  9637. nsalloc_teardown();
  9638. nsalloc_setup();
  9639. }
  9640. if (i == 0)
  9641. fail("Parsing worked despite failing allocations");
  9642. else if (i == max_alloc_count)
  9643. fail("Parsing failed even at max allocation count");
  9644. }
  9645. END_TEST
  9646. START_TEST(test_nsalloc_long_context) {
  9647. const char *text
  9648. = "<!DOCTYPE doc SYSTEM 'foo' [\n"
  9649. " <!ATTLIST doc baz ID #REQUIRED>\n"
  9650. " <!ENTITY en SYSTEM 'bar'>\n"
  9651. "]>\n"
  9652. "<doc xmlns='http://example.org/"
  9653. /* 64 characters per line */
  9654. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9655. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9656. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9657. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9658. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9659. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9660. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9661. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9662. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9663. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9664. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9665. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9666. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9667. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9668. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9669. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKL"
  9670. "' baz='2'>\n"
  9671. "&en;"
  9672. "</doc>";
  9673. ExtOption options[] = {
  9674. {XCS("foo"), "<!ELEMENT e EMPTY>"}, {XCS("bar"), "<e/>"}, {NULL, NULL}};
  9675. int i;
  9676. const int max_alloc_count = 70;
  9677. for (i = 0; i < max_alloc_count; i++) {
  9678. allocation_count = i;
  9679. XML_SetUserData(g_parser, options);
  9680. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  9681. XML_SetExternalEntityRefHandler(g_parser, external_entity_optioner);
  9682. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  9683. != XML_STATUS_ERROR)
  9684. break;
  9685. /* See comment in test_nsalloc_xmlns() */
  9686. nsalloc_teardown();
  9687. nsalloc_setup();
  9688. }
  9689. if (i == 0)
  9690. fail("Parsing worked despite failing allocations");
  9691. else if (i == max_alloc_count)
  9692. fail("Parsing failed even at max allocation count");
  9693. }
  9694. END_TEST
  9695. /* This function is void; it will throw a fail() on error, so if it
  9696. * returns normally it must have succeeded.
  9697. */
  9698. static void
  9699. context_realloc_test(const char *text) {
  9700. ExtOption options[] = {
  9701. {XCS("foo"), "<!ELEMENT e EMPTY>"}, {XCS("bar"), "<e/>"}, {NULL, NULL}};
  9702. int i;
  9703. const int max_realloc_count = 6;
  9704. for (i = 0; i < max_realloc_count; i++) {
  9705. reallocation_count = i;
  9706. XML_SetUserData(g_parser, options);
  9707. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  9708. XML_SetExternalEntityRefHandler(g_parser, external_entity_optioner);
  9709. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  9710. != XML_STATUS_ERROR)
  9711. break;
  9712. /* See comment in test_nsalloc_xmlns() */
  9713. nsalloc_teardown();
  9714. nsalloc_setup();
  9715. }
  9716. if (i == 0)
  9717. fail("Parsing worked despite failing reallocations");
  9718. else if (i == max_realloc_count)
  9719. fail("Parsing failed even at max reallocation count");
  9720. }
  9721. START_TEST(test_nsalloc_realloc_long_context) {
  9722. const char *text
  9723. = "<!DOCTYPE doc SYSTEM 'foo' [\n"
  9724. " <!ENTITY en SYSTEM 'bar'>\n"
  9725. "]>\n"
  9726. "<doc xmlns='http://example.org/"
  9727. /* 64 characters per line */
  9728. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9729. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9730. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9731. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9732. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9733. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9734. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9735. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9736. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9737. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9738. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9739. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9740. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9741. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9742. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9743. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKL"
  9744. "'>\n"
  9745. "&en;"
  9746. "</doc>";
  9747. context_realloc_test(text);
  9748. }
  9749. END_TEST
  9750. START_TEST(test_nsalloc_realloc_long_context_2) {
  9751. const char *text
  9752. = "<!DOCTYPE doc SYSTEM 'foo' [\n"
  9753. " <!ENTITY en SYSTEM 'bar'>\n"
  9754. "]>\n"
  9755. "<doc xmlns='http://example.org/"
  9756. /* 64 characters per line */
  9757. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9758. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9759. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9760. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9761. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9762. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9763. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9764. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9765. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9766. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9767. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9768. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9769. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9770. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9771. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9772. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJK"
  9773. "'>\n"
  9774. "&en;"
  9775. "</doc>";
  9776. context_realloc_test(text);
  9777. }
  9778. END_TEST
  9779. START_TEST(test_nsalloc_realloc_long_context_3) {
  9780. const char *text
  9781. = "<!DOCTYPE doc SYSTEM 'foo' [\n"
  9782. " <!ENTITY en SYSTEM 'bar'>\n"
  9783. "]>\n"
  9784. "<doc xmlns='http://example.org/"
  9785. /* 64 characters per line */
  9786. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9787. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9788. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9789. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9790. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9791. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9792. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9793. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9794. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9795. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9796. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9797. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9798. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9799. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9800. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9801. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGH"
  9802. "'>\n"
  9803. "&en;"
  9804. "</doc>";
  9805. context_realloc_test(text);
  9806. }
  9807. END_TEST
  9808. START_TEST(test_nsalloc_realloc_long_context_4) {
  9809. const char *text
  9810. = "<!DOCTYPE doc SYSTEM 'foo' [\n"
  9811. " <!ENTITY en SYSTEM 'bar'>\n"
  9812. "]>\n"
  9813. "<doc xmlns='http://example.org/"
  9814. /* 64 characters per line */
  9815. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9816. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9817. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9818. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9819. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9820. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9821. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9822. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9823. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9824. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9825. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9826. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9827. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9828. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9829. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9830. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO"
  9831. "'>\n"
  9832. "&en;"
  9833. "</doc>";
  9834. context_realloc_test(text);
  9835. }
  9836. END_TEST
  9837. START_TEST(test_nsalloc_realloc_long_context_5) {
  9838. const char *text
  9839. = "<!DOCTYPE doc SYSTEM 'foo' [\n"
  9840. " <!ENTITY en SYSTEM 'bar'>\n"
  9841. "]>\n"
  9842. "<doc xmlns='http://example.org/"
  9843. /* 64 characters per line */
  9844. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9845. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9846. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9847. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9848. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9849. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9850. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9851. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9852. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9853. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9854. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9855. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9856. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9857. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9858. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9859. "ABC"
  9860. "'>\n"
  9861. "&en;"
  9862. "</doc>";
  9863. context_realloc_test(text);
  9864. }
  9865. END_TEST
  9866. START_TEST(test_nsalloc_realloc_long_context_6) {
  9867. const char *text
  9868. = "<!DOCTYPE doc SYSTEM 'foo' [\n"
  9869. " <!ENTITY en SYSTEM 'bar'>\n"
  9870. "]>\n"
  9871. "<doc xmlns='http://example.org/"
  9872. /* 64 characters per line */
  9873. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9874. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9875. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9876. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9877. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9878. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9879. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9880. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9881. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9882. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9883. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9884. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9885. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9886. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9887. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNOP"
  9888. "'>\n"
  9889. "&en;"
  9890. "</doc>";
  9891. context_realloc_test(text);
  9892. }
  9893. END_TEST
  9894. START_TEST(test_nsalloc_realloc_long_context_7) {
  9895. const char *text
  9896. = "<!DOCTYPE doc SYSTEM 'foo' [\n"
  9897. " <!ENTITY en SYSTEM 'bar'>\n"
  9898. "]>\n"
  9899. "<doc xmlns='http://example.org/"
  9900. /* 64 characters per line */
  9901. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9902. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9903. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9904. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9905. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9906. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9907. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9908. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9909. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9910. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9911. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9912. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9913. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9914. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9915. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  9916. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLM"
  9917. "'>\n"
  9918. "&en;"
  9919. "</doc>";
  9920. context_realloc_test(text);
  9921. }
  9922. END_TEST
  9923. START_TEST(test_nsalloc_realloc_long_ge_name) {
  9924. const char *text
  9925. = "<!DOCTYPE doc SYSTEM 'foo' [\n"
  9926. " <!ENTITY "
  9927. /* 64 characters per line */
  9928. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9929. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9930. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9931. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9932. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9933. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9934. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9935. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9936. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9937. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9938. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9939. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9940. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9941. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9942. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9943. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9944. " SYSTEM 'bar'>\n"
  9945. "]>\n"
  9946. "<doc xmlns='http://example.org/baz'>\n"
  9947. "&"
  9948. /* 64 characters per line */
  9949. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9950. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9951. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9952. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9953. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9954. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9955. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9956. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9957. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9958. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9959. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9960. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9961. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9962. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9963. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9964. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9965. ";"
  9966. "</doc>";
  9967. ExtOption options[] = {
  9968. {XCS("foo"), "<!ELEMENT el EMPTY>"}, {XCS("bar"), "<el/>"}, {NULL, NULL}};
  9969. int i;
  9970. const int max_realloc_count = 10;
  9971. for (i = 0; i < max_realloc_count; i++) {
  9972. reallocation_count = i;
  9973. XML_SetUserData(g_parser, options);
  9974. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  9975. XML_SetExternalEntityRefHandler(g_parser, external_entity_optioner);
  9976. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  9977. != XML_STATUS_ERROR)
  9978. break;
  9979. /* See comment in test_nsalloc_xmlns() */
  9980. nsalloc_teardown();
  9981. nsalloc_setup();
  9982. }
  9983. if (i == 0)
  9984. fail("Parsing worked despite failing reallocations");
  9985. else if (i == max_realloc_count)
  9986. fail("Parsing failed even at max reallocation count");
  9987. }
  9988. END_TEST
  9989. /* Test that when a namespace is passed through the context mechanism
  9990. * to an external entity parser, the parsers handle reallocation
  9991. * failures correctly. The prefix is exactly the right length to
  9992. * provoke particular uncommon code paths.
  9993. */
  9994. START_TEST(test_nsalloc_realloc_long_context_in_dtd) {
  9995. const char *text1
  9996. = "<!DOCTYPE "
  9997. /* 64 characters per line */
  9998. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  9999. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10000. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10001. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10002. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10003. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10004. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10005. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10006. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10007. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10008. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10009. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10010. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10011. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10012. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10013. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10014. ":doc [\n"
  10015. " <!ENTITY First SYSTEM 'foo/First'>\n"
  10016. "]>\n"
  10017. "<"
  10018. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10019. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10020. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10021. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10022. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10023. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10024. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10025. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10026. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10027. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10028. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10029. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10030. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10031. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10032. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10033. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10034. ":doc xmlns:"
  10035. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10036. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10037. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10038. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10039. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10040. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10041. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10042. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10043. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10044. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10045. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10046. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10047. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10048. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10049. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10050. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10051. "='foo/Second'>&First;";
  10052. const char *text2
  10053. = "</"
  10054. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10055. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10056. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10057. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10058. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10059. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10060. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10061. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10062. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10063. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10064. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10065. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10066. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10067. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10068. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10069. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10070. ":doc>";
  10071. ExtOption options[] = {{XCS("foo/First"), "Hello world"}, {NULL, NULL}};
  10072. int i;
  10073. const int max_realloc_count = 20;
  10074. for (i = 0; i < max_realloc_count; i++) {
  10075. reallocation_count = i;
  10076. XML_SetUserData(g_parser, options);
  10077. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  10078. XML_SetExternalEntityRefHandler(g_parser, external_entity_optioner);
  10079. if (_XML_Parse_SINGLE_BYTES(g_parser, text1, (int)strlen(text1), XML_FALSE)
  10080. != XML_STATUS_ERROR
  10081. && _XML_Parse_SINGLE_BYTES(g_parser, text2, (int)strlen(text2),
  10082. XML_TRUE)
  10083. != XML_STATUS_ERROR)
  10084. break;
  10085. /* See comment in test_nsalloc_xmlns() */
  10086. nsalloc_teardown();
  10087. nsalloc_setup();
  10088. }
  10089. if (i == 0)
  10090. fail("Parsing worked despite failing reallocations");
  10091. else if (i == max_realloc_count)
  10092. fail("Parsing failed even at max reallocation count");
  10093. }
  10094. END_TEST
  10095. START_TEST(test_nsalloc_long_default_in_ext) {
  10096. const char *text
  10097. = "<!DOCTYPE doc [\n"
  10098. " <!ATTLIST e a1 CDATA '"
  10099. /* 64 characters per line */
  10100. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10101. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10102. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10103. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10104. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10105. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10106. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10107. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10108. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10109. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10110. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10111. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10112. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10113. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10114. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10115. "ABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOPABCDEFGHIJKLMNOP"
  10116. "'>\n"
  10117. " <!ENTITY x SYSTEM 'foo'>\n"
  10118. "]>\n"
  10119. "<doc>&x;</doc>";
  10120. ExtOption options[] = {{XCS("foo"), "<e/>"}, {NULL, NULL}};
  10121. int i;
  10122. const int max_alloc_count = 50;
  10123. for (i = 0; i < max_alloc_count; i++) {
  10124. allocation_count = i;
  10125. XML_SetUserData(g_parser, options);
  10126. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  10127. XML_SetExternalEntityRefHandler(g_parser, external_entity_optioner);
  10128. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  10129. != XML_STATUS_ERROR)
  10130. break;
  10131. /* See comment in test_nsalloc_xmlns() */
  10132. nsalloc_teardown();
  10133. nsalloc_setup();
  10134. }
  10135. if (i == 0)
  10136. fail("Parsing worked despite failing allocations");
  10137. else if (i == max_alloc_count)
  10138. fail("Parsing failed even at max allocation count");
  10139. }
  10140. END_TEST
  10141. START_TEST(test_nsalloc_long_systemid_in_ext) {
  10142. const char *text
  10143. = "<!DOCTYPE doc SYSTEM 'foo' [\n"
  10144. " <!ENTITY en SYSTEM '"
  10145. /* 64 characters per line */
  10146. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  10147. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  10148. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  10149. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  10150. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  10151. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  10152. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  10153. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  10154. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  10155. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  10156. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  10157. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  10158. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  10159. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  10160. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  10161. "ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"
  10162. "'>\n"
  10163. "]>\n"
  10164. "<doc>&en;</doc>";
  10165. ExtOption options[] = {
  10166. {XCS("foo"), "<!ELEMENT e EMPTY>"},
  10167. {/* clang-format off */
  10168. XCS("ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/")
  10169. XCS("ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/")
  10170. XCS("ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/")
  10171. XCS("ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/")
  10172. XCS("ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/")
  10173. XCS("ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/")
  10174. XCS("ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/")
  10175. XCS("ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/")
  10176. XCS("ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/")
  10177. XCS("ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/")
  10178. XCS("ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/")
  10179. XCS("ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/")
  10180. XCS("ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/")
  10181. XCS("ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/")
  10182. XCS("ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/")
  10183. XCS("ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/ABCDEFGHIJKLMNO/"),
  10184. /* clang-format on */
  10185. "<e/>"},
  10186. {NULL, NULL}};
  10187. int i;
  10188. const int max_alloc_count = 55;
  10189. for (i = 0; i < max_alloc_count; i++) {
  10190. allocation_count = i;
  10191. XML_SetUserData(g_parser, options);
  10192. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  10193. XML_SetExternalEntityRefHandler(g_parser, external_entity_optioner);
  10194. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  10195. != XML_STATUS_ERROR)
  10196. break;
  10197. /* See comment in test_nsalloc_xmlns() */
  10198. nsalloc_teardown();
  10199. nsalloc_setup();
  10200. }
  10201. if (i == 0)
  10202. fail("Parsing worked despite failing allocations");
  10203. else if (i == max_alloc_count)
  10204. fail("Parsing failed even at max allocation count");
  10205. }
  10206. END_TEST
  10207. /* Test the effects of allocation failure on parsing an element in a
  10208. * namespace. Based on test_nsalloc_long_context.
  10209. */
  10210. START_TEST(test_nsalloc_prefixed_element) {
  10211. const char *text = "<!DOCTYPE pfx:element SYSTEM 'foo' [\n"
  10212. " <!ATTLIST pfx:element baz ID #REQUIRED>\n"
  10213. " <!ENTITY en SYSTEM 'bar'>\n"
  10214. "]>\n"
  10215. "<pfx:element xmlns:pfx='http://example.org/' baz='2'>\n"
  10216. "&en;"
  10217. "</pfx:element>";
  10218. ExtOption options[] = {
  10219. {XCS("foo"), "<!ELEMENT e EMPTY>"}, {XCS("bar"), "<e/>"}, {NULL, NULL}};
  10220. int i;
  10221. const int max_alloc_count = 70;
  10222. for (i = 0; i < max_alloc_count; i++) {
  10223. allocation_count = i;
  10224. XML_SetUserData(g_parser, options);
  10225. XML_SetParamEntityParsing(g_parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  10226. XML_SetExternalEntityRefHandler(g_parser, external_entity_optioner);
  10227. if (_XML_Parse_SINGLE_BYTES(g_parser, text, (int)strlen(text), XML_TRUE)
  10228. != XML_STATUS_ERROR)
  10229. break;
  10230. /* See comment in test_nsalloc_xmlns() */
  10231. nsalloc_teardown();
  10232. nsalloc_setup();
  10233. }
  10234. if (i == 0)
  10235. fail("Success despite failing allocator");
  10236. else if (i == max_alloc_count)
  10237. fail("Failed even at full allocation count");
  10238. }
  10239. END_TEST
  10240. #if defined(XML_DTD)
  10241. typedef enum XML_Status (*XmlParseFunction)(XML_Parser, const char *, int, int);
  10242. struct AccountingTestCase {
  10243. const char *primaryText;
  10244. const char *firstExternalText; /* often NULL */
  10245. const char *secondExternalText; /* often NULL */
  10246. const unsigned long long expectedCountBytesIndirectExtra;
  10247. XML_Bool singleBytesWanted;
  10248. };
  10249. static int
  10250. accounting_external_entity_ref_handler(XML_Parser parser,
  10251. const XML_Char *context,
  10252. const XML_Char *base,
  10253. const XML_Char *systemId,
  10254. const XML_Char *publicId) {
  10255. UNUSED_P(context);
  10256. UNUSED_P(base);
  10257. UNUSED_P(publicId);
  10258. const struct AccountingTestCase *const testCase
  10259. = (const struct AccountingTestCase *)XML_GetUserData(parser);
  10260. const char *externalText = NULL;
  10261. if (xcstrcmp(systemId, XCS("first.ent")) == 0) {
  10262. externalText = testCase->firstExternalText;
  10263. } else if (xcstrcmp(systemId, XCS("second.ent")) == 0) {
  10264. externalText = testCase->secondExternalText;
  10265. } else {
  10266. assert(! "systemId is neither \"first.ent\" nor \"second.ent\"");
  10267. }
  10268. assert(externalText);
  10269. XML_Parser entParser = XML_ExternalEntityParserCreate(parser, context, 0);
  10270. assert(entParser);
  10271. const XmlParseFunction xmlParseFunction
  10272. = testCase->singleBytesWanted ? _XML_Parse_SINGLE_BYTES : XML_Parse;
  10273. const enum XML_Status status = xmlParseFunction(
  10274. entParser, externalText, (int)strlen(externalText), XML_TRUE);
  10275. XML_ParserFree(entParser);
  10276. return status;
  10277. }
  10278. START_TEST(test_accounting_precision) {
  10279. const XML_Bool filled_later = XML_TRUE; /* value is arbitrary */
  10280. struct AccountingTestCase cases[] = {
  10281. {"<e/>", NULL, NULL, 0, 0},
  10282. {"<e></e>", NULL, NULL, 0, 0},
  10283. /* Attributes */
  10284. {"<e k1=\"v2\" k2=\"v2\"/>", NULL, NULL, 0, filled_later},
  10285. {"<e k1=\"v2\" k2=\"v2\"></e>", NULL, NULL, 0, 0},
  10286. {"<p:e xmlns:p=\"https://domain.invalid/\" />", NULL, NULL, 0,
  10287. filled_later},
  10288. {"<e k=\"&amp;&apos;&gt;&lt;&quot;\" />", NULL, NULL,
  10289. sizeof(XML_Char) * 5 /* number of predefined entites */, filled_later},
  10290. {"<e1 xmlns='https://example.org/'>\n"
  10291. " <e2 xmlns=''/>\n"
  10292. "</e1>",
  10293. NULL, NULL, 0, filled_later},
  10294. /* Text */
  10295. {"<e>text</e>", NULL, NULL, 0, filled_later},
  10296. {"<e1><e2>text1<e3/>text2</e2></e1>", NULL, NULL, 0, filled_later},
  10297. {"<e>&amp;&apos;&gt;&lt;&quot;</e>", NULL, NULL,
  10298. sizeof(XML_Char) * 5 /* number of predefined entites */, filled_later},
  10299. {"<e>&#65;&#41;</e>", NULL, NULL, 0, filled_later},
  10300. /* Prolog */
  10301. {"<?xml version=\"1.0\"?><root/>", NULL, NULL, 0, filled_later},
  10302. /* Whitespace */
  10303. {" <e1> <e2> </e2> </e1> ", NULL, NULL, 0, filled_later},
  10304. {"<e1 ><e2 /></e1 >", NULL, NULL, 0, filled_later},
  10305. {"<e1><e2 k = \"v\"/><e3 k = 'v'/></e1>", NULL, NULL, 0, filled_later},
  10306. /* Comments */
  10307. {"<!-- Comment --><e><!-- Comment --></e>", NULL, NULL, 0, filled_later},
  10308. /* Processing instructions */
  10309. {"<?xml-stylesheet type=\"text/xsl\" href=\"https://domain.invalid/\" media=\"all\"?><e/>",
  10310. NULL, NULL, 0, filled_later},
  10311. {"<?pi0?><?pi1 ?><?pi2 ?><!DOCTYPE r SYSTEM 'first.ent'><r/>",
  10312. "<?pi3?><!ENTITY % e1 SYSTEM 'second.ent'><?pi4?>%e1;<?pi5?>", "<?pi6?>",
  10313. 0, filled_later},
  10314. /* CDATA */
  10315. {"<e><![CDATA[one two three]]></e>", NULL, NULL, 0, filled_later},
  10316. /* The following is the essence of this OSS-Fuzz finding:
  10317. https://bugs.chromium.org/p/oss-fuzz/issues/detail?id=34302
  10318. https://oss-fuzz.com/testcase-detail/4860575394955264
  10319. */
  10320. {"<!DOCTYPE r [\n"
  10321. "<!ENTITY e \"111<![CDATA[2 <= 2]]>333\">\n"
  10322. "]>\n"
  10323. "<r>&e;</r>\n",
  10324. NULL, NULL, sizeof(XML_Char) * strlen("111<![CDATA[2 <= 2]]>333"),
  10325. filled_later},
  10326. /* Conditional sections */
  10327. {"<!DOCTYPE r [\n"
  10328. "<!ENTITY % draft 'INCLUDE'>\n"
  10329. "<!ENTITY % final 'IGNORE'>\n"
  10330. "<!ENTITY % import SYSTEM \"first.ent\">\n"
  10331. "%import;\n"
  10332. "]>\n"
  10333. "<r/>\n",
  10334. "<![%draft;[<!--1-->]]>\n"
  10335. "<![%final;[<!--22-->]]>",
  10336. NULL, sizeof(XML_Char) * (strlen("INCLUDE") + strlen("IGNORE")),
  10337. filled_later},
  10338. /* General entities */
  10339. {"<!DOCTYPE root [\n"
  10340. "<!ENTITY nine \"123456789\">\n"
  10341. "]>\n"
  10342. "<root>&nine;</root>",
  10343. NULL, NULL, sizeof(XML_Char) * strlen("123456789"), filled_later},
  10344. {"<!DOCTYPE root [\n"
  10345. "<!ENTITY nine \"123456789\">\n"
  10346. "]>\n"
  10347. "<root k1=\"&nine;\"/>",
  10348. NULL, NULL, sizeof(XML_Char) * strlen("123456789"), filled_later},
  10349. {"<!DOCTYPE root [\n"
  10350. "<!ENTITY nine \"123456789\">\n"
  10351. "<!ENTITY nine2 \"&nine;&nine;\">\n"
  10352. "]>\n"
  10353. "<root>&nine2;&nine2;&nine2;</root>",
  10354. NULL, NULL,
  10355. sizeof(XML_Char) * 3 /* calls to &nine2; */ * 2 /* calls to &nine; */
  10356. * (strlen("&nine;") + strlen("123456789")),
  10357. filled_later},
  10358. {"<!DOCTYPE r [\n"
  10359. " <!ENTITY five SYSTEM 'first.ent'>\n"
  10360. "]>\n"
  10361. "<r>&five;</r>",
  10362. "12345", NULL, 0, filled_later},
  10363. /* Parameter entities */
  10364. {"<!DOCTYPE r [\n"
  10365. "<!ENTITY % comment \"<!---->\">\n"
  10366. "%comment;\n"
  10367. "]>\n"
  10368. "<r/>",
  10369. NULL, NULL, sizeof(XML_Char) * strlen("<!---->"), filled_later},
  10370. {"<!DOCTYPE r [\n"
  10371. "<!ENTITY % ninedef \"&#60;!ENTITY nine &#34;123456789&#34;&#62;\">\n"
  10372. "%ninedef;\n"
  10373. "]>\n"
  10374. "<r>&nine;</r>",
  10375. NULL, NULL,
  10376. sizeof(XML_Char)
  10377. * (strlen("<!ENTITY nine \"123456789\">") + strlen("123456789")),
  10378. filled_later},
  10379. {"<!DOCTYPE r [\n"
  10380. "<!ENTITY % comment \"<!--1-->\">\n"
  10381. "<!ENTITY % comment2 \"&#37;comment;<!--22-->&#37;comment;\">\n"
  10382. "%comment2;\n"
  10383. "]>\n"
  10384. "<r/>\n",
  10385. NULL, NULL,
  10386. sizeof(XML_Char)
  10387. * (strlen("%comment;<!--22-->%comment;") + 2 * strlen("<!--1-->")),
  10388. filled_later},
  10389. {"<!DOCTYPE r [\n"
  10390. " <!ENTITY % five \"12345\">\n"
  10391. " <!ENTITY % five2def \"&#60;!ENTITY five2 &#34;[&#37;five;][&#37;five;]]]]&#34;&#62;\">\n"
  10392. " %five2def;\n"
  10393. "]>\n"
  10394. "<r>&five2;</r>",
  10395. NULL, NULL, /* from "%five2def;": */
  10396. sizeof(XML_Char)
  10397. * (strlen("<!ENTITY five2 \"[%five;][%five;]]]]\">")
  10398. + 2 /* calls to "%five;" */ * strlen("12345")
  10399. + /* from "&five2;": */ strlen("[12345][12345]]]]")),
  10400. filled_later},
  10401. {"<!DOCTYPE r SYSTEM \"first.ent\">\n"
  10402. "<r/>",
  10403. "<!ENTITY % comment '<!--1-->'>\n"
  10404. "<!ENTITY % comment2 '<!--22-->%comment;<!--22-->%comment;<!--22-->'>\n"
  10405. "%comment2;",
  10406. NULL,
  10407. sizeof(XML_Char)
  10408. * (strlen("<!--22-->%comment;<!--22-->%comment;<!--22-->")
  10409. + 2 /* calls to "%comment;" */ * strlen("<!---->")),
  10410. filled_later},
  10411. {"<!DOCTYPE r SYSTEM 'first.ent'>\n"
  10412. "<r/>",
  10413. "<!ENTITY % e1 PUBLIC 'foo' 'second.ent'>\n"
  10414. "<!ENTITY % e2 '<!--22-->%e1;<!--22-->'>\n"
  10415. "%e2;\n",
  10416. "<!--1-->", sizeof(XML_Char) * strlen("<!--22--><!--1--><!--22-->"),
  10417. filled_later},
  10418. {
  10419. "<!DOCTYPE r SYSTEM 'first.ent'>\n"
  10420. "<r/>",
  10421. "<!ENTITY % e1 SYSTEM 'second.ent'>\n"
  10422. "<!ENTITY % e2 '%e1;'>",
  10423. "<?xml version='1.0' encoding='utf-8'?>\n"
  10424. "hello\n"
  10425. "xml" /* without trailing newline! */,
  10426. 0,
  10427. filled_later,
  10428. },
  10429. {
  10430. "<!DOCTYPE r SYSTEM 'first.ent'>\n"
  10431. "<r/>",
  10432. "<!ENTITY % e1 SYSTEM 'second.ent'>\n"
  10433. "<!ENTITY % e2 '%e1;'>",
  10434. "<?xml version='1.0' encoding='utf-8'?>\n"
  10435. "hello\n"
  10436. "xml\n" /* with trailing newline! */,
  10437. 0,
  10438. filled_later,
  10439. },
  10440. {"<!DOCTYPE doc SYSTEM 'first.ent'>\n"
  10441. "<doc></doc>\n",
  10442. "<!ELEMENT doc EMPTY>\n"
  10443. "<!ENTITY % e1 SYSTEM 'second.ent'>\n"
  10444. "<!ENTITY % e2 '%e1;'>\n"
  10445. "%e1;\n",
  10446. "\xEF\xBB\xBF<!ATTLIST doc a1 CDATA 'value'>" /* UTF-8 BOM */,
  10447. strlen("\xEF\xBB\xBF<!ATTLIST doc a1 CDATA 'value'>"), filled_later},
  10448. {"<!DOCTYPE r [\n"
  10449. " <!ENTITY five SYSTEM 'first.ent'>\n"
  10450. "]>\n"
  10451. "<r>&five;</r>",
  10452. "\xEF\xBB\xBF" /* UTF-8 BOM */, NULL, 0, filled_later},
  10453. };
  10454. const size_t countCases = sizeof(cases) / sizeof(cases[0]);
  10455. size_t u = 0;
  10456. for (; u < countCases; u++) {
  10457. size_t v = 0;
  10458. for (; v < 2; v++) {
  10459. const XML_Bool singleBytesWanted = (v == 0) ? XML_FALSE : XML_TRUE;
  10460. const unsigned long long expectedCountBytesDirect
  10461. = strlen(cases[u].primaryText);
  10462. const unsigned long long expectedCountBytesIndirect
  10463. = (cases[u].firstExternalText ? strlen(cases[u].firstExternalText)
  10464. : 0)
  10465. + (cases[u].secondExternalText ? strlen(cases[u].secondExternalText)
  10466. : 0)
  10467. + cases[u].expectedCountBytesIndirectExtra;
  10468. XML_Parser parser = XML_ParserCreate(NULL);
  10469. XML_SetParamEntityParsing(parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
  10470. if (cases[u].firstExternalText) {
  10471. XML_SetExternalEntityRefHandler(parser,
  10472. accounting_external_entity_ref_handler);
  10473. XML_SetUserData(parser, (void *)&cases[u]);
  10474. cases[u].singleBytesWanted = singleBytesWanted;
  10475. }
  10476. const XmlParseFunction xmlParseFunction
  10477. = singleBytesWanted ? _XML_Parse_SINGLE_BYTES : XML_Parse;
  10478. enum XML_Status status
  10479. = xmlParseFunction(parser, cases[u].primaryText,
  10480. (int)strlen(cases[u].primaryText), XML_TRUE);
  10481. if (status != XML_STATUS_OK) {
  10482. _xml_failure(parser, __FILE__, __LINE__);
  10483. }
  10484. const unsigned long long actualCountBytesDirect
  10485. = testingAccountingGetCountBytesDirect(parser);
  10486. const unsigned long long actualCountBytesIndirect
  10487. = testingAccountingGetCountBytesIndirect(parser);
  10488. XML_ParserFree(parser);
  10489. if (actualCountBytesDirect != expectedCountBytesDirect) {
  10490. fprintf(
  10491. stderr,
  10492. "Document " EXPAT_FMT_SIZE_T("") " of " EXPAT_FMT_SIZE_T("") ", %s: Expected " EXPAT_FMT_ULL(
  10493. "") " count direct bytes, got " EXPAT_FMT_ULL("") " instead.\n",
  10494. u + 1, countCases, singleBytesWanted ? "single bytes" : "chunks",
  10495. expectedCountBytesDirect, actualCountBytesDirect);
  10496. fail("Count of direct bytes is off");
  10497. }
  10498. if (actualCountBytesIndirect != expectedCountBytesIndirect) {
  10499. fprintf(
  10500. stderr,
  10501. "Document " EXPAT_FMT_SIZE_T("") " of " EXPAT_FMT_SIZE_T("") ", %s: Expected " EXPAT_FMT_ULL(
  10502. "") " count indirect bytes, got " EXPAT_FMT_ULL("") " instead.\n",
  10503. u + 1, countCases, singleBytesWanted ? "single bytes" : "chunks",
  10504. expectedCountBytesIndirect, actualCountBytesIndirect);
  10505. fail("Count of indirect bytes is off");
  10506. }
  10507. }
  10508. }
  10509. }
  10510. END_TEST
  10511. START_TEST(test_billion_laughs_attack_protection_api) {
  10512. XML_Parser parserWithoutParent = XML_ParserCreate(NULL);
  10513. XML_Parser parserWithParent
  10514. = XML_ExternalEntityParserCreate(parserWithoutParent, NULL, NULL);
  10515. if (parserWithoutParent == NULL)
  10516. fail("parserWithoutParent is NULL");
  10517. if (parserWithParent == NULL)
  10518. fail("parserWithParent is NULL");
  10519. // XML_SetBillionLaughsAttackProtectionMaximumAmplification, error cases
  10520. if (XML_SetBillionLaughsAttackProtectionMaximumAmplification(NULL, 123.0f)
  10521. == XML_TRUE)
  10522. fail("Call with NULL parser is NOT supposed to succeed");
  10523. if (XML_SetBillionLaughsAttackProtectionMaximumAmplification(parserWithParent,
  10524. 123.0f)
  10525. == XML_TRUE)
  10526. fail("Call with non-root parser is NOT supposed to succeed");
  10527. if (XML_SetBillionLaughsAttackProtectionMaximumAmplification(
  10528. parserWithoutParent, NAN)
  10529. == XML_TRUE)
  10530. fail("Call with NaN limit is NOT supposed to succeed");
  10531. if (XML_SetBillionLaughsAttackProtectionMaximumAmplification(
  10532. parserWithoutParent, -1.0f)
  10533. == XML_TRUE)
  10534. fail("Call with negative limit is NOT supposed to succeed");
  10535. if (XML_SetBillionLaughsAttackProtectionMaximumAmplification(
  10536. parserWithoutParent, 0.9f)
  10537. == XML_TRUE)
  10538. fail("Call with positive limit <1.0 is NOT supposed to succeed");
  10539. // XML_SetBillionLaughsAttackProtectionMaximumAmplification, success cases
  10540. if (XML_SetBillionLaughsAttackProtectionMaximumAmplification(
  10541. parserWithoutParent, 1.0f)
  10542. == XML_FALSE)
  10543. fail("Call with positive limit >=1.0 is supposed to succeed");
  10544. if (XML_SetBillionLaughsAttackProtectionMaximumAmplification(
  10545. parserWithoutParent, 123456.789f)
  10546. == XML_FALSE)
  10547. fail("Call with positive limit >=1.0 is supposed to succeed");
  10548. if (XML_SetBillionLaughsAttackProtectionMaximumAmplification(
  10549. parserWithoutParent, INFINITY)
  10550. == XML_FALSE)
  10551. fail("Call with positive limit >=1.0 is supposed to succeed");
  10552. // XML_SetBillionLaughsAttackProtectionActivationThreshold, error cases
  10553. if (XML_SetBillionLaughsAttackProtectionActivationThreshold(NULL, 123)
  10554. == XML_TRUE)
  10555. fail("Call with NULL parser is NOT supposed to succeed");
  10556. if (XML_SetBillionLaughsAttackProtectionActivationThreshold(parserWithParent,
  10557. 123)
  10558. == XML_TRUE)
  10559. fail("Call with non-root parser is NOT supposed to succeed");
  10560. // XML_SetBillionLaughsAttackProtectionActivationThreshold, success cases
  10561. if (XML_SetBillionLaughsAttackProtectionActivationThreshold(
  10562. parserWithoutParent, 123)
  10563. == XML_FALSE)
  10564. fail("Call with non-NULL parentless parser is supposed to succeed");
  10565. XML_ParserFree(parserWithParent);
  10566. XML_ParserFree(parserWithoutParent);
  10567. }
  10568. END_TEST
  10569. START_TEST(test_helper_unsigned_char_to_printable) {
  10570. // Smoke test
  10571. unsigned char uc = 0;
  10572. for (; uc < (unsigned char)-1; uc++) {
  10573. const char *const printable = unsignedCharToPrintable(uc);
  10574. if (printable == NULL)
  10575. fail("unsignedCharToPrintable returned NULL");
  10576. if (strlen(printable) < (size_t)1)
  10577. fail("unsignedCharToPrintable returned empty string");
  10578. }
  10579. // Two concrete samples
  10580. if (strcmp(unsignedCharToPrintable('A'), "A") != 0)
  10581. fail("unsignedCharToPrintable result mistaken");
  10582. if (strcmp(unsignedCharToPrintable('\\'), "\\\\") != 0)
  10583. fail("unsignedCharToPrintable result mistaken");
  10584. }
  10585. END_TEST
  10586. #endif // defined(XML_DTD)
  10587. static Suite *
  10588. make_suite(void) {
  10589. Suite *s = suite_create("basic");
  10590. TCase *tc_basic = tcase_create("basic tests");
  10591. TCase *tc_namespace = tcase_create("XML namespaces");
  10592. TCase *tc_misc = tcase_create("miscellaneous tests");
  10593. TCase *tc_alloc = tcase_create("allocation tests");
  10594. TCase *tc_nsalloc = tcase_create("namespace allocation tests");
  10595. #if defined(XML_DTD)
  10596. TCase *tc_accounting = tcase_create("accounting tests");
  10597. #endif
  10598. suite_add_tcase(s, tc_basic);
  10599. tcase_add_checked_fixture(tc_basic, basic_setup, basic_teardown);
  10600. tcase_add_test(tc_basic, test_nul_byte);
  10601. tcase_add_test(tc_basic, test_u0000_char);
  10602. tcase_add_test(tc_basic, test_siphash_self);
  10603. tcase_add_test(tc_basic, test_siphash_spec);
  10604. tcase_add_test(tc_basic, test_bom_utf8);
  10605. tcase_add_test(tc_basic, test_bom_utf16_be);
  10606. tcase_add_test(tc_basic, test_bom_utf16_le);
  10607. tcase_add_test(tc_basic, test_nobom_utf16_le);
  10608. tcase_add_test(tc_basic, test_illegal_utf8);
  10609. tcase_add_test(tc_basic, test_utf8_auto_align);
  10610. tcase_add_test(tc_basic, test_utf16);
  10611. tcase_add_test(tc_basic, test_utf16_le_epilog_newline);
  10612. tcase_add_test(tc_basic, test_not_utf16);
  10613. tcase_add_test(tc_basic, test_bad_encoding);
  10614. tcase_add_test(tc_basic, test_latin1_umlauts);
  10615. tcase_add_test(tc_basic, test_long_utf8_character);
  10616. tcase_add_test(tc_basic, test_long_latin1_attribute);
  10617. tcase_add_test(tc_basic, test_long_ascii_attribute);
  10618. /* Regression test for SF bug #491986. */
  10619. tcase_add_test(tc_basic, test_danish_latin1);
  10620. /* Regression test for SF bug #514281. */
  10621. tcase_add_test(tc_basic, test_french_charref_hexidecimal);
  10622. tcase_add_test(tc_basic, test_french_charref_decimal);
  10623. tcase_add_test(tc_basic, test_french_latin1);
  10624. tcase_add_test(tc_basic, test_french_utf8);
  10625. tcase_add_test(tc_basic, test_utf8_false_rejection);
  10626. tcase_add_test(tc_basic, test_line_number_after_parse);
  10627. tcase_add_test(tc_basic, test_column_number_after_parse);
  10628. tcase_add_test(tc_basic, test_line_and_column_numbers_inside_handlers);
  10629. tcase_add_test(tc_basic, test_line_number_after_error);
  10630. tcase_add_test(tc_basic, test_column_number_after_error);
  10631. tcase_add_test(tc_basic, test_really_long_lines);
  10632. tcase_add_test(tc_basic, test_really_long_encoded_lines);
  10633. tcase_add_test(tc_basic, test_end_element_events);
  10634. tcase_add_test(tc_basic, test_attr_whitespace_normalization);
  10635. tcase_add_test(tc_basic, test_xmldecl_misplaced);
  10636. tcase_add_test(tc_basic, test_xmldecl_invalid);
  10637. tcase_add_test(tc_basic, test_xmldecl_missing_attr);
  10638. tcase_add_test(tc_basic, test_xmldecl_missing_value);
  10639. tcase_add_test(tc_basic, test_unknown_encoding_internal_entity);
  10640. tcase_add_test(tc_basic, test_unrecognised_encoding_internal_entity);
  10641. tcase_add_test(tc_basic, test_wfc_undeclared_entity_unread_external_subset);
  10642. tcase_add_test(tc_basic, test_wfc_undeclared_entity_no_external_subset);
  10643. tcase_add_test(tc_basic, test_wfc_undeclared_entity_standalone);
  10644. tcase_add_test(tc_basic, test_wfc_undeclared_entity_with_external_subset);
  10645. tcase_add_test(tc_basic, test_not_standalone_handler_reject);
  10646. tcase_add_test(tc_basic, test_not_standalone_handler_accept);
  10647. tcase_add_test(tc_basic,
  10648. test_wfc_undeclared_entity_with_external_subset_standalone);
  10649. tcase_add_test(tc_basic, test_entity_with_external_subset_unless_standalone);
  10650. tcase_add_test(tc_basic, test_wfc_no_recursive_entity_refs);
  10651. tcase_add_test__ifdef_xml_dtd(tc_basic, test_ext_entity_set_encoding);
  10652. tcase_add_test__ifdef_xml_dtd(tc_basic, test_ext_entity_no_handler);
  10653. tcase_add_test__ifdef_xml_dtd(tc_basic, test_ext_entity_set_bom);
  10654. tcase_add_test__ifdef_xml_dtd(tc_basic, test_ext_entity_bad_encoding);
  10655. tcase_add_test__ifdef_xml_dtd(tc_basic, test_ext_entity_bad_encoding_2);
  10656. tcase_add_test__ifdef_xml_dtd(tc_basic, test_ext_entity_invalid_parse);
  10657. tcase_add_test__ifdef_xml_dtd(tc_basic,
  10658. test_ext_entity_invalid_suspended_parse);
  10659. tcase_add_test(tc_basic, test_dtd_default_handling);
  10660. tcase_add_test(tc_basic, test_dtd_attr_handling);
  10661. tcase_add_test(tc_basic, test_empty_ns_without_namespaces);
  10662. tcase_add_test(tc_basic, test_ns_in_attribute_default_without_namespaces);
  10663. tcase_add_test(tc_basic, test_stop_parser_between_char_data_calls);
  10664. tcase_add_test(tc_basic, test_suspend_parser_between_char_data_calls);
  10665. tcase_add_test(tc_basic, test_repeated_stop_parser_between_char_data_calls);
  10666. tcase_add_test(tc_basic, test_good_cdata_ascii);
  10667. tcase_add_test(tc_basic, test_good_cdata_utf16);
  10668. tcase_add_test(tc_basic, test_good_cdata_utf16_le);
  10669. tcase_add_test(tc_basic, test_long_cdata_utf16);
  10670. tcase_add_test(tc_basic, test_multichar_cdata_utf16);
  10671. tcase_add_test(tc_basic, test_utf16_bad_surrogate_pair);
  10672. tcase_add_test(tc_basic, test_bad_cdata);
  10673. tcase_add_test(tc_basic, test_bad_cdata_utf16);
  10674. tcase_add_test(tc_basic, test_stop_parser_between_cdata_calls);
  10675. tcase_add_test(tc_basic, test_suspend_parser_between_cdata_calls);
  10676. tcase_add_test(tc_basic, test_memory_allocation);
  10677. tcase_add_test(tc_basic, test_default_current);
  10678. tcase_add_test(tc_basic, test_dtd_elements);
  10679. tcase_add_test__ifdef_xml_dtd(tc_basic, test_set_foreign_dtd);
  10680. tcase_add_test__ifdef_xml_dtd(tc_basic, test_foreign_dtd_not_standalone);
  10681. tcase_add_test__ifdef_xml_dtd(tc_basic, test_invalid_foreign_dtd);
  10682. tcase_add_test__ifdef_xml_dtd(tc_basic, test_foreign_dtd_with_doctype);
  10683. tcase_add_test__ifdef_xml_dtd(tc_basic,
  10684. test_foreign_dtd_without_external_subset);
  10685. tcase_add_test__ifdef_xml_dtd(tc_basic, test_empty_foreign_dtd);
  10686. tcase_add_test(tc_basic, test_set_base);
  10687. tcase_add_test(tc_basic, test_attributes);
  10688. tcase_add_test(tc_basic, test_reset_in_entity);
  10689. tcase_add_test(tc_basic, test_resume_invalid_parse);
  10690. tcase_add_test(tc_basic, test_resume_resuspended);
  10691. tcase_add_test(tc_basic, test_cdata_default);
  10692. tcase_add_test(tc_basic, test_subordinate_reset);
  10693. tcase_add_test(tc_basic, test_subordinate_suspend);
  10694. tcase_add_test(tc_basic, test_subordinate_xdecl_suspend);
  10695. tcase_add_test(tc_basic, test_subordinate_xdecl_abort);
  10696. tcase_add_test(tc_basic, test_explicit_encoding);
  10697. tcase_add_test(tc_basic, test_trailing_cr);
  10698. tcase_add_test(tc_basic, test_ext_entity_trailing_cr);
  10699. tcase_add_test(tc_basic, test_trailing_rsqb);
  10700. tcase_add_test(tc_basic, test_ext_entity_trailing_rsqb);
  10701. tcase_add_test(tc_basic, test_ext_entity_good_cdata);
  10702. tcase_add_test__ifdef_xml_dtd(tc_basic, test_user_parameters);
  10703. tcase_add_test__ifdef_xml_dtd(tc_basic, test_ext_entity_ref_parameter);
  10704. tcase_add_test(tc_basic, test_empty_parse);
  10705. tcase_add_test(tc_basic, test_get_buffer_1);
  10706. tcase_add_test(tc_basic, test_get_buffer_2);
  10707. tcase_add_test(tc_basic, test_byte_info_at_end);
  10708. tcase_add_test(tc_basic, test_byte_info_at_error);
  10709. tcase_add_test(tc_basic, test_byte_info_at_cdata);
  10710. tcase_add_test(tc_basic, test_predefined_entities);
  10711. tcase_add_test__ifdef_xml_dtd(tc_basic, test_invalid_tag_in_dtd);
  10712. tcase_add_test(tc_basic, test_not_predefined_entities);
  10713. tcase_add_test__ifdef_xml_dtd(tc_basic, test_ignore_section);
  10714. tcase_add_test__ifdef_xml_dtd(tc_basic, test_ignore_section_utf16);
  10715. tcase_add_test__ifdef_xml_dtd(tc_basic, test_ignore_section_utf16_be);
  10716. tcase_add_test__ifdef_xml_dtd(tc_basic, test_bad_ignore_section);
  10717. tcase_add_test__ifdef_xml_dtd(tc_basic, test_external_entity_values);
  10718. tcase_add_test__ifdef_xml_dtd(tc_basic, test_ext_entity_not_standalone);
  10719. tcase_add_test__ifdef_xml_dtd(tc_basic, test_ext_entity_value_abort);
  10720. tcase_add_test(tc_basic, test_bad_public_doctype);
  10721. tcase_add_test(tc_basic, test_attribute_enum_value);
  10722. tcase_add_test(tc_basic, test_predefined_entity_redefinition);
  10723. tcase_add_test__ifdef_xml_dtd(tc_basic, test_dtd_stop_processing);
  10724. tcase_add_test(tc_basic, test_public_notation_no_sysid);
  10725. tcase_add_test(tc_basic, test_nested_groups);
  10726. tcase_add_test(tc_basic, test_group_choice);
  10727. tcase_add_test(tc_basic, test_standalone_parameter_entity);
  10728. tcase_add_test__ifdef_xml_dtd(tc_basic, test_skipped_parameter_entity);
  10729. tcase_add_test__ifdef_xml_dtd(tc_basic,
  10730. test_recursive_external_parameter_entity);
  10731. tcase_add_test(tc_basic, test_undefined_ext_entity_in_external_dtd);
  10732. tcase_add_test(tc_basic, test_suspend_xdecl);
  10733. tcase_add_test(tc_basic, test_abort_epilog);
  10734. tcase_add_test(tc_basic, test_abort_epilog_2);
  10735. tcase_add_test(tc_basic, test_suspend_epilog);
  10736. tcase_add_test(tc_basic, test_suspend_in_sole_empty_tag);
  10737. tcase_add_test(tc_basic, test_unfinished_epilog);
  10738. tcase_add_test(tc_basic, test_partial_char_in_epilog);
  10739. tcase_add_test(tc_basic, test_hash_collision);
  10740. tcase_add_test__ifdef_xml_dtd(tc_basic, test_suspend_resume_internal_entity);
  10741. tcase_add_test__ifdef_xml_dtd(tc_basic, test_resume_entity_with_syntax_error);
  10742. tcase_add_test__ifdef_xml_dtd(tc_basic, test_suspend_resume_parameter_entity);
  10743. tcase_add_test(tc_basic, test_restart_on_error);
  10744. tcase_add_test(tc_basic, test_reject_lt_in_attribute_value);
  10745. tcase_add_test(tc_basic, test_reject_unfinished_param_in_att_value);
  10746. tcase_add_test(tc_basic, test_trailing_cr_in_att_value);
  10747. tcase_add_test(tc_basic, test_standalone_internal_entity);
  10748. tcase_add_test(tc_basic, test_skipped_external_entity);
  10749. tcase_add_test(tc_basic, test_skipped_null_loaded_ext_entity);
  10750. tcase_add_test(tc_basic, test_skipped_unloaded_ext_entity);
  10751. tcase_add_test__ifdef_xml_dtd(tc_basic, test_param_entity_with_trailing_cr);
  10752. tcase_add_test(tc_basic, test_invalid_character_entity);
  10753. tcase_add_test(tc_basic, test_invalid_character_entity_2);
  10754. tcase_add_test(tc_basic, test_invalid_character_entity_3);
  10755. tcase_add_test(tc_basic, test_invalid_character_entity_4);
  10756. tcase_add_test(tc_basic, test_pi_handled_in_default);
  10757. tcase_add_test(tc_basic, test_comment_handled_in_default);
  10758. tcase_add_test(tc_basic, test_pi_yml);
  10759. tcase_add_test(tc_basic, test_pi_xnl);
  10760. tcase_add_test(tc_basic, test_pi_xmm);
  10761. tcase_add_test(tc_basic, test_utf16_pi);
  10762. tcase_add_test(tc_basic, test_utf16_be_pi);
  10763. tcase_add_test(tc_basic, test_utf16_be_comment);
  10764. tcase_add_test(tc_basic, test_utf16_le_comment);
  10765. tcase_add_test(tc_basic, test_missing_encoding_conversion_fn);
  10766. tcase_add_test(tc_basic, test_failing_encoding_conversion_fn);
  10767. tcase_add_test(tc_basic, test_unknown_encoding_success);
  10768. tcase_add_test(tc_basic, test_unknown_encoding_bad_name);
  10769. tcase_add_test(tc_basic, test_unknown_encoding_bad_name_2);
  10770. tcase_add_test(tc_basic, test_unknown_encoding_long_name_1);
  10771. tcase_add_test(tc_basic, test_unknown_encoding_long_name_2);
  10772. tcase_add_test(tc_basic, test_invalid_unknown_encoding);
  10773. tcase_add_test(tc_basic, test_unknown_ascii_encoding_ok);
  10774. tcase_add_test(tc_basic, test_unknown_ascii_encoding_fail);
  10775. tcase_add_test(tc_basic, test_unknown_encoding_invalid_length);
  10776. tcase_add_test(tc_basic, test_unknown_encoding_invalid_topbit);
  10777. tcase_add_test(tc_basic, test_unknown_encoding_invalid_surrogate);
  10778. tcase_add_test(tc_basic, test_unknown_encoding_invalid_high);
  10779. tcase_add_test(tc_basic, test_unknown_encoding_invalid_attr_value);
  10780. tcase_add_test(tc_basic, test_ext_entity_latin1_utf16le_bom);
  10781. tcase_add_test(tc_basic, test_ext_entity_latin1_utf16be_bom);
  10782. tcase_add_test(tc_basic, test_ext_entity_latin1_utf16le_bom2);
  10783. tcase_add_test(tc_basic, test_ext_entity_latin1_utf16be_bom2);
  10784. tcase_add_test(tc_basic, test_ext_entity_utf16_be);
  10785. tcase_add_test(tc_basic, test_ext_entity_utf16_le);
  10786. tcase_add_test(tc_basic, test_ext_entity_utf16_unknown);
  10787. tcase_add_test(tc_basic, test_ext_entity_utf8_non_bom);
  10788. tcase_add_test(tc_basic, test_utf8_in_cdata_section);
  10789. tcase_add_test(tc_basic, test_utf8_in_cdata_section_2);
  10790. tcase_add_test(tc_basic, test_trailing_spaces_in_elements);
  10791. tcase_add_test(tc_basic, test_utf16_attribute);
  10792. tcase_add_test(tc_basic, test_utf16_second_attr);
  10793. tcase_add_test(tc_basic, test_attr_after_solidus);
  10794. tcase_add_test__ifdef_xml_dtd(tc_basic, test_utf16_pe);
  10795. tcase_add_test(tc_basic, test_bad_attr_desc_keyword);
  10796. tcase_add_test(tc_basic, test_bad_attr_desc_keyword_utf16);
  10797. tcase_add_test(tc_basic, test_bad_doctype);
  10798. tcase_add_test(tc_basic, test_bad_doctype_utf16);
  10799. tcase_add_test(tc_basic, test_bad_doctype_plus);
  10800. tcase_add_test(tc_basic, test_bad_doctype_star);
  10801. tcase_add_test(tc_basic, test_bad_doctype_query);
  10802. tcase_add_test__ifdef_xml_dtd(tc_basic, test_unknown_encoding_bad_ignore);
  10803. tcase_add_test(tc_basic, test_entity_in_utf16_be_attr);
  10804. tcase_add_test(tc_basic, test_entity_in_utf16_le_attr);
  10805. tcase_add_test__ifdef_xml_dtd(tc_basic, test_entity_public_utf16_be);
  10806. tcase_add_test__ifdef_xml_dtd(tc_basic, test_entity_public_utf16_le);
  10807. tcase_add_test(tc_basic, test_short_doctype);
  10808. tcase_add_test(tc_basic, test_short_doctype_2);
  10809. tcase_add_test(tc_basic, test_short_doctype_3);
  10810. tcase_add_test(tc_basic, test_long_doctype);
  10811. tcase_add_test(tc_basic, test_bad_entity);
  10812. tcase_add_test(tc_basic, test_bad_entity_2);
  10813. tcase_add_test(tc_basic, test_bad_entity_3);
  10814. tcase_add_test(tc_basic, test_bad_entity_4);
  10815. tcase_add_test(tc_basic, test_bad_notation);
  10816. tcase_add_test(tc_basic, test_default_doctype_handler);
  10817. tcase_add_test(tc_basic, test_empty_element_abort);
  10818. suite_add_tcase(s, tc_namespace);
  10819. tcase_add_checked_fixture(tc_namespace, namespace_setup, namespace_teardown);
  10820. tcase_add_test(tc_namespace, test_return_ns_triplet);
  10821. tcase_add_test(tc_namespace, test_ns_tagname_overwrite);
  10822. tcase_add_test(tc_namespace, test_ns_tagname_overwrite_triplet);
  10823. tcase_add_test(tc_namespace, test_start_ns_clears_start_element);
  10824. tcase_add_test__ifdef_xml_dtd(tc_namespace,
  10825. test_default_ns_from_ext_subset_and_ext_ge);
  10826. tcase_add_test(tc_namespace, test_ns_prefix_with_empty_uri_1);
  10827. tcase_add_test(tc_namespace, test_ns_prefix_with_empty_uri_2);
  10828. tcase_add_test(tc_namespace, test_ns_prefix_with_empty_uri_3);
  10829. tcase_add_test(tc_namespace, test_ns_prefix_with_empty_uri_4);
  10830. tcase_add_test(tc_namespace, test_ns_unbound_prefix);
  10831. tcase_add_test(tc_namespace, test_ns_default_with_empty_uri);
  10832. tcase_add_test(tc_namespace, test_ns_duplicate_attrs_diff_prefixes);
  10833. tcase_add_test(tc_namespace, test_ns_duplicate_hashes);
  10834. tcase_add_test(tc_namespace, test_ns_unbound_prefix_on_attribute);
  10835. tcase_add_test(tc_namespace, test_ns_unbound_prefix_on_element);
  10836. tcase_add_test(tc_namespace, test_ns_parser_reset);
  10837. tcase_add_test(tc_namespace, test_ns_long_element);
  10838. tcase_add_test(tc_namespace, test_ns_mixed_prefix_atts);
  10839. tcase_add_test(tc_namespace, test_ns_extend_uri_buffer);
  10840. tcase_add_test(tc_namespace, test_ns_reserved_attributes);
  10841. tcase_add_test(tc_namespace, test_ns_reserved_attributes_2);
  10842. tcase_add_test(tc_namespace, test_ns_extremely_long_prefix);
  10843. tcase_add_test(tc_namespace, test_ns_unknown_encoding_success);
  10844. tcase_add_test(tc_namespace, test_ns_double_colon);
  10845. tcase_add_test(tc_namespace, test_ns_double_colon_element);
  10846. tcase_add_test(tc_namespace, test_ns_bad_attr_leafname);
  10847. tcase_add_test(tc_namespace, test_ns_bad_element_leafname);
  10848. tcase_add_test(tc_namespace, test_ns_utf16_leafname);
  10849. tcase_add_test(tc_namespace, test_ns_utf16_element_leafname);
  10850. tcase_add_test(tc_namespace, test_ns_utf16_doctype);
  10851. tcase_add_test(tc_namespace, test_ns_invalid_doctype);
  10852. tcase_add_test(tc_namespace, test_ns_double_colon_doctype);
  10853. suite_add_tcase(s, tc_misc);
  10854. tcase_add_checked_fixture(tc_misc, NULL, basic_teardown);
  10855. tcase_add_test(tc_misc, test_misc_alloc_create_parser);
  10856. tcase_add_test(tc_misc, test_misc_alloc_create_parser_with_encoding);
  10857. tcase_add_test(tc_misc, test_misc_null_parser);
  10858. tcase_add_test(tc_misc, test_misc_error_string);
  10859. tcase_add_test(tc_misc, test_misc_version);
  10860. tcase_add_test(tc_misc, test_misc_features);
  10861. tcase_add_test(tc_misc, test_misc_attribute_leak);
  10862. tcase_add_test(tc_misc, test_misc_utf16le);
  10863. tcase_add_test(tc_misc, test_misc_stop_during_end_handler_issue_240_1);
  10864. tcase_add_test(tc_misc, test_misc_stop_during_end_handler_issue_240_2);
  10865. tcase_add_test__ifdef_xml_dtd(
  10866. tc_misc, test_misc_deny_internal_entity_closing_doctype_issue_317);
  10867. suite_add_tcase(s, tc_alloc);
  10868. tcase_add_checked_fixture(tc_alloc, alloc_setup, alloc_teardown);
  10869. tcase_add_test(tc_alloc, test_alloc_parse_xdecl);
  10870. tcase_add_test(tc_alloc, test_alloc_parse_xdecl_2);
  10871. tcase_add_test(tc_alloc, test_alloc_parse_pi);
  10872. tcase_add_test(tc_alloc, test_alloc_parse_pi_2);
  10873. tcase_add_test(tc_alloc, test_alloc_parse_pi_3);
  10874. tcase_add_test(tc_alloc, test_alloc_parse_comment);
  10875. tcase_add_test(tc_alloc, test_alloc_parse_comment_2);
  10876. tcase_add_test__ifdef_xml_dtd(tc_alloc, test_alloc_create_external_parser);
  10877. tcase_add_test__ifdef_xml_dtd(tc_alloc, test_alloc_run_external_parser);
  10878. tcase_add_test__ifdef_xml_dtd(tc_alloc, test_alloc_dtd_copy_default_atts);
  10879. tcase_add_test__ifdef_xml_dtd(tc_alloc, test_alloc_external_entity);
  10880. tcase_add_test__ifdef_xml_dtd(tc_alloc, test_alloc_ext_entity_set_encoding);
  10881. tcase_add_test__ifdef_xml_dtd(tc_alloc, test_alloc_internal_entity);
  10882. tcase_add_test__ifdef_xml_dtd(tc_alloc, test_alloc_dtd_default_handling);
  10883. tcase_add_test(tc_alloc, test_alloc_explicit_encoding);
  10884. tcase_add_test(tc_alloc, test_alloc_set_base);
  10885. tcase_add_test(tc_alloc, test_alloc_realloc_buffer);
  10886. tcase_add_test(tc_alloc, test_alloc_ext_entity_realloc_buffer);
  10887. tcase_add_test(tc_alloc, test_alloc_realloc_many_attributes);
  10888. tcase_add_test__ifdef_xml_dtd(tc_alloc, test_alloc_public_entity_value);
  10889. tcase_add_test__ifdef_xml_dtd(tc_alloc,
  10890. test_alloc_realloc_subst_public_entity_value);
  10891. tcase_add_test(tc_alloc, test_alloc_parse_public_doctype);
  10892. tcase_add_test(tc_alloc, test_alloc_parse_public_doctype_long_name);
  10893. tcase_add_test__ifdef_xml_dtd(tc_alloc, test_alloc_set_foreign_dtd);
  10894. tcase_add_test__ifdef_xml_dtd(tc_alloc, test_alloc_attribute_enum_value);
  10895. tcase_add_test__ifdef_xml_dtd(tc_alloc,
  10896. test_alloc_realloc_attribute_enum_value);
  10897. tcase_add_test__ifdef_xml_dtd(tc_alloc, test_alloc_realloc_implied_attribute);
  10898. tcase_add_test__ifdef_xml_dtd(tc_alloc, test_alloc_realloc_default_attribute);
  10899. tcase_add_test(tc_alloc, test_alloc_notation);
  10900. tcase_add_test(tc_alloc, test_alloc_public_notation);
  10901. tcase_add_test(tc_alloc, test_alloc_system_notation);
  10902. tcase_add_test__ifdef_xml_dtd(tc_alloc, test_alloc_nested_groups);
  10903. tcase_add_test__ifdef_xml_dtd(tc_alloc, test_alloc_realloc_nested_groups);
  10904. tcase_add_test(tc_alloc, test_alloc_large_group);
  10905. tcase_add_test__ifdef_xml_dtd(tc_alloc, test_alloc_realloc_group_choice);
  10906. tcase_add_test(tc_alloc, test_alloc_pi_in_epilog);
  10907. tcase_add_test(tc_alloc, test_alloc_comment_in_epilog);
  10908. tcase_add_test__ifdef_xml_dtd(tc_alloc,
  10909. test_alloc_realloc_long_attribute_value);
  10910. tcase_add_test(tc_alloc, test_alloc_attribute_whitespace);
  10911. tcase_add_test(tc_alloc, test_alloc_attribute_predefined_entity);
  10912. tcase_add_test(tc_alloc, test_alloc_long_attr_default_with_char_ref);
  10913. tcase_add_test(tc_alloc, test_alloc_long_attr_value);
  10914. tcase_add_test__ifdef_xml_dtd(tc_alloc, test_alloc_nested_entities);
  10915. tcase_add_test__ifdef_xml_dtd(tc_alloc,
  10916. test_alloc_realloc_param_entity_newline);
  10917. tcase_add_test__ifdef_xml_dtd(tc_alloc, test_alloc_realloc_ce_extends_pe);
  10918. tcase_add_test__ifdef_xml_dtd(tc_alloc, test_alloc_realloc_attributes);
  10919. tcase_add_test(tc_alloc, test_alloc_long_doc_name);
  10920. tcase_add_test(tc_alloc, test_alloc_long_base);
  10921. tcase_add_test(tc_alloc, test_alloc_long_public_id);
  10922. tcase_add_test(tc_alloc, test_alloc_long_entity_value);
  10923. tcase_add_test(tc_alloc, test_alloc_long_notation);
  10924. suite_add_tcase(s, tc_nsalloc);
  10925. tcase_add_checked_fixture(tc_nsalloc, nsalloc_setup, nsalloc_teardown);
  10926. tcase_add_test(tc_nsalloc, test_nsalloc_xmlns);
  10927. tcase_add_test(tc_nsalloc, test_nsalloc_parse_buffer);
  10928. tcase_add_test(tc_nsalloc, test_nsalloc_long_prefix);
  10929. tcase_add_test(tc_nsalloc, test_nsalloc_long_uri);
  10930. tcase_add_test(tc_nsalloc, test_nsalloc_long_attr);
  10931. tcase_add_test(tc_nsalloc, test_nsalloc_long_attr_prefix);
  10932. tcase_add_test(tc_nsalloc, test_nsalloc_realloc_attributes);
  10933. tcase_add_test(tc_nsalloc, test_nsalloc_long_element);
  10934. tcase_add_test(tc_nsalloc, test_nsalloc_realloc_binding_uri);
  10935. tcase_add_test(tc_nsalloc, test_nsalloc_realloc_long_prefix);
  10936. tcase_add_test(tc_nsalloc, test_nsalloc_realloc_longer_prefix);
  10937. tcase_add_test(tc_nsalloc, test_nsalloc_long_namespace);
  10938. tcase_add_test(tc_nsalloc, test_nsalloc_less_long_namespace);
  10939. tcase_add_test(tc_nsalloc, test_nsalloc_long_context);
  10940. tcase_add_test(tc_nsalloc, test_nsalloc_realloc_long_context);
  10941. tcase_add_test(tc_nsalloc, test_nsalloc_realloc_long_context_2);
  10942. tcase_add_test(tc_nsalloc, test_nsalloc_realloc_long_context_3);
  10943. tcase_add_test(tc_nsalloc, test_nsalloc_realloc_long_context_4);
  10944. tcase_add_test(tc_nsalloc, test_nsalloc_realloc_long_context_5);
  10945. tcase_add_test(tc_nsalloc, test_nsalloc_realloc_long_context_6);
  10946. tcase_add_test(tc_nsalloc, test_nsalloc_realloc_long_context_7);
  10947. tcase_add_test(tc_nsalloc, test_nsalloc_realloc_long_ge_name);
  10948. tcase_add_test(tc_nsalloc, test_nsalloc_realloc_long_context_in_dtd);
  10949. tcase_add_test(tc_nsalloc, test_nsalloc_long_default_in_ext);
  10950. tcase_add_test(tc_nsalloc, test_nsalloc_long_systemid_in_ext);
  10951. tcase_add_test(tc_nsalloc, test_nsalloc_prefixed_element);
  10952. #if defined(XML_DTD)
  10953. suite_add_tcase(s, tc_accounting);
  10954. tcase_add_test(tc_accounting, test_accounting_precision);
  10955. tcase_add_test(tc_accounting, test_billion_laughs_attack_protection_api);
  10956. tcase_add_test(tc_accounting, test_helper_unsigned_char_to_printable);
  10957. #endif
  10958. return s;
  10959. }
  10960. int
  10961. main(int argc, char *argv[]) {
  10962. int i, nf;
  10963. int verbosity = CK_NORMAL;
  10964. Suite *s = make_suite();
  10965. SRunner *sr = srunner_create(s);
  10966. /* run the tests for internal helper functions */
  10967. testhelper_is_whitespace_normalized();
  10968. for (i = 1; i < argc; ++i) {
  10969. char *opt = argv[i];
  10970. if (strcmp(opt, "-v") == 0 || strcmp(opt, "--verbose") == 0)
  10971. verbosity = CK_VERBOSE;
  10972. else if (strcmp(opt, "-q") == 0 || strcmp(opt, "--quiet") == 0)
  10973. verbosity = CK_SILENT;
  10974. else {
  10975. fprintf(stderr, "runtests: unknown option '%s'\n", opt);
  10976. return 2;
  10977. }
  10978. }
  10979. if (verbosity != CK_SILENT)
  10980. printf("Expat version: %" XML_FMT_STR "\n", XML_ExpatVersion());
  10981. srunner_run_all(sr, verbosity);
  10982. nf = srunner_ntests_failed(sr);
  10983. srunner_free(sr);
  10984. return (nf == 0) ? EXIT_SUCCESS : EXIT_FAILURE;
  10985. }