| 1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126 |
- /*
- __ __ _
- ___\ \/ /_ __ __ _| |_
- / _ \\ /| '_ \ / _` | __|
- | __// \| |_) | (_| | |_
- \___/_/\_\ .__/ \__,_|\__|
- |_| XML parser
- Copyright (c) 1997-2000 Thai Open Source Software Center Ltd
- Copyright (c) 2000-2017 Expat development team
- Licensed under the MIT license:
- Permission is hereby granted, free of charge, to any person obtaining
- a copy of this software and associated documentation files (the
- "Software"), to deal in the Software without restriction, including
- without limitation the rights to use, copy, modify, merge, publish,
- distribute, sublicense, and/or sell copies of the Software, and to permit
- persons to whom the Software is furnished to do so, subject to the
- following conditions:
- The above copyright notice and this permission notice shall be included
- in all copies or substantial portions of the Software.
- THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
- EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
- MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN
- NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,
- DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
- OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
- USE OR OTHER DEALINGS IN THE SOFTWARE.
- */
- #include <assert.h>
- #include <stdio.h>
- #include <stdlib.h>
- #include <stddef.h>
- #include <string.h>
- #include "expat.h"
- #include "codepage.h"
- #include "internal.h" /* for UNUSED_P only */
- #include "xmlfile.h"
- #include "xmltchar.h"
- #ifdef _MSC_VER
- # include <crtdbg.h>
- #endif
- #ifdef XML_UNICODE
- # include <wchar.h>
- #endif
- /* Structures for handler user data */
- typedef struct NotationList {
- struct NotationList *next;
- const XML_Char *notationName;
- const XML_Char *systemId;
- const XML_Char *publicId;
- } NotationList;
- typedef struct xmlwfUserData {
- FILE *fp;
- NotationList *notationListHead;
- const XML_Char *currentDoctypeName;
- } XmlwfUserData;
- /* This ensures proper sorting. */
- #define NSSEP T('\001')
- static void XMLCALL
- characterData(void *userData, const XML_Char *s, int len) {
- FILE *fp = ((XmlwfUserData *)userData)->fp;
- for (; len > 0; --len, ++s) {
- switch (*s) {
- case T('&'):
- fputts(T("&"), fp);
- break;
- case T('<'):
- fputts(T("<"), fp);
- break;
- case T('>'):
- fputts(T(">"), fp);
- break;
- #ifdef W3C14N
- case 13:
- fputts(T("
"), fp);
- break;
- #else
- case T('"'):
- fputts(T("""), fp);
- break;
- case 9:
- case 10:
- case 13:
- ftprintf(fp, T("&#%d;"), *s);
- break;
- #endif
- default:
- puttc(*s, fp);
- break;
- }
- }
- }
- static void
- attributeValue(FILE *fp, const XML_Char *s) {
- puttc(T('='), fp);
- puttc(T('"'), fp);
- assert(s);
- for (;;) {
- switch (*s) {
- case 0:
- case NSSEP:
- puttc(T('"'), fp);
- return;
- case T('&'):
- fputts(T("&"), fp);
- break;
- case T('<'):
- fputts(T("<"), fp);
- break;
- case T('"'):
- fputts(T("""), fp);
- break;
- #ifdef W3C14N
- case 9:
- fputts(T("	"), fp);
- break;
- case 10:
- fputts(T("
"), fp);
- break;
- case 13:
- fputts(T("
"), fp);
- break;
- #else
- case T('>'):
- fputts(T(">"), fp);
- break;
- case 9:
- case 10:
- case 13:
- ftprintf(fp, T("&#%d;"), *s);
- break;
- #endif
- default:
- puttc(*s, fp);
- break;
- }
- s++;
- }
- }
- /* Lexicographically comparing UTF-8 encoded attribute values,
- is equivalent to lexicographically comparing based on the character number. */
- static int
- attcmp(const void *att1, const void *att2) {
- return tcscmp(*(const XML_Char **)att1, *(const XML_Char **)att2);
- }
- static void XMLCALL
- startElement(void *userData, const XML_Char *name, const XML_Char **atts) {
- int nAtts;
- const XML_Char **p;
- FILE *fp = ((XmlwfUserData *)userData)->fp;
- puttc(T('<'), fp);
- fputts(name, fp);
- p = atts;
- while (*p)
- ++p;
- nAtts = (int)((p - atts) >> 1);
- if (nAtts > 1)
- qsort((void *)atts, nAtts, sizeof(XML_Char *) * 2, attcmp);
- while (*atts) {
- puttc(T(' '), fp);
- fputts(*atts++, fp);
- attributeValue(fp, *atts);
- atts++;
- }
- puttc(T('>'), fp);
- }
- static void XMLCALL
- endElement(void *userData, const XML_Char *name) {
- FILE *fp = ((XmlwfUserData *)userData)->fp;
- puttc(T('<'), fp);
- puttc(T('/'), fp);
- fputts(name, fp);
- puttc(T('>'), fp);
- }
- static int
- nsattcmp(const void *p1, const void *p2) {
- const XML_Char *att1 = *(const XML_Char **)p1;
- const XML_Char *att2 = *(const XML_Char **)p2;
- int sep1 = (tcsrchr(att1, NSSEP) != 0);
- int sep2 = (tcsrchr(att1, NSSEP) != 0);
- if (sep1 != sep2)
- return sep1 - sep2;
- return tcscmp(att1, att2);
- }
- static void XMLCALL
- startElementNS(void *userData, const XML_Char *name, const XML_Char **atts) {
- int nAtts;
- int nsi;
- const XML_Char **p;
- FILE *fp = ((XmlwfUserData *)userData)->fp;
- const XML_Char *sep;
- puttc(T('<'), fp);
- sep = tcsrchr(name, NSSEP);
- if (sep) {
- fputts(T("n1:"), fp);
- fputts(sep + 1, fp);
- fputts(T(" xmlns:n1"), fp);
- attributeValue(fp, name);
- nsi = 2;
- } else {
- fputts(name, fp);
- nsi = 1;
- }
- p = atts;
- while (*p)
- ++p;
- nAtts = (int)((p - atts) >> 1);
- if (nAtts > 1)
- qsort((void *)atts, nAtts, sizeof(XML_Char *) * 2, nsattcmp);
- while (*atts) {
- name = *atts++;
- sep = tcsrchr(name, NSSEP);
- puttc(T(' '), fp);
- if (sep) {
- ftprintf(fp, T("n%d:"), nsi);
- fputts(sep + 1, fp);
- } else
- fputts(name, fp);
- attributeValue(fp, *atts);
- if (sep) {
- ftprintf(fp, T(" xmlns:n%d"), nsi++);
- attributeValue(fp, name);
- }
- atts++;
- }
- puttc(T('>'), fp);
- }
- static void XMLCALL
- endElementNS(void *userData, const XML_Char *name) {
- FILE *fp = ((XmlwfUserData *)userData)->fp;
- const XML_Char *sep;
- puttc(T('<'), fp);
- puttc(T('/'), fp);
- sep = tcsrchr(name, NSSEP);
- if (sep) {
- fputts(T("n1:"), fp);
- fputts(sep + 1, fp);
- } else
- fputts(name, fp);
- puttc(T('>'), fp);
- }
- #ifndef W3C14N
- static void XMLCALL
- processingInstruction(void *userData, const XML_Char *target,
- const XML_Char *data) {
- FILE *fp = ((XmlwfUserData *)userData)->fp;
- puttc(T('<'), fp);
- puttc(T('?'), fp);
- fputts(target, fp);
- puttc(T(' '), fp);
- fputts(data, fp);
- puttc(T('?'), fp);
- puttc(T('>'), fp);
- }
- static XML_Char *
- xcsdup(const XML_Char *s) {
- XML_Char *result;
- int count = 0;
- int numBytes;
- /* Get the length of the string, including terminator */
- while (s[count++] != 0) {
- /* Do nothing */
- }
- numBytes = count * sizeof(XML_Char);
- result = malloc(numBytes);
- if (result == NULL)
- return NULL;
- memcpy(result, s, numBytes);
- return result;
- }
- static void XMLCALL
- startDoctypeDecl(void *userData, const XML_Char *doctypeName,
- const XML_Char *sysid, const XML_Char *publid,
- int has_internal_subset) {
- XmlwfUserData *data = (XmlwfUserData *)userData;
- UNUSED_P(sysid);
- UNUSED_P(publid);
- UNUSED_P(has_internal_subset);
- data->currentDoctypeName = xcsdup(doctypeName);
- }
- static void
- freeNotations(XmlwfUserData *data) {
- NotationList *notationListHead = data->notationListHead;
- while (notationListHead != NULL) {
- NotationList *next = notationListHead->next;
- free((void *)notationListHead->notationName);
- free((void *)notationListHead->systemId);
- free((void *)notationListHead->publicId);
- free(notationListHead);
- notationListHead = next;
- }
- data->notationListHead = NULL;
- }
- static int
- xcscmp(const XML_Char *xs, const XML_Char *xt) {
- while (*xs != 0 && *xt != 0) {
- if (*xs < *xt)
- return -1;
- if (*xs > *xt)
- return 1;
- xs++;
- xt++;
- }
- if (*xs < *xt)
- return -1;
- if (*xs > *xt)
- return 1;
- return 0;
- }
- static int
- notationCmp(const void *a, const void *b) {
- const NotationList *const n1 = *(NotationList **)a;
- const NotationList *const n2 = *(NotationList **)b;
- return xcscmp(n1->notationName, n2->notationName);
- }
- static void XMLCALL
- endDoctypeDecl(void *userData) {
- XmlwfUserData *data = (XmlwfUserData *)userData;
- NotationList **notations;
- int notationCount = 0;
- NotationList *p;
- int i;
- /* How many notations do we have? */
- for (p = data->notationListHead; p != NULL; p = p->next)
- notationCount++;
- if (notationCount == 0) {
- /* Nothing to report */
- free((void *)data->currentDoctypeName);
- data->currentDoctypeName = NULL;
- return;
- }
- notations = malloc(notationCount * sizeof(NotationList *));
- if (notations == NULL) {
- fprintf(stderr, "Unable to sort notations");
- freeNotations(data);
- return;
- }
- for (p = data->notationListHead, i = 0; i < notationCount; p = p->next, i++) {
- notations[i] = p;
- }
- qsort(notations, notationCount, sizeof(NotationList *), notationCmp);
- /* Output the DOCTYPE header */
- fputts(T("<!DOCTYPE "), data->fp);
- fputts(data->currentDoctypeName, data->fp);
- fputts(T(" [\n"), data->fp);
- /* Now the NOTATIONs */
- for (i = 0; i < notationCount; i++) {
- fputts(T("<!NOTATION "), data->fp);
- fputts(notations[i]->notationName, data->fp);
- if (notations[i]->publicId != NULL) {
- fputts(T(" PUBLIC '"), data->fp);
- fputts(notations[i]->publicId, data->fp);
- puttc(T('\''), data->fp);
- if (notations[i]->systemId != NULL) {
- puttc(T(' '), data->fp);
- puttc(T('\''), data->fp);
- fputts(notations[i]->systemId, data->fp);
- puttc(T('\''), data->fp);
- }
- } else if (notations[i]->systemId != NULL) {
- fputts(T(" SYSTEM '"), data->fp);
- fputts(notations[i]->systemId, data->fp);
- puttc(T('\''), data->fp);
- }
- puttc(T('>'), data->fp);
- puttc(T('\n'), data->fp);
- }
- /* Finally end the DOCTYPE */
- fputts(T("]>\n"), data->fp);
- free(notations);
- freeNotations(data);
- free((void *)data->currentDoctypeName);
- data->currentDoctypeName = NULL;
- }
- static void XMLCALL
- notationDecl(void *userData, const XML_Char *notationName, const XML_Char *base,
- const XML_Char *systemId, const XML_Char *publicId) {
- XmlwfUserData *data = (XmlwfUserData *)userData;
- NotationList *entry = malloc(sizeof(NotationList));
- const char *errorMessage = "Unable to store NOTATION for output\n";
- UNUSED_P(base);
- if (entry == NULL) {
- fputs(errorMessage, stderr);
- return; /* Nothing we can really do about this */
- }
- entry->notationName = xcsdup(notationName);
- if (entry->notationName == NULL) {
- fputs(errorMessage, stderr);
- free(entry);
- return;
- }
- if (systemId != NULL) {
- entry->systemId = xcsdup(systemId);
- if (entry->systemId == NULL) {
- fputs(errorMessage, stderr);
- free((void *)entry->notationName);
- free(entry);
- return;
- }
- } else {
- entry->systemId = NULL;
- }
- if (publicId != NULL) {
- entry->publicId = xcsdup(publicId);
- if (entry->publicId == NULL) {
- fputs(errorMessage, stderr);
- free((void *)entry->systemId); /* Safe if it's NULL */
- free((void *)entry->notationName);
- free(entry);
- return;
- }
- } else {
- entry->publicId = NULL;
- }
- entry->next = data->notationListHead;
- data->notationListHead = entry;
- }
- #endif /* not W3C14N */
- static void XMLCALL
- defaultCharacterData(void *userData, const XML_Char *s, int len) {
- UNUSED_P(s);
- UNUSED_P(len);
- XML_DefaultCurrent((XML_Parser)userData);
- }
- static void XMLCALL
- defaultStartElement(void *userData, const XML_Char *name,
- const XML_Char **atts) {
- UNUSED_P(name);
- UNUSED_P(atts);
- XML_DefaultCurrent((XML_Parser)userData);
- }
- static void XMLCALL
- defaultEndElement(void *userData, const XML_Char *name) {
- UNUSED_P(name);
- XML_DefaultCurrent((XML_Parser)userData);
- }
- static void XMLCALL
- defaultProcessingInstruction(void *userData, const XML_Char *target,
- const XML_Char *data) {
- UNUSED_P(target);
- UNUSED_P(data);
- XML_DefaultCurrent((XML_Parser)userData);
- }
- static void XMLCALL
- nopCharacterData(void *userData, const XML_Char *s, int len) {
- UNUSED_P(userData);
- UNUSED_P(s);
- UNUSED_P(len);
- }
- static void XMLCALL
- nopStartElement(void *userData, const XML_Char *name, const XML_Char **atts) {
- UNUSED_P(userData);
- UNUSED_P(name);
- UNUSED_P(atts);
- }
- static void XMLCALL
- nopEndElement(void *userData, const XML_Char *name) {
- UNUSED_P(userData);
- UNUSED_P(name);
- }
- static void XMLCALL
- nopProcessingInstruction(void *userData, const XML_Char *target,
- const XML_Char *data) {
- UNUSED_P(userData);
- UNUSED_P(target);
- UNUSED_P(data);
- }
- static void XMLCALL
- markup(void *userData, const XML_Char *s, int len) {
- FILE *fp = ((XmlwfUserData *)XML_GetUserData((XML_Parser)userData))->fp;
- for (; len > 0; --len, ++s)
- puttc(*s, fp);
- }
- static void
- metaLocation(XML_Parser parser) {
- const XML_Char *uri = XML_GetBase(parser);
- FILE *fp = ((XmlwfUserData *)XML_GetUserData(parser))->fp;
- if (uri)
- ftprintf(fp, T(" uri=\"%s\""), uri);
- ftprintf(fp,
- T(" byte=\"%") T(XML_FMT_INT_MOD) T("d\"") T(" nbytes=\"%d\"")
- T(" line=\"%") T(XML_FMT_INT_MOD) T("u\"") T(" col=\"%")
- T(XML_FMT_INT_MOD) T("u\""),
- XML_GetCurrentByteIndex(parser), XML_GetCurrentByteCount(parser),
- XML_GetCurrentLineNumber(parser),
- XML_GetCurrentColumnNumber(parser));
- }
- static void
- metaStartDocument(void *userData) {
- fputts(T("<document>\n"),
- ((XmlwfUserData *)XML_GetUserData((XML_Parser)userData))->fp);
- }
- static void
- metaEndDocument(void *userData) {
- fputts(T("</document>\n"),
- ((XmlwfUserData *)XML_GetUserData((XML_Parser)userData))->fp);
- }
- static void XMLCALL
- metaStartElement(void *userData, const XML_Char *name, const XML_Char **atts) {
- XML_Parser parser = (XML_Parser)userData;
- XmlwfUserData *data = (XmlwfUserData *)XML_GetUserData(parser);
- FILE *fp = data->fp;
- const XML_Char **specifiedAttsEnd
- = atts + XML_GetSpecifiedAttributeCount(parser);
- const XML_Char **idAttPtr;
- int idAttIndex = XML_GetIdAttributeIndex(parser);
- if (idAttIndex < 0)
- idAttPtr = 0;
- else
- idAttPtr = atts + idAttIndex;
- ftprintf(fp, T("<starttag name=\"%s\""), name);
- metaLocation(parser);
- if (*atts) {
- fputts(T(">\n"), fp);
- do {
- ftprintf(fp, T("<attribute name=\"%s\" value=\""), atts[0]);
- characterData(data, atts[1], (int)tcslen(atts[1]));
- if (atts >= specifiedAttsEnd)
- fputts(T("\" defaulted=\"yes\"/>\n"), fp);
- else if (atts == idAttPtr)
- fputts(T("\" id=\"yes\"/>\n"), fp);
- else
- fputts(T("\"/>\n"), fp);
- } while (*(atts += 2));
- fputts(T("</starttag>\n"), fp);
- } else
- fputts(T("/>\n"), fp);
- }
- static void XMLCALL
- metaEndElement(void *userData, const XML_Char *name) {
- XML_Parser parser = (XML_Parser)userData;
- XmlwfUserData *data = (XmlwfUserData *)XML_GetUserData(parser);
- FILE *fp = data->fp;
- ftprintf(fp, T("<endtag name=\"%s\""), name);
- metaLocation(parser);
- fputts(T("/>\n"), fp);
- }
- static void XMLCALL
- metaProcessingInstruction(void *userData, const XML_Char *target,
- const XML_Char *data) {
- XML_Parser parser = (XML_Parser)userData;
- XmlwfUserData *usrData = (XmlwfUserData *)XML_GetUserData(parser);
- FILE *fp = usrData->fp;
- ftprintf(fp, T("<pi target=\"%s\" data=\""), target);
- characterData(usrData, data, (int)tcslen(data));
- puttc(T('"'), fp);
- metaLocation(parser);
- fputts(T("/>\n"), fp);
- }
- static void XMLCALL
- metaComment(void *userData, const XML_Char *data) {
- XML_Parser parser = (XML_Parser)userData;
- XmlwfUserData *usrData = (XmlwfUserData *)XML_GetUserData(parser);
- FILE *fp = usrData->fp;
- fputts(T("<comment data=\""), fp);
- characterData(usrData, data, (int)tcslen(data));
- puttc(T('"'), fp);
- metaLocation(parser);
- fputts(T("/>\n"), fp);
- }
- static void XMLCALL
- metaStartCdataSection(void *userData) {
- XML_Parser parser = (XML_Parser)userData;
- XmlwfUserData *data = (XmlwfUserData *)XML_GetUserData(parser);
- FILE *fp = data->fp;
- fputts(T("<startcdata"), fp);
- metaLocation(parser);
- fputts(T("/>\n"), fp);
- }
- static void XMLCALL
- metaEndCdataSection(void *userData) {
- XML_Parser parser = (XML_Parser)userData;
- XmlwfUserData *data = (XmlwfUserData *)XML_GetUserData(parser);
- FILE *fp = data->fp;
- fputts(T("<endcdata"), fp);
- metaLocation(parser);
- fputts(T("/>\n"), fp);
- }
- static void XMLCALL
- metaCharacterData(void *userData, const XML_Char *s, int len) {
- XML_Parser parser = (XML_Parser)userData;
- XmlwfUserData *data = (XmlwfUserData *)XML_GetUserData(parser);
- FILE *fp = data->fp;
- fputts(T("<chars str=\""), fp);
- characterData(data, s, len);
- puttc(T('"'), fp);
- metaLocation(parser);
- fputts(T("/>\n"), fp);
- }
- static void XMLCALL
- metaStartDoctypeDecl(void *userData, const XML_Char *doctypeName,
- const XML_Char *sysid, const XML_Char *pubid,
- int has_internal_subset) {
- XML_Parser parser = (XML_Parser)userData;
- XmlwfUserData *data = (XmlwfUserData *)XML_GetUserData(parser);
- FILE *fp = data->fp;
- UNUSED_P(sysid);
- UNUSED_P(pubid);
- UNUSED_P(has_internal_subset);
- ftprintf(fp, T("<startdoctype name=\"%s\""), doctypeName);
- metaLocation(parser);
- fputts(T("/>\n"), fp);
- }
- static void XMLCALL
- metaEndDoctypeDecl(void *userData) {
- XML_Parser parser = (XML_Parser)userData;
- XmlwfUserData *data = (XmlwfUserData *)XML_GetUserData(parser);
- FILE *fp = data->fp;
- fputts(T("<enddoctype"), fp);
- metaLocation(parser);
- fputts(T("/>\n"), fp);
- }
- static void XMLCALL
- metaNotationDecl(void *userData, const XML_Char *notationName,
- const XML_Char *base, const XML_Char *systemId,
- const XML_Char *publicId) {
- XML_Parser parser = (XML_Parser)userData;
- XmlwfUserData *data = (XmlwfUserData *)XML_GetUserData(parser);
- FILE *fp = data->fp;
- UNUSED_P(base);
- ftprintf(fp, T("<notation name=\"%s\""), notationName);
- if (publicId)
- ftprintf(fp, T(" public=\"%s\""), publicId);
- if (systemId) {
- fputts(T(" system=\""), fp);
- characterData(data, systemId, (int)tcslen(systemId));
- puttc(T('"'), fp);
- }
- metaLocation(parser);
- fputts(T("/>\n"), fp);
- }
- static void XMLCALL
- metaEntityDecl(void *userData, const XML_Char *entityName, int is_param,
- const XML_Char *value, int value_length, const XML_Char *base,
- const XML_Char *systemId, const XML_Char *publicId,
- const XML_Char *notationName) {
- XML_Parser parser = (XML_Parser)userData;
- XmlwfUserData *data = (XmlwfUserData *)XML_GetUserData(parser);
- FILE *fp = data->fp;
- UNUSED_P(is_param);
- UNUSED_P(base);
- if (value) {
- ftprintf(fp, T("<entity name=\"%s\""), entityName);
- metaLocation(parser);
- puttc(T('>'), fp);
- characterData(data, value, value_length);
- fputts(T("</entity/>\n"), fp);
- } else if (notationName) {
- ftprintf(fp, T("<entity name=\"%s\""), entityName);
- if (publicId)
- ftprintf(fp, T(" public=\"%s\""), publicId);
- fputts(T(" system=\""), fp);
- characterData(data, systemId, (int)tcslen(systemId));
- puttc(T('"'), fp);
- ftprintf(fp, T(" notation=\"%s\""), notationName);
- metaLocation(parser);
- fputts(T("/>\n"), fp);
- } else {
- ftprintf(fp, T("<entity name=\"%s\""), entityName);
- if (publicId)
- ftprintf(fp, T(" public=\"%s\""), publicId);
- fputts(T(" system=\""), fp);
- characterData(data, systemId, (int)tcslen(systemId));
- puttc(T('"'), fp);
- metaLocation(parser);
- fputts(T("/>\n"), fp);
- }
- }
- static void XMLCALL
- metaStartNamespaceDecl(void *userData, const XML_Char *prefix,
- const XML_Char *uri) {
- XML_Parser parser = (XML_Parser)userData;
- XmlwfUserData *data = (XmlwfUserData *)XML_GetUserData(parser);
- FILE *fp = data->fp;
- fputts(T("<startns"), fp);
- if (prefix)
- ftprintf(fp, T(" prefix=\"%s\""), prefix);
- if (uri) {
- fputts(T(" ns=\""), fp);
- characterData(data, uri, (int)tcslen(uri));
- fputts(T("\"/>\n"), fp);
- } else
- fputts(T("/>\n"), fp);
- }
- static void XMLCALL
- metaEndNamespaceDecl(void *userData, const XML_Char *prefix) {
- XML_Parser parser = (XML_Parser)userData;
- XmlwfUserData *data = (XmlwfUserData *)XML_GetUserData(parser);
- FILE *fp = data->fp;
- if (! prefix)
- fputts(T("<endns/>\n"), fp);
- else
- ftprintf(fp, T("<endns prefix=\"%s\"/>\n"), prefix);
- }
- static int XMLCALL
- unknownEncodingConvert(void *data, const char *p) {
- return codepageConvert(*(int *)data, p);
- }
- static int XMLCALL
- unknownEncoding(void *userData, const XML_Char *name, XML_Encoding *info) {
- int cp;
- static const XML_Char prefixL[] = T("windows-");
- static const XML_Char prefixU[] = T("WINDOWS-");
- int i;
- UNUSED_P(userData);
- for (i = 0; prefixU[i]; i++)
- if (name[i] != prefixU[i] && name[i] != prefixL[i])
- return 0;
- cp = 0;
- for (; name[i]; i++) {
- static const XML_Char digits[] = T("0123456789");
- const XML_Char *s = tcschr(digits, name[i]);
- if (! s)
- return 0;
- cp *= 10;
- cp += (int)(s - digits);
- if (cp >= 0x10000)
- return 0;
- }
- if (! codepageMap(cp, info->map))
- return 0;
- info->convert = unknownEncodingConvert;
- /* We could just cast the code page integer to a void *,
- and avoid the use of release. */
- info->release = free;
- info->data = malloc(sizeof(int));
- if (! info->data)
- return 0;
- *(int *)info->data = cp;
- return 1;
- }
- static int XMLCALL
- notStandalone(void *userData) {
- UNUSED_P(userData);
- return 0;
- }
- static void
- showVersion(XML_Char *prog) {
- XML_Char *s = prog;
- XML_Char ch;
- const XML_Feature *features = XML_GetFeatureList();
- while ((ch = *s) != 0) {
- if (ch == '/'
- #if defined(_WIN32)
- || ch == '\\'
- #endif
- )
- prog = s + 1;
- ++s;
- }
- ftprintf(stdout, T("%s using %s\n"), prog, XML_ExpatVersion());
- if (features != NULL && features[0].feature != XML_FEATURE_END) {
- int i = 1;
- ftprintf(stdout, T("%s"), features[0].name);
- if (features[0].value)
- ftprintf(stdout, T("=%ld"), features[0].value);
- while (features[i].feature != XML_FEATURE_END) {
- ftprintf(stdout, T(", %s"), features[i].name);
- if (features[i].value)
- ftprintf(stdout, T("=%ld"), features[i].value);
- ++i;
- }
- ftprintf(stdout, T("\n"));
- }
- }
- static void
- usage(const XML_Char *prog, int rc) {
- ftprintf(
- stderr,
- /* Generated with:
- * $ xmlwf/xmlwf_helpgen.sh
- */
- /* clang-format off */
- T("usage: %s [-s] [-n] [-p] [-x] [-e ENCODING] [-w] [-r] [-d DIRECTORY]\n")
- T(" [-c | -m | -t] [-N]\n")
- T(" [FILE [FILE ...]]\n")
- T("\n")
- T("xmlwf - Determines if an XML document is well-formed\n")
- T("\n")
- T("positional arguments:\n")
- T(" FILE files to process (default: STDIN)\n")
- T("\n")
- T("input control arguments:\n")
- T(" -s print an error if the document is not [s]tandalone\n")
- T(" -n enable [n]amespace processing\n")
- T(" -p enable processing external DTDs and [p]arameter entities\n")
- T(" -x enable processing of e[x]ternal entities\n")
- T(" -e ENCODING override any in-document [e]ncoding declaration\n")
- T(" -w enable support for [W]indows code pages\n")
- T(" -r disable memory-mapping and use normal file [r]ead IO calls instead\n")
- T("\n")
- T("output control arguments:\n")
- T(" -d DIRECTORY output [d]estination directory\n")
- T(" -c write a [c]opy of input XML, not canonical XML\n")
- T(" -m write [m]eta XML, not canonical XML\n")
- T(" -t write no XML output for [t]iming of plain parsing\n")
- T(" -N enable adding doctype and [n]otation declarations\n")
- T("\n")
- T("info arguments:\n")
- T(" -h show this [h]elp message and exit\n")
- T(" -v show program's [v]ersion number and exit\n")
- T("\n")
- T("libexpat is software libre, licensed under the MIT license.\n")
- T("Please report bugs at https://github.com/libexpat/libexpat/issues. Thank you!\n")
- , /* clang-format on */
- prog);
- exit(rc);
- }
- #if defined(__MINGW32__) && defined(XML_UNICODE)
- /* Silence warning about missing prototype */
- int wmain(int argc, XML_Char **argv);
- #endif
- int
- tmain(int argc, XML_Char **argv) {
- int i, j;
- const XML_Char *outputDir = NULL;
- const XML_Char *encoding = NULL;
- unsigned processFlags = XML_MAP_FILE;
- int windowsCodePages = 0;
- int outputType = 0;
- int useNamespaces = 0;
- int requireStandalone = 0;
- int requiresNotations = 0;
- enum XML_ParamEntityParsing paramEntityParsing
- = XML_PARAM_ENTITY_PARSING_NEVER;
- int useStdin = 0;
- XmlwfUserData userData = {NULL, NULL, NULL};
- #ifdef _MSC_VER
- _CrtSetDbgFlag(_CRTDBG_ALLOC_MEM_DF | _CRTDBG_LEAK_CHECK_DF);
- #endif
- i = 1;
- j = 0;
- while (i < argc) {
- if (j == 0) {
- if (argv[i][0] != T('-'))
- break;
- if (argv[i][1] == T('-') && argv[i][2] == T('\0')) {
- i++;
- break;
- }
- j++;
- }
- switch (argv[i][j]) {
- case T('r'):
- processFlags &= ~XML_MAP_FILE;
- j++;
- break;
- case T('s'):
- requireStandalone = 1;
- j++;
- break;
- case T('n'):
- useNamespaces = 1;
- j++;
- break;
- case T('p'):
- paramEntityParsing = XML_PARAM_ENTITY_PARSING_ALWAYS;
- /* fall through */
- case T('x'):
- processFlags |= XML_EXTERNAL_ENTITIES;
- j++;
- break;
- case T('w'):
- windowsCodePages = 1;
- j++;
- break;
- case T('m'):
- outputType = 'm';
- j++;
- break;
- case T('c'):
- outputType = 'c';
- useNamespaces = 0;
- j++;
- break;
- case T('t'):
- outputType = 't';
- j++;
- break;
- case T('N'):
- requiresNotations = 1;
- j++;
- break;
- case T('d'):
- if (argv[i][j + 1] == T('\0')) {
- if (++i == argc)
- usage(argv[0], 2);
- outputDir = argv[i];
- } else
- outputDir = argv[i] + j + 1;
- i++;
- j = 0;
- break;
- case T('e'):
- if (argv[i][j + 1] == T('\0')) {
- if (++i == argc)
- usage(argv[0], 2);
- encoding = argv[i];
- } else
- encoding = argv[i] + j + 1;
- i++;
- j = 0;
- break;
- case T('h'):
- usage(argv[0], 0);
- return 0;
- case T('v'):
- showVersion(argv[0]);
- return 0;
- case T('\0'):
- if (j > 1) {
- i++;
- j = 0;
- break;
- }
- /* fall through */
- default:
- usage(argv[0], 2);
- }
- }
- if (i == argc) {
- useStdin = 1;
- processFlags &= ~XML_MAP_FILE;
- i--;
- }
- for (; i < argc; i++) {
- XML_Char *outName = 0;
- int result;
- XML_Parser parser;
- if (useNamespaces)
- parser = XML_ParserCreateNS(encoding, NSSEP);
- else
- parser = XML_ParserCreate(encoding);
- if (! parser) {
- tperror(T("Could not instantiate parser"));
- exit(1);
- }
- if (requireStandalone)
- XML_SetNotStandaloneHandler(parser, notStandalone);
- XML_SetParamEntityParsing(parser, paramEntityParsing);
- if (outputType == 't') {
- /* This is for doing timings; this gives a more realistic estimate of
- the parsing time. */
- outputDir = 0;
- XML_SetElementHandler(parser, nopStartElement, nopEndElement);
- XML_SetCharacterDataHandler(parser, nopCharacterData);
- XML_SetProcessingInstructionHandler(parser, nopProcessingInstruction);
- } else if (outputDir) {
- const XML_Char *delim = T("/");
- const XML_Char *file = useStdin ? T("STDIN") : argv[i];
- if (! useStdin) {
- /* Jump after last (back)slash */
- const XML_Char *lastDelim = tcsrchr(file, delim[0]);
- if (lastDelim)
- file = lastDelim + 1;
- #if defined(_WIN32)
- else {
- const XML_Char *winDelim = T("\\");
- lastDelim = tcsrchr(file, winDelim[0]);
- if (lastDelim) {
- file = lastDelim + 1;
- delim = winDelim;
- }
- }
- #endif
- }
- outName = (XML_Char *)malloc((tcslen(outputDir) + tcslen(file) + 2)
- * sizeof(XML_Char));
- tcscpy(outName, outputDir);
- tcscat(outName, delim);
- tcscat(outName, file);
- userData.fp = tfopen(outName, T("wb"));
- if (! userData.fp) {
- tperror(outName);
- exit(1);
- }
- setvbuf(userData.fp, NULL, _IOFBF, 16384);
- #ifdef XML_UNICODE
- puttc(0xFEFF, userData.fp);
- #endif
- XML_SetUserData(parser, &userData);
- switch (outputType) {
- case 'm':
- XML_UseParserAsHandlerArg(parser);
- XML_SetElementHandler(parser, metaStartElement, metaEndElement);
- XML_SetProcessingInstructionHandler(parser, metaProcessingInstruction);
- XML_SetCommentHandler(parser, metaComment);
- XML_SetCdataSectionHandler(parser, metaStartCdataSection,
- metaEndCdataSection);
- XML_SetCharacterDataHandler(parser, metaCharacterData);
- XML_SetDoctypeDeclHandler(parser, metaStartDoctypeDecl,
- metaEndDoctypeDecl);
- XML_SetEntityDeclHandler(parser, metaEntityDecl);
- XML_SetNotationDeclHandler(parser, metaNotationDecl);
- XML_SetNamespaceDeclHandler(parser, metaStartNamespaceDecl,
- metaEndNamespaceDecl);
- metaStartDocument(parser);
- break;
- case 'c':
- XML_UseParserAsHandlerArg(parser);
- XML_SetDefaultHandler(parser, markup);
- XML_SetElementHandler(parser, defaultStartElement, defaultEndElement);
- XML_SetCharacterDataHandler(parser, defaultCharacterData);
- XML_SetProcessingInstructionHandler(parser,
- defaultProcessingInstruction);
- break;
- default:
- if (useNamespaces)
- XML_SetElementHandler(parser, startElementNS, endElementNS);
- else
- XML_SetElementHandler(parser, startElement, endElement);
- XML_SetCharacterDataHandler(parser, characterData);
- #ifndef W3C14N
- XML_SetProcessingInstructionHandler(parser, processingInstruction);
- if (requiresNotations) {
- XML_SetDoctypeDeclHandler(parser, startDoctypeDecl, endDoctypeDecl);
- XML_SetNotationDeclHandler(parser, notationDecl);
- }
- #endif /* not W3C14N */
- break;
- }
- }
- if (windowsCodePages)
- XML_SetUnknownEncodingHandler(parser, unknownEncoding, 0);
- result = XML_ProcessFile(parser, useStdin ? NULL : argv[i], processFlags);
- if (outputDir) {
- if (outputType == 'm')
- metaEndDocument(parser);
- fclose(userData.fp);
- if (! result) {
- tremove(outName);
- }
- free(outName);
- }
- XML_ParserFree(parser);
- if (! result) {
- exit(2);
- }
- }
- return 0;
- }
|