| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280 |
- /*
- __ __ _
- ___\ \/ /_ __ __ _| |_
- / _ \\ /| '_ \ / _` | __|
- | __// \| |_) | (_| | |_
- \___/_/\_\ .__/ \__,_|\__|
- |_| XML parser
- Copyright (c) 1997-2000 Thai Open Source Software Center Ltd
- Copyright (c) 2000 Clark Cooper <[email protected]>
- Copyright (c) 2002-2003 Fred L. Drake, Jr. <[email protected]>
- Copyright (c) 2004-2006 Karl Waclawek <[email protected]>
- Copyright (c) 2005-2007 Steven Solie <[email protected]>
- Copyright (c) 2016-2021 Sebastian Pipping <[email protected]>
- Copyright (c) 2017 Rhodri James <[email protected]>
- Copyright (c) 2019 David Loffredo <[email protected]>
- Copyright (c) 2021 Dong-hee Na <[email protected]>
- Licensed under the MIT license:
- Permission is hereby granted, free of charge, to any person obtaining
- a copy of this software and associated documentation files (the
- "Software"), to deal in the Software without restriction, including
- without limitation the rights to use, copy, modify, merge, publish,
- distribute, sublicense, and/or sell copies of the Software, and to permit
- persons to whom the Software is furnished to do so, subject to the
- following conditions:
- The above copyright notice and this permission notice shall be included
- in all copies or substantial portions of the Software.
- THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
- EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
- MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN
- NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,
- DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
- OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
- USE OR OTHER DEALINGS IN THE SOFTWARE.
- */
- #include <expat_config.h>
- #include <stdio.h>
- #include <stdlib.h>
- #include <stddef.h>
- #include <string.h>
- #include <fcntl.h>
- #ifdef _WIN32
- # include "winconfig.h"
- #endif
- #include "expat.h"
- #include "internal.h" /* for UNUSED_P only */
- #include "xmlfile.h"
- #include "xmltchar.h"
- #include "filemap.h"
- #if defined(_MSC_VER)
- # include <io.h>
- #endif
- #ifdef HAVE_UNISTD_H
- # include <unistd.h>
- #endif
- #ifndef O_BINARY
- # ifdef _O_BINARY
- # define O_BINARY _O_BINARY
- # else
- # define O_BINARY 0
- # endif
- #endif
- #ifdef _DEBUG
- # define READ_SIZE 16
- #else
- # define READ_SIZE (1024 * 8)
- #endif
- typedef struct {
- XML_Parser parser;
- int *retPtr;
- } PROCESS_ARGS;
- static int processStream(const XML_Char *filename, XML_Parser parser);
- static void
- reportError(XML_Parser parser, const XML_Char *filename) {
- enum XML_Error code = XML_GetErrorCode(parser);
- const XML_Char *message = XML_ErrorString(code);
- if (message)
- ftprintf(stdout,
- T("%s") T(":%") T(XML_FMT_INT_MOD) T("u") T(":%")
- T(XML_FMT_INT_MOD) T("u") T(": %s\n"),
- filename, XML_GetErrorLineNumber(parser),
- XML_GetErrorColumnNumber(parser), message);
- else
- ftprintf(stderr, T("%s: (unknown message %d)\n"), filename, code);
- }
- /* This implementation will give problems on files larger than INT_MAX. */
- static void
- processFile(const void *data, size_t size, const XML_Char *filename,
- void *args) {
- XML_Parser parser = ((PROCESS_ARGS *)args)->parser;
- int *retPtr = ((PROCESS_ARGS *)args)->retPtr;
- if (XML_Parse(parser, (const char *)data, (int)size, 1) == XML_STATUS_ERROR) {
- reportError(parser, filename);
- *retPtr = 0;
- } else
- *retPtr = 1;
- }
- #if defined(_WIN32)
- static int
- isAsciiLetter(XML_Char c) {
- return (T('a') <= c && c <= T('z')) || (T('A') <= c && c <= T('Z'));
- }
- #endif /* _WIN32 */
- static const XML_Char *
- resolveSystemId(const XML_Char *base, const XML_Char *systemId,
- XML_Char **toFree) {
- XML_Char *s;
- *toFree = 0;
- if (! base || *systemId == T('/')
- #if defined(_WIN32)
- || *systemId == T('\\')
- || (isAsciiLetter(systemId[0]) && systemId[1] == T(':'))
- #endif
- )
- return systemId;
- *toFree = (XML_Char *)malloc((tcslen(base) + tcslen(systemId) + 2)
- * sizeof(XML_Char));
- if (! *toFree)
- return systemId;
- tcscpy(*toFree, base);
- s = *toFree;
- if (tcsrchr(s, T('/')))
- s = tcsrchr(s, T('/')) + 1;
- #if defined(_WIN32)
- if (tcsrchr(s, T('\\')))
- s = tcsrchr(s, T('\\')) + 1;
- #endif
- tcscpy(s, systemId);
- return *toFree;
- }
- static int
- externalEntityRefFilemap(XML_Parser parser, const XML_Char *context,
- const XML_Char *base, const XML_Char *systemId,
- const XML_Char *publicId) {
- int result;
- XML_Char *s;
- const XML_Char *filename;
- XML_Parser entParser = XML_ExternalEntityParserCreate(parser, context, 0);
- int filemapRes;
- PROCESS_ARGS args;
- UNUSED_P(publicId);
- args.retPtr = &result;
- args.parser = entParser;
- filename = resolveSystemId(base, systemId, &s);
- XML_SetBase(entParser, filename);
- filemapRes = filemap(filename, processFile, &args);
- switch (filemapRes) {
- case 0:
- result = 0;
- break;
- case 2:
- ftprintf(stderr,
- T("%s: file too large for memory-mapping")
- T(", switching to streaming\n"),
- filename);
- result = processStream(filename, entParser);
- break;
- }
- free(s);
- XML_ParserFree(entParser);
- return result;
- }
- static int
- processStream(const XML_Char *filename, XML_Parser parser) {
- /* passing NULL for filename means read input from stdin */
- int fd = 0; /* 0 is the fileno for stdin */
- if (filename != NULL) {
- fd = topen(filename, O_BINARY | O_RDONLY);
- if (fd < 0) {
- tperror(filename);
- return 0;
- }
- }
- for (;;) {
- int nread;
- char *buf = (char *)XML_GetBuffer(parser, READ_SIZE);
- if (! buf) {
- if (filename != NULL)
- close(fd);
- ftprintf(stderr, T("%s: out of memory\n"),
- filename != NULL ? filename : T("xmlwf"));
- return 0;
- }
- nread = read(fd, buf, READ_SIZE);
- if (nread < 0) {
- tperror(filename != NULL ? filename : T("STDIN"));
- if (filename != NULL)
- close(fd);
- return 0;
- }
- if (XML_ParseBuffer(parser, nread, nread == 0) == XML_STATUS_ERROR) {
- reportError(parser, filename != NULL ? filename : T("STDIN"));
- if (filename != NULL)
- close(fd);
- return 0;
- }
- if (nread == 0) {
- if (filename != NULL)
- close(fd);
- break;
- ;
- }
- }
- return 1;
- }
- static int
- externalEntityRefStream(XML_Parser parser, const XML_Char *context,
- const XML_Char *base, const XML_Char *systemId,
- const XML_Char *publicId) {
- XML_Char *s;
- const XML_Char *filename;
- int ret;
- XML_Parser entParser = XML_ExternalEntityParserCreate(parser, context, 0);
- UNUSED_P(publicId);
- filename = resolveSystemId(base, systemId, &s);
- XML_SetBase(entParser, filename);
- ret = processStream(filename, entParser);
- free(s);
- XML_ParserFree(entParser);
- return ret;
- }
- int
- XML_ProcessFile(XML_Parser parser, const XML_Char *filename, unsigned flags) {
- int result;
- if (! XML_SetBase(parser, filename)) {
- ftprintf(stderr, T("%s: out of memory"), filename);
- exit(1);
- }
- if (flags & XML_EXTERNAL_ENTITIES)
- XML_SetExternalEntityRefHandler(parser, (flags & XML_MAP_FILE)
- ? externalEntityRefFilemap
- : externalEntityRefStream);
- if (flags & XML_MAP_FILE) {
- int filemapRes;
- PROCESS_ARGS args;
- args.retPtr = &result;
- args.parser = parser;
- filemapRes = filemap(filename, processFile, &args);
- switch (filemapRes) {
- case 0:
- result = 0;
- break;
- case 2:
- ftprintf(stderr,
- T("%s: file too large for memory-mapping")
- T(", switching to streaming\n"),
- filename);
- result = processStream(filename, parser);
- break;
- }
- } else
- result = processStream(filename, parser);
- return result;
- }
|