Home | History | Annotate | Download | only in xmlwf
      1 /*
      2                             __  __            _
      3                          ___\ \/ /_ __   __ _| |_
      4                         / _ \\  /| '_ \ / _` | __|
      5                        |  __//  \| |_) | (_| | |_
      6                         \___/_/\_\ .__/ \__,_|\__|
      7                                  |_| XML parser
      8 
      9    Copyright (c) 1997-2000 Thai Open Source Software Center Ltd
     10    Copyright (c) 2000-2017 Expat development team
     11    Licensed under the MIT license:
     12 
     13    Permission is  hereby granted,  free of charge,  to any  person obtaining
     14    a  copy  of  this  software   and  associated  documentation  files  (the
     15    "Software"),  to  deal in  the  Software  without restriction,  including
     16    without  limitation the  rights  to use,  copy,  modify, merge,  publish,
     17    distribute, sublicense, and/or sell copies of the Software, and to permit
     18    persons  to whom  the Software  is  furnished to  do so,  subject to  the
     19    following conditions:
     20 
     21    The above copyright  notice and this permission notice  shall be included
     22    in all copies or substantial portions of the Software.
     23 
     24    THE  SOFTWARE  IS  PROVIDED  "AS  IS",  WITHOUT  WARRANTY  OF  ANY  KIND,
     25    EXPRESS  OR IMPLIED,  INCLUDING  BUT  NOT LIMITED  TO  THE WARRANTIES  OF
     26    MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN
     27    NO EVENT SHALL THE AUTHORS OR  COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,
     28    DAMAGES OR  OTHER LIABILITY, WHETHER  IN AN  ACTION OF CONTRACT,  TORT OR
     29    OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
     30    USE OR OTHER DEALINGS IN THE SOFTWARE.
     31 */
     32 
     33 #include <stdio.h>
     34 #include <stdlib.h>
     35 #include <stddef.h>
     36 #include <string.h>
     37 #include <fcntl.h>
     38 
     39 #ifdef _WIN32
     40 #include "winconfig.h"
     41 #elif defined(HAVE_EXPAT_CONFIG_H)
     42 #include <expat_config.h>
     43 #endif /* ndef _WIN32 */
     44 
     45 #include "expat.h"
     46 #include "internal.h"  /* for UNUSED_P only */
     47 #include "xmlfile.h"
     48 #include "xmltchar.h"
     49 #include "filemap.h"
     50 
     51 #if defined(_MSC_VER)
     52 #include <io.h>
     53 #endif
     54 
     55 #ifdef HAVE_UNISTD_H
     56 #include <unistd.h>
     57 #endif
     58 
     59 #ifndef O_BINARY
     60 #ifdef _O_BINARY
     61 #define O_BINARY _O_BINARY
     62 #else
     63 #define O_BINARY 0
     64 #endif
     65 #endif
     66 
     67 #ifdef _DEBUG
     68 #define READ_SIZE 16
     69 #else
     70 #define READ_SIZE (1024*8)
     71 #endif
     72 
     73 
     74 typedef struct {
     75   XML_Parser parser;
     76   int *retPtr;
     77 } PROCESS_ARGS;
     78 
     79 static int
     80 processStream(const XML_Char *filename, XML_Parser parser);
     81 
     82 static void
     83 reportError(XML_Parser parser, const XML_Char *filename)
     84 {
     85   enum XML_Error code = XML_GetErrorCode(parser);
     86   const XML_Char *message = XML_ErrorString(code);
     87   if (message)
     88     ftprintf(stdout,
     89              T("%s")
     90                T(":%") T(XML_FMT_INT_MOD) T("u")
     91                T(":%") T(XML_FMT_INT_MOD) T("u")
     92                T(": %s\n"),
     93              filename,
     94              XML_GetErrorLineNumber(parser),
     95              XML_GetErrorColumnNumber(parser),
     96              message);
     97   else
     98     ftprintf(stderr, T("%s: (unknown message %d)\n"), filename, code);
     99 }
    100 
    101 /* This implementation will give problems on files larger than INT_MAX. */
    102 static void
    103 processFile(const void *data, size_t size,
    104             const XML_Char *filename, void *args)
    105 {
    106   XML_Parser parser = ((PROCESS_ARGS *)args)->parser;
    107   int *retPtr = ((PROCESS_ARGS *)args)->retPtr;
    108   if (XML_Parse(parser, (const char *)data, (int)size, 1) == XML_STATUS_ERROR) {
    109     reportError(parser, filename);
    110     *retPtr = 0;
    111   }
    112   else
    113     *retPtr = 1;
    114 }
    115 
    116 #if defined(_WIN32)
    117 
    118 static int
    119 isAsciiLetter(XML_Char c)
    120 {
    121   return (T('a') <= c && c <= T('z')) || (T('A') <= c && c <= T('Z'));
    122 }
    123 
    124 #endif /* _WIN32 */
    125 
    126 static const XML_Char *
    127 resolveSystemId(const XML_Char *base, const XML_Char *systemId,
    128                 XML_Char **toFree)
    129 {
    130   XML_Char *s;
    131   *toFree = 0;
    132   if (!base
    133       || *systemId == T('/')
    134 #if defined(_WIN32)
    135       || *systemId == T('\\')
    136       || (isAsciiLetter(systemId[0]) && systemId[1] == T(':'))
    137 #endif
    138      )
    139     return systemId;
    140   *toFree = (XML_Char *)malloc((tcslen(base) + tcslen(systemId) + 2)
    141                                * sizeof(XML_Char));
    142   if (!*toFree)
    143     return systemId;
    144   tcscpy(*toFree, base);
    145   s = *toFree;
    146   if (tcsrchr(s, T('/')))
    147     s = tcsrchr(s, T('/')) + 1;
    148 #if defined(_WIN32)
    149   if (tcsrchr(s, T('\\')))
    150     s = tcsrchr(s, T('\\')) + 1;
    151 #endif
    152   tcscpy(s, systemId);
    153   return *toFree;
    154 }
    155 
    156 static int
    157 externalEntityRefFilemap(XML_Parser parser,
    158                          const XML_Char *context,
    159                          const XML_Char *base,
    160                          const XML_Char *systemId,
    161                          const XML_Char *UNUSED_P(publicId))
    162 {
    163   int result;
    164   XML_Char *s;
    165   const XML_Char *filename;
    166   XML_Parser entParser = XML_ExternalEntityParserCreate(parser, context, 0);
    167   int filemapRes;
    168   PROCESS_ARGS args;
    169   args.retPtr = &result;
    170   args.parser = entParser;
    171   filename = resolveSystemId(base, systemId, &s);
    172   XML_SetBase(entParser, filename);
    173   filemapRes = filemap(filename, processFile, &args);
    174   switch (filemapRes) {
    175   case 0:
    176     result = 0;
    177     break;
    178   case 2:
    179     ftprintf(stderr, T("%s: file too large for memory-mapping")
    180         T(", switching to streaming\n"), filename);
    181     result = processStream(filename, entParser);
    182     break;
    183   }
    184   free(s);
    185   XML_ParserFree(entParser);
    186   return result;
    187 }
    188 
    189 static int
    190 processStream(const XML_Char *filename, XML_Parser parser)
    191 {
    192   /* passing NULL for filename means read intput from stdin */
    193   int fd = 0;   /* 0 is the fileno for stdin */
    194 
    195   if (filename != NULL) {
    196     fd = topen(filename, O_BINARY|O_RDONLY);
    197     if (fd < 0) {
    198       tperror(filename);
    199       return 0;
    200     }
    201   }
    202   for (;;) {
    203     int nread;
    204     char *buf = (char *)XML_GetBuffer(parser, READ_SIZE);
    205     if (!buf) {
    206       if (filename != NULL)
    207         close(fd);
    208       ftprintf(stderr, T("%s: out of memory\n"),
    209                filename != NULL ? filename : T("xmlwf"));
    210       return 0;
    211     }
    212     nread = read(fd, buf, READ_SIZE);
    213     if (nread < 0) {
    214       tperror(filename != NULL ? filename : T("STDIN"));
    215       if (filename != NULL)
    216         close(fd);
    217       return 0;
    218     }
    219     if (XML_ParseBuffer(parser, nread, nread == 0) == XML_STATUS_ERROR) {
    220         reportError(parser, filename != NULL ? filename : T("STDIN"));
    221       if (filename != NULL)
    222         close(fd);
    223       return 0;
    224     }
    225     if (nread == 0) {
    226       if (filename != NULL)
    227         close(fd);
    228       break;;
    229     }
    230   }
    231   return 1;
    232 }
    233 
    234 static int
    235 externalEntityRefStream(XML_Parser parser,
    236                         const XML_Char *context,
    237                         const XML_Char *base,
    238                         const XML_Char *systemId,
    239                         const XML_Char *UNUSED_P(publicId))
    240 {
    241   XML_Char *s;
    242   const XML_Char *filename;
    243   int ret;
    244   XML_Parser entParser = XML_ExternalEntityParserCreate(parser, context, 0);
    245   filename = resolveSystemId(base, systemId, &s);
    246   XML_SetBase(entParser, filename);
    247   ret = processStream(filename, entParser);
    248   free(s);
    249   XML_ParserFree(entParser);
    250   return ret;
    251 }
    252 
    253 int
    254 XML_ProcessFile(XML_Parser parser,
    255                 const XML_Char *filename,
    256                 unsigned flags)
    257 {
    258   int result;
    259 
    260   if (!XML_SetBase(parser, filename)) {
    261     ftprintf(stderr, T("%s: out of memory"), filename);
    262     exit(1);
    263   }
    264 
    265   if (flags & XML_EXTERNAL_ENTITIES)
    266       XML_SetExternalEntityRefHandler(parser,
    267                                       (flags & XML_MAP_FILE)
    268                                       ? externalEntityRefFilemap
    269                                       : externalEntityRefStream);
    270   if (flags & XML_MAP_FILE) {
    271     int filemapRes;
    272     PROCESS_ARGS args;
    273     args.retPtr = &result;
    274     args.parser = parser;
    275     filemapRes = filemap(filename, processFile, &args);
    276     switch (filemapRes) {
    277     case 0:
    278       result = 0;
    279       break;
    280     case 2:
    281       ftprintf(stderr, T("%s: file too large for memory-mapping")
    282           T(", switching to streaming\n"), filename);
    283       result = processStream(filename, parser);
    284       break;
    285     }
    286   }
    287   else
    288     result = processStream(filename, parser);
    289   return result;
    290 }
    291