Home | History | Annotate | Download | only in intl
      1 /* Copyright (C) 1995-1999, 2000-2003 Free Software Foundation, Inc.
      2    Contributed by Ulrich Drepper <drepper (at) gnu.ai.mit.edu>, 1995.
      3 
      4    This program is free software; you can redistribute it and/or modify it
      5    under the terms of the GNU Library General Public License as published
      6    by the Free Software Foundation; either version 2, or (at your option)
      7    any later version.
      8 
      9    This program is distributed in the hope that it will be useful,
     10    but WITHOUT ANY WARRANTY; without even the implied warranty of
     11    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
     12    Library General Public License for more details.
     13 
     14    You should have received a copy of the GNU Library General Public
     15    License along with this program; if not, write to the Free Software
     16    Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307,
     17    USA.  */
     18 
     19 /* Tell glibc's <string.h> to provide a prototype for stpcpy().
     20    This must come before <config.h> because <config.h> may include
     21    <features.h>, and once <features.h> has been included, it's too late.  */
     22 #ifndef _GNU_SOURCE
     23 # define _GNU_SOURCE	1
     24 #endif
     25 
     26 #ifdef HAVE_CONFIG_H
     27 # include <config.h>
     28 #endif
     29 
     30 #include <string.h>
     31 
     32 #if defined _LIBC || defined HAVE_ARGZ_H
     33 # include <argz.h>
     34 #endif
     35 #include <ctype.h>
     36 #include <sys/types.h>
     37 #include <stdlib.h>
     38 
     39 #include "loadinfo.h"
     40 
     41 /* On some strange systems still no definition of NULL is found.  Sigh!  */
     42 #ifndef NULL
     43 # if defined __STDC__ && __STDC__
     44 #  define NULL ((void *) 0)
     45 # else
     46 #  define NULL 0
     47 # endif
     48 #endif
     49 
     50 /* @@ end of prolog @@ */
     51 
     52 #ifdef _LIBC
     53 /* Rename the non ANSI C functions.  This is required by the standard
     54    because some ANSI C functions will require linking with this object
     55    file and the name space must not be polluted.  */
     56 # ifndef stpcpy
     57 #  define stpcpy(dest, src) __stpcpy(dest, src)
     58 # endif
     59 #else
     60 # ifndef HAVE_STPCPY
     61 static char *stpcpy (char *dest, const char *src);
     62 # endif
     63 #endif
     64 
     65 /* Pathname support.
     66    ISSLASH(C)           tests whether C is a directory separator character.
     67    IS_ABSOLUTE_PATH(P)  tests whether P is an absolute path.  If it is not,
     68                         it may be concatenated to a directory pathname.
     69  */
     70 #if defined _WIN32 || defined __WIN32__ || defined __EMX__ || defined __DJGPP__
     71   /* Win32, OS/2, DOS */
     72 # define ISSLASH(C) ((C) == '/' || (C) == '\\')
     73 # define HAS_DEVICE(P) \
     74     ((((P)[0] >= 'A' && (P)[0] <= 'Z') || ((P)[0] >= 'a' && (P)[0] <= 'z')) \
     75      && (P)[1] == ':')
     76 # define IS_ABSOLUTE_PATH(P) (ISSLASH ((P)[0]) || HAS_DEVICE (P))
     77 #else
     78   /* Unix */
     79 # define ISSLASH(C) ((C) == '/')
     80 # define IS_ABSOLUTE_PATH(P) ISSLASH ((P)[0])
     81 #endif
     82 
/* Define functions which are usually not available.  */
     84 
     85 #if !defined _LIBC && !defined HAVE___ARGZ_COUNT
     86 /* Returns the number of strings in ARGZ.  */
     87 static size_t
     88 argz_count__ (const char *argz, size_t len)
     89 {
     90   size_t count = 0;
     91   while (len > 0)
     92     {
     93       size_t part_len = strlen (argz);
     94       argz += part_len + 1;
     95       len -= part_len + 1;
     96       count++;
     97     }
     98   return count;
     99 }
    100 # undef __argz_count
    101 # define __argz_count(argz, len) argz_count__ (argz, len)
    102 #else
    103 # ifdef _LIBC
    104 #  define __argz_count(argz, len) INTUSE(__argz_count) (argz, len)
    105 # endif
    106 #endif	/* !_LIBC && !HAVE___ARGZ_COUNT */
    107 
    108 #if !defined _LIBC && !defined HAVE___ARGZ_STRINGIFY
    109 /* Make '\0' separated arg vector ARGZ printable by converting all the '\0's
    110    except the last into the character SEP.  */
    111 static void
    112 argz_stringify__ (char *argz, size_t len, int sep)
    113 {
    114   while (len > 0)
    115     {
    116       size_t part_len = strlen (argz);
    117       argz += part_len;
    118       len -= part_len + 1;
    119       if (len > 0)
    120 	*argz++ = sep;
    121     }
    122 }
    123 # undef __argz_stringify
    124 # define __argz_stringify(argz, len, sep) argz_stringify__ (argz, len, sep)
    125 #else
    126 # ifdef _LIBC
    127 #  define __argz_stringify(argz, len, sep) \
    128   INTUSE(__argz_stringify) (argz, len, sep)
    129 # endif
    130 #endif	/* !_LIBC && !HAVE___ARGZ_STRINGIFY */
    131 
    132 #if !defined _LIBC && !defined HAVE___ARGZ_NEXT
    133 static char *
    134 argz_next__ (char *argz, size_t argz_len, const char *entry)
    135 {
    136   if (entry)
    137     {
    138       if (entry < argz + argz_len)
    139         entry = strchr (entry, '\0') + 1;
    140 
    141       return entry >= argz + argz_len ? NULL : (char *) entry;
    142     }
    143   else
    144     if (argz_len > 0)
    145       return argz;
    146     else
    147       return 0;
    148 }
    149 # undef __argz_next
    150 # define __argz_next(argz, len, entry) argz_next__ (argz, len, entry)
    151 #endif	/* !_LIBC && !HAVE___ARGZ_NEXT */
    152 
    153 
    154 /* Return number of bits set in X.  */
    155 static inline int
    156 pop (int x)
    157 {
    158   /* We assume that no more than 16 bits are used.  */
    159   x = ((x & ~0x5555) >> 1) + (x & 0x5555);
    160   x = ((x & ~0x3333) >> 2) + (x & 0x3333);
    161   x = ((x >> 4) + x) & 0x0f0f;
    162   x = ((x >> 8) + x) & 0xff;
    163 
    164   return x;
    165 }
    166 
    167 
    168 struct loaded_l10nfile *
    170 _nl_make_l10nflist (struct loaded_l10nfile **l10nfile_list,
    171 		    const char *dirlist, size_t dirlist_len,
    172 		    int mask, const char *language, const char *territory,
    173 		    const char *codeset, const char *normalized_codeset,
    174 		    const char *modifier, const char *special,
    175 		    const char *sponsor, const char *revision,
    176 		    const char *filename, int do_allocate)
    177 {
    178   char *abs_filename;
    179   struct loaded_l10nfile **lastp;
    180   struct loaded_l10nfile *retval;
    181   char *cp;
    182   size_t dirlist_count;
    183   size_t entries;
    184   int cnt;
    185 
    186   /* If LANGUAGE contains an absolute directory specification, we ignore
    187      DIRLIST.  */
    188   if (IS_ABSOLUTE_PATH (language))
    189     dirlist_len = 0;
    190 
    191   /* Allocate room for the full file name.  */
    192   abs_filename = (char *) malloc (dirlist_len
    193 				  + strlen (language)
    194 				  + ((mask & TERRITORY) != 0
    195 				     ? strlen (territory) + 1 : 0)
    196 				  + ((mask & XPG_CODESET) != 0
    197 				     ? strlen (codeset) + 1 : 0)
    198 				  + ((mask & XPG_NORM_CODESET) != 0
    199 				     ? strlen (normalized_codeset) + 1 : 0)
    200 				  + (((mask & XPG_MODIFIER) != 0
    201 				      || (mask & CEN_AUDIENCE) != 0)
    202 				     ? strlen (modifier) + 1 : 0)
    203 				  + ((mask & CEN_SPECIAL) != 0
    204 				     ? strlen (special) + 1 : 0)
    205 				  + (((mask & CEN_SPONSOR) != 0
    206 				      || (mask & CEN_REVISION) != 0)
    207 				     ? (1 + ((mask & CEN_SPONSOR) != 0
    208 					     ? strlen (sponsor) : 0)
    209 					+ ((mask & CEN_REVISION) != 0
    210 					   ? strlen (revision) + 1 : 0)) : 0)
    211 				  + 1 + strlen (filename) + 1);
    212 
    213   if (abs_filename == NULL)
    214     return NULL;
    215 
    216   /* Construct file name.  */
    217   cp = abs_filename;
    218   if (dirlist_len > 0)
    219     {
    220       memcpy (cp, dirlist, dirlist_len);
    221       __argz_stringify (cp, dirlist_len, PATH_SEPARATOR);
    222       cp += dirlist_len;
    223       cp[-1] = '/';
    224     }
    225 
    226   cp = stpcpy (cp, language);
    227 
    228   if ((mask & TERRITORY) != 0)
    229     {
    230       *cp++ = '_';
    231       cp = stpcpy (cp, territory);
    232     }
    233   if ((mask & XPG_CODESET) != 0)
    234     {
    235       *cp++ = '.';
    236       cp = stpcpy (cp, codeset);
    237     }
    238   if ((mask & XPG_NORM_CODESET) != 0)
    239     {
    240       *cp++ = '.';
    241       cp = stpcpy (cp, normalized_codeset);
    242     }
    243   if ((mask & (XPG_MODIFIER | CEN_AUDIENCE)) != 0)
    244     {
    245       /* This component can be part of both syntaces but has different
    246 	 leading characters.  For CEN we use `+', else `@'.  */
    247       *cp++ = (mask & CEN_AUDIENCE) != 0 ? '+' : '@';
    248       cp = stpcpy (cp, modifier);
    249     }
    250   if ((mask & CEN_SPECIAL) != 0)
    251     {
    252       *cp++ = '+';
    253       cp = stpcpy (cp, special);
    254     }
    255   if ((mask & (CEN_SPONSOR | CEN_REVISION)) != 0)
    256     {
    257       *cp++ = ',';
    258       if ((mask & CEN_SPONSOR) != 0)
    259 	cp = stpcpy (cp, sponsor);
    260       if ((mask & CEN_REVISION) != 0)
    261 	{
    262 	  *cp++ = '_';
    263 	  cp = stpcpy (cp, revision);
    264 	}
    265     }
    266 
    267   *cp++ = '/';
    268   stpcpy (cp, filename);
    269 
    270   /* Look in list of already loaded domains whether it is already
    271      available.  */
    272   lastp = l10nfile_list;
    273   for (retval = *l10nfile_list; retval != NULL; retval = retval->next)
    274     if (retval->filename != NULL)
    275       {
    276 	int compare = strcmp (retval->filename, abs_filename);
    277 	if (compare == 0)
    278 	  /* We found it!  */
    279 	  break;
    280 	if (compare < 0)
    281 	  {
    282 	    /* It's not in the list.  */
    283 	    retval = NULL;
    284 	    break;
    285 	  }
    286 
    287 	lastp = &retval->next;
    288       }
    289 
    290   if (retval != NULL || do_allocate == 0)
    291     {
    292       free (abs_filename);
    293       return retval;
    294     }
    295 
    296   dirlist_count = (dirlist_len > 0 ? __argz_count (dirlist, dirlist_len) : 1);
    297 
    298   /* Allocate a new loaded_l10nfile.  */
    299   retval =
    300     (struct loaded_l10nfile *)
    301     malloc (sizeof (*retval)
    302 	    + (((dirlist_count << pop (mask)) + (dirlist_count > 1 ? 1 : 0))
    303 	       * sizeof (struct loaded_l10nfile *)));
    304   if (retval == NULL)
    305     return NULL;
    306 
    307   retval->filename = abs_filename;
    308 
    309   /* We set retval->data to NULL here; it is filled in later.
    310      Setting retval->decided to 1 here means that retval does not
    311      correspond to a real file (dirlist_count > 1) or is not worth
    312      looking up (if an unnormalized codeset was specified).  */
    313   retval->decided = (dirlist_count > 1
    314 		     || ((mask & XPG_CODESET) != 0
    315 			 && (mask & XPG_NORM_CODESET) != 0));
    316   retval->data = NULL;
    317 
    318   retval->next = *lastp;
    319   *lastp = retval;
    320 
    321   entries = 0;
    322   /* Recurse to fill the inheritance list of RETVAL.
    323      If the DIRLIST is a real list (i.e. DIRLIST_COUNT > 1), the RETVAL
    324      entry does not correspond to a real file; retval->filename contains
    325      colons.  In this case we loop across all elements of DIRLIST and
    326      across all bit patterns dominated by MASK.
    327      If the DIRLIST is a single directory or entirely redundant (i.e.
    328      DIRLIST_COUNT == 1), we loop across all bit patterns dominated by
    329      MASK, excluding MASK itself.
    330      In either case, we loop down from MASK to 0.  This has the effect
    331      that the extra bits in the locale name are dropped in this order:
    332      first the modifier, then the territory, then the codeset, then the
    333      normalized_codeset.  */
    334   for (cnt = dirlist_count > 1 ? mask : mask - 1; cnt >= 0; --cnt)
    335     if ((cnt & ~mask) == 0
    336 	&& ((cnt & CEN_SPECIFIC) == 0 || (cnt & XPG_SPECIFIC) == 0)
    337 	&& ((cnt & XPG_CODESET) == 0 || (cnt & XPG_NORM_CODESET) == 0))
    338       {
    339 	if (dirlist_count > 1)
    340 	  {
    341 	    /* Iterate over all elements of the DIRLIST.  */
    342 	    char *dir = NULL;
    343 
    344 	    while ((dir = __argz_next ((char *) dirlist, dirlist_len, dir))
    345 		   != NULL)
    346 	      retval->successor[entries++]
    347 		= _nl_make_l10nflist (l10nfile_list, dir, strlen (dir) + 1,
    348 				      cnt, language, territory, codeset,
    349 				      normalized_codeset, modifier, special,
    350 				      sponsor, revision, filename, 1);
    351 	  }
    352 	else
    353 	  retval->successor[entries++]
    354 	    = _nl_make_l10nflist (l10nfile_list, dirlist, dirlist_len,
    355 				  cnt, language, territory, codeset,
    356 				  normalized_codeset, modifier, special,
    357 				  sponsor, revision, filename, 1);
    358       }
    359   retval->successor[entries] = NULL;
    360 
    361   return retval;
    362 }
    363 
    364 /* Normalize codeset name.  There is no standard for the codeset
    366    names.  Normalization allows the user to use any of the common
    367    names.  The return value is dynamically allocated and has to be
    368    freed by the caller.  */
    369 const char *
    370 _nl_normalize_codeset (const char *codeset, size_t name_len)
    371 {
    372   int len = 0;
    373   int only_digit = 1;
    374   char *retval;
    375   char *wp;
    376   size_t cnt;
    377 
    378   for (cnt = 0; cnt < name_len; ++cnt)
    379     if (isalnum ((unsigned char) codeset[cnt]))
    380       {
    381 	++len;
    382 
    383 	if (isalpha ((unsigned char) codeset[cnt]))
    384 	  only_digit = 0;
    385       }
    386 
    387   retval = (char *) malloc ((only_digit ? 3 : 0) + len + 1);
    388 
    389   if (retval != NULL)
    390     {
    391       if (only_digit)
    392 	wp = stpcpy (retval, "iso");
    393       else
    394 	wp = retval;
    395 
    396       for (cnt = 0; cnt < name_len; ++cnt)
    397 	if (isalpha ((unsigned char) codeset[cnt]))
    398 	  *wp++ = tolower ((unsigned char) codeset[cnt]);
    399 	else if (isdigit ((unsigned char) codeset[cnt]))
    400 	  *wp++ = codeset[cnt];
    401 
    402       *wp = '\0';
    403     }
    404 
    405   return (const char *) retval;
    406 }
    407 
    408 
    409 /* @@ begin of epilog @@ */
    410 
    411 /* We don't want libintl.a to depend on any other library.  So we
    412    avoid the non-standard function stpcpy.  In GNU C Library this
    413    function is available, though.  Also allow the symbol HAVE_STPCPY
    414    to be defined.  */
    415 #if !_LIBC && !HAVE_STPCPY
    416 static char *
    417 stpcpy (char *dest, const char *src)
    418 {
    419   while ((*dest++ = *src++) != '\0')
    420     /* Do nothing. */ ;
    421   return dest - 1;
    422 }
    423 #endif
    424