Home | History | Annotate | Download | only in build
      1 #!/usr/bin/env python
      2 # Copyright 2013 The Chromium Authors. All rights reserved.
      3 # Use of this source code is governed by a BSD-style license that can be
      4 # found in the LICENSE file.
      5 
      6 """
      7 localize.py -- Generates an output file from the given template replacing
      8 variables and localizing strings.
      9 
     10 The script uses Jinja2 template processing library (src/third_party/jinja2).
     11 Variables available to the templates:
     12   - |languages| - the list of languages passed on the command line. ('-l').
     13   - Each NAME=VALUE define ('-d') can be accesses as {{ NAME }}.
     14   - |official_build| is set to '1' when CHROME_BUILD_TYPE environment variable
     15     is set to "_official".
     16 
     17 Filters:
     18   - GetCodepage - returns the code page for the given language.
     19   - GetCodepageDecimal same as GetCodepage, but returns a decimal value.
     20   - GetLangId - returns Win32 LANGID.
     21   - GetPrimaryLanguage - returns a named Win32 constant specifing the primary
     22     language ID.
     23   - GetSublanguage -  returns a named Win32 constant specifing the sublanguage
     24     ID.
     25 
     26 Globals:
     27   - IsRtlLanguage(language) - returns True if the language is right-to-left.
     28   - SelectLanguage(language) - allows to select the language to the used by
     29     {% trans %}{% endtrans %} statements.
     30 
     31 """
     32 
     33 import io
     34 import json
     35 from optparse import OptionParser
     36 import os
     37 import sys
     38 from string import Template
     39 
     40 
     41 # Win32 primary languages IDs.
     42 _LANGUAGE_PRIMARY = {
     43   'LANG_NEUTRAL' : 0x00,
     44   'LANG_INVARIANT' : 0x7f,
     45   'LANG_AFRIKAANS' : 0x36,
     46   'LANG_ALBANIAN' : 0x1c,
     47   'LANG_ALSATIAN' : 0x84,
     48   'LANG_AMHARIC' : 0x5e,
     49   'LANG_ARABIC' : 0x01,
     50   'LANG_ARMENIAN' : 0x2b,
     51   'LANG_ASSAMESE' : 0x4d,
     52   'LANG_AZERI' : 0x2c,
     53   'LANG_BASHKIR' : 0x6d,
     54   'LANG_BASQUE' : 0x2d,
     55   'LANG_BELARUSIAN' : 0x23,
     56   'LANG_BENGALI' : 0x45,
     57   'LANG_BRETON' : 0x7e,
     58   'LANG_BOSNIAN' : 0x1a,
     59   'LANG_BULGARIAN' : 0x02,
     60   'LANG_CATALAN' : 0x03,
     61   'LANG_CHINESE' : 0x04,
     62   'LANG_CORSICAN' : 0x83,
     63   'LANG_CROATIAN' : 0x1a,
     64   'LANG_CZECH' : 0x05,
     65   'LANG_DANISH' : 0x06,
     66   'LANG_DARI' : 0x8c,
     67   'LANG_DIVEHI' : 0x65,
     68   'LANG_DUTCH' : 0x13,
     69   'LANG_ENGLISH' : 0x09,
     70   'LANG_ESTONIAN' : 0x25,
     71   'LANG_FAEROESE' : 0x38,
     72   'LANG_FILIPINO' : 0x64,
     73   'LANG_FINNISH' : 0x0b,
     74   'LANG_FRENCH' : 0x0c,
     75   'LANG_FRISIAN' : 0x62,
     76   'LANG_GALICIAN' : 0x56,
     77   'LANG_GEORGIAN' : 0x37,
     78   'LANG_GERMAN' : 0x07,
     79   'LANG_GREEK' : 0x08,
     80   'LANG_GREENLANDIC' : 0x6f,
     81   'LANG_GUJARATI' : 0x47,
     82   'LANG_HAUSA' : 0x68,
     83   'LANG_HEBREW' : 0x0d,
     84   'LANG_HINDI' : 0x39,
     85   'LANG_HUNGARIAN' : 0x0e,
     86   'LANG_ICELANDIC' : 0x0f,
     87   'LANG_IGBO' : 0x70,
     88   'LANG_INDONESIAN' : 0x21,
     89   'LANG_INUKTITUT' : 0x5d,
     90   'LANG_IRISH' : 0x3c,
     91   'LANG_ITALIAN' : 0x10,
     92   'LANG_JAPANESE' : 0x11,
     93   'LANG_KANNADA' : 0x4b,
     94   'LANG_KASHMIRI' : 0x60,
     95   'LANG_KAZAK' : 0x3f,
     96   'LANG_KHMER' : 0x53,
     97   'LANG_KICHE' : 0x86,
     98   'LANG_KINYARWANDA' : 0x87,
     99   'LANG_KONKANI' : 0x57,
    100   'LANG_KOREAN' : 0x12,
    101   'LANG_KYRGYZ' : 0x40,
    102   'LANG_LAO' : 0x54,
    103   'LANG_LATVIAN' : 0x26,
    104   'LANG_LITHUANIAN' : 0x27,
    105   'LANG_LOWER_SORBIAN' : 0x2e,
    106   'LANG_LUXEMBOURGISH' : 0x6e,
    107   'LANG_MACEDONIAN' : 0x2f,
    108   'LANG_MALAY' : 0x3e,
    109   'LANG_MALAYALAM' : 0x4c,
    110   'LANG_MALTESE' : 0x3a,
    111   'LANG_MANIPURI' : 0x58,
    112   'LANG_MAORI' : 0x81,
    113   'LANG_MAPUDUNGUN' : 0x7a,
    114   'LANG_MARATHI' : 0x4e,
    115   'LANG_MOHAWK' : 0x7c,
    116   'LANG_MONGOLIAN' : 0x50,
    117   'LANG_NEPALI' : 0x61,
    118   'LANG_NORWEGIAN' : 0x14,
    119   'LANG_OCCITAN' : 0x82,
    120   'LANG_ORIYA' : 0x48,
    121   'LANG_PASHTO' : 0x63,
    122   'LANG_PERSIAN' : 0x29,
    123   'LANG_POLISH' : 0x15,
    124   'LANG_PORTUGUESE' : 0x16,
    125   'LANG_PUNJABI' : 0x46,
    126   'LANG_QUECHUA' : 0x6b,
    127   'LANG_ROMANIAN' : 0x18,
    128   'LANG_ROMANSH' : 0x17,
    129   'LANG_RUSSIAN' : 0x19,
    130   'LANG_SAMI' : 0x3b,
    131   'LANG_SANSKRIT' : 0x4f,
    132   'LANG_SCOTTISH_GAELIC' : 0x91,
    133   'LANG_SERBIAN' : 0x1a,
    134   'LANG_SINDHI' : 0x59,
    135   'LANG_SINHALESE' : 0x5b,
    136   'LANG_SLOVAK' : 0x1b,
    137   'LANG_SLOVENIAN' : 0x24,
    138   'LANG_SOTHO' : 0x6c,
    139   'LANG_SPANISH' : 0x0a,
    140   'LANG_SWAHILI' : 0x41,
    141   'LANG_SWEDISH' : 0x1d,
    142   'LANG_SYRIAC' : 0x5a,
    143   'LANG_TAJIK' : 0x28,
    144   'LANG_TAMAZIGHT' : 0x5f,
    145   'LANG_TAMIL' : 0x49,
    146   'LANG_TATAR' : 0x44,
    147   'LANG_TELUGU' : 0x4a,
    148   'LANG_THAI' : 0x1e,
    149   'LANG_TIBETAN' : 0x51,
    150   'LANG_TIGRIGNA' : 0x73,
    151   'LANG_TSWANA' : 0x32,
    152   'LANG_TURKISH' : 0x1f,
    153   'LANG_TURKMEN' : 0x42,
    154   'LANG_UIGHUR' : 0x80,
    155   'LANG_UKRAINIAN' : 0x22,
    156   'LANG_UPPER_SORBIAN' : 0x2e,
    157   'LANG_URDU' : 0x20,
    158   'LANG_UZBEK' : 0x43,
    159   'LANG_VIETNAMESE' : 0x2a,
    160   'LANG_WELSH' : 0x52,
    161   'LANG_WOLOF' : 0x88,
    162   'LANG_XHOSA' : 0x34,
    163   'LANG_YAKUT' : 0x85,
    164   'LANG_YI' : 0x78,
    165   'LANG_YORUBA' : 0x6a,
    166   'LANG_ZULU' : 0x35,
    167 }
    168 
    169 
    170 # Win32 sublanguage IDs.
    171 _LANGUAGE_SUB = {
    172   'SUBLANG_NEUTRAL' : 0x00,
    173   'SUBLANG_DEFAULT' : 0x01,
    174   'SUBLANG_SYS_DEFAULT' : 0x02,
    175   'SUBLANG_CUSTOM_DEFAULT' : 0x03,
    176   'SUBLANG_CUSTOM_UNSPECIFIED' : 0x04,
    177   'SUBLANG_UI_CUSTOM_DEFAULT' : 0x05,
    178   'SUBLANG_AFRIKAANS_SOUTH_AFRICA' : 0x01,
    179   'SUBLANG_ALBANIAN_ALBANIA' : 0x01,
    180   'SUBLANG_ALSATIAN_FRANCE' : 0x01,
    181   'SUBLANG_AMHARIC_ETHIOPIA' : 0x01,
    182   'SUBLANG_ARABIC_SAUDI_ARABIA' : 0x01,
    183   'SUBLANG_ARABIC_IRAQ' : 0x02,
    184   'SUBLANG_ARABIC_EGYPT' : 0x03,
    185   'SUBLANG_ARABIC_LIBYA' : 0x04,
    186   'SUBLANG_ARABIC_ALGERIA' : 0x05,
    187   'SUBLANG_ARABIC_MOROCCO' : 0x06,
    188   'SUBLANG_ARABIC_TUNISIA' : 0x07,
    189   'SUBLANG_ARABIC_OMAN' : 0x08,
    190   'SUBLANG_ARABIC_YEMEN' : 0x09,
    191   'SUBLANG_ARABIC_SYRIA' : 0x0a,
    192   'SUBLANG_ARABIC_JORDAN' : 0x0b,
    193   'SUBLANG_ARABIC_LEBANON' : 0x0c,
    194   'SUBLANG_ARABIC_KUWAIT' : 0x0d,
    195   'SUBLANG_ARABIC_UAE' : 0x0e,
    196   'SUBLANG_ARABIC_BAHRAIN' : 0x0f,
    197   'SUBLANG_ARABIC_QATAR' : 0x10,
    198   'SUBLANG_ARMENIAN_ARMENIA' : 0x01,
    199   'SUBLANG_ASSAMESE_INDIA' : 0x01,
    200   'SUBLANG_AZERI_LATIN' : 0x01,
    201   'SUBLANG_AZERI_CYRILLIC' : 0x02,
    202   'SUBLANG_BASHKIR_RUSSIA' : 0x01,
    203   'SUBLANG_BASQUE_BASQUE' : 0x01,
    204   'SUBLANG_BELARUSIAN_BELARUS' : 0x01,
    205   'SUBLANG_BENGALI_INDIA' : 0x01,
    206   'SUBLANG_BENGALI_BANGLADESH' : 0x02,
    207   'SUBLANG_BOSNIAN_BOSNIA_HERZEGOVINA_LATIN' : 0x05,
    208   'SUBLANG_BOSNIAN_BOSNIA_HERZEGOVINA_CYRILLIC' : 0x08,
    209   'SUBLANG_BRETON_FRANCE' : 0x01,
    210   'SUBLANG_BULGARIAN_BULGARIA' : 0x01,
    211   'SUBLANG_CATALAN_CATALAN' : 0x01,
    212   'SUBLANG_CHINESE_TRADITIONAL' : 0x01,
    213   'SUBLANG_CHINESE_SIMPLIFIED' : 0x02,
    214   'SUBLANG_CHINESE_HONGKONG' : 0x03,
    215   'SUBLANG_CHINESE_SINGAPORE' : 0x04,
    216   'SUBLANG_CHINESE_MACAU' : 0x05,
    217   'SUBLANG_CORSICAN_FRANCE' : 0x01,
    218   'SUBLANG_CZECH_CZECH_REPUBLIC' : 0x01,
    219   'SUBLANG_CROATIAN_CROATIA' : 0x01,
    220   'SUBLANG_CROATIAN_BOSNIA_HERZEGOVINA_LATIN' : 0x04,
    221   'SUBLANG_DANISH_DENMARK' : 0x01,
    222   'SUBLANG_DARI_AFGHANISTAN' : 0x01,
    223   'SUBLANG_DIVEHI_MALDIVES' : 0x01,
    224   'SUBLANG_DUTCH' : 0x01,
    225   'SUBLANG_DUTCH_BELGIAN' : 0x02,
    226   'SUBLANG_ENGLISH_US' : 0x01,
    227   'SUBLANG_ENGLISH_UK' : 0x02,
    228   'SUBLANG_ENGLISH_AUS' : 0x03,
    229   'SUBLANG_ENGLISH_CAN' : 0x04,
    230   'SUBLANG_ENGLISH_NZ' : 0x05,
    231   'SUBLANG_ENGLISH_EIRE' : 0x06,
    232   'SUBLANG_ENGLISH_SOUTH_AFRICA' : 0x07,
    233   'SUBLANG_ENGLISH_JAMAICA' : 0x08,
    234   'SUBLANG_ENGLISH_CARIBBEAN' : 0x09,
    235   'SUBLANG_ENGLISH_BELIZE' : 0x0a,
    236   'SUBLANG_ENGLISH_TRINIDAD' : 0x0b,
    237   'SUBLANG_ENGLISH_ZIMBABWE' : 0x0c,
    238   'SUBLANG_ENGLISH_PHILIPPINES' : 0x0d,
    239   'SUBLANG_ENGLISH_INDIA' : 0x10,
    240   'SUBLANG_ENGLISH_MALAYSIA' : 0x11,
    241   'SUBLANG_ENGLISH_SINGAPORE' : 0x12,
    242   'SUBLANG_ESTONIAN_ESTONIA' : 0x01,
    243   'SUBLANG_FAEROESE_FAROE_ISLANDS' : 0x01,
    244   'SUBLANG_FILIPINO_PHILIPPINES' : 0x01,
    245   'SUBLANG_FINNISH_FINLAND' : 0x01,
    246   'SUBLANG_FRENCH' : 0x01,
    247   'SUBLANG_FRENCH_BELGIAN' : 0x02,
    248   'SUBLANG_FRENCH_CANADIAN' : 0x03,
    249   'SUBLANG_FRENCH_SWISS' : 0x04,
    250   'SUBLANG_FRENCH_LUXEMBOURG' : 0x05,
    251   'SUBLANG_FRENCH_MONACO' : 0x06,
    252   'SUBLANG_FRISIAN_NETHERLANDS' : 0x01,
    253   'SUBLANG_GALICIAN_GALICIAN' : 0x01,
    254   'SUBLANG_GEORGIAN_GEORGIA' : 0x01,
    255   'SUBLANG_GERMAN' : 0x01,
    256   'SUBLANG_GERMAN_SWISS' : 0x02,
    257   'SUBLANG_GERMAN_AUSTRIAN' : 0x03,
    258   'SUBLANG_GERMAN_LUXEMBOURG' : 0x04,
    259   'SUBLANG_GERMAN_LIECHTENSTEIN' : 0x05,
    260   'SUBLANG_GREEK_GREECE' : 0x01,
    261   'SUBLANG_GREENLANDIC_GREENLAND' : 0x01,
    262   'SUBLANG_GUJARATI_INDIA' : 0x01,
    263   'SUBLANG_HAUSA_NIGERIA_LATIN' : 0x01,
    264   'SUBLANG_HEBREW_ISRAEL' : 0x01,
    265   'SUBLANG_HINDI_INDIA' : 0x01,
    266   'SUBLANG_HUNGARIAN_HUNGARY' : 0x01,
    267   'SUBLANG_ICELANDIC_ICELAND' : 0x01,
    268   'SUBLANG_IGBO_NIGERIA' : 0x01,
    269   'SUBLANG_INDONESIAN_INDONESIA' : 0x01,
    270   'SUBLANG_INUKTITUT_CANADA' : 0x01,
    271   'SUBLANG_INUKTITUT_CANADA_LATIN' : 0x02,
    272   'SUBLANG_IRISH_IRELAND' : 0x02,
    273   'SUBLANG_ITALIAN' : 0x01,
    274   'SUBLANG_ITALIAN_SWISS' : 0x02,
    275   'SUBLANG_JAPANESE_JAPAN' : 0x01,
    276   'SUBLANG_KANNADA_INDIA' : 0x01,
    277   'SUBLANG_KASHMIRI_SASIA' : 0x02,
    278   'SUBLANG_KASHMIRI_INDIA' : 0x02,
    279   'SUBLANG_KAZAK_KAZAKHSTAN' : 0x01,
    280   'SUBLANG_KHMER_CAMBODIA' : 0x01,
    281   'SUBLANG_KICHE_GUATEMALA' : 0x01,
    282   'SUBLANG_KINYARWANDA_RWANDA' : 0x01,
    283   'SUBLANG_KONKANI_INDIA' : 0x01,
    284   'SUBLANG_KOREAN' : 0x01,
    285   'SUBLANG_KYRGYZ_KYRGYZSTAN' : 0x01,
    286   'SUBLANG_LAO_LAO' : 0x01,
    287   'SUBLANG_LATVIAN_LATVIA' : 0x01,
    288   'SUBLANG_LITHUANIAN' : 0x01,
    289   'SUBLANG_LOWER_SORBIAN_GERMANY' : 0x02,
    290   'SUBLANG_LUXEMBOURGISH_LUXEMBOURG' : 0x01,
    291   'SUBLANG_MACEDONIAN_MACEDONIA' : 0x01,
    292   'SUBLANG_MALAY_MALAYSIA' : 0x01,
    293   'SUBLANG_MALAY_BRUNEI_DARUSSALAM' : 0x02,
    294   'SUBLANG_MALAYALAM_INDIA' : 0x01,
    295   'SUBLANG_MALTESE_MALTA' : 0x01,
    296   'SUBLANG_MAORI_NEW_ZEALAND' : 0x01,
    297   'SUBLANG_MAPUDUNGUN_CHILE' : 0x01,
    298   'SUBLANG_MARATHI_INDIA' : 0x01,
    299   'SUBLANG_MOHAWK_MOHAWK' : 0x01,
    300   'SUBLANG_MONGOLIAN_CYRILLIC_MONGOLIA' : 0x01,
    301   'SUBLANG_MONGOLIAN_PRC' : 0x02,
    302   'SUBLANG_NEPALI_INDIA' : 0x02,
    303   'SUBLANG_NEPALI_NEPAL' : 0x01,
    304   'SUBLANG_NORWEGIAN_BOKMAL' : 0x01,
    305   'SUBLANG_NORWEGIAN_NYNORSK' : 0x02,
    306   'SUBLANG_OCCITAN_FRANCE' : 0x01,
    307   'SUBLANG_ORIYA_INDIA' : 0x01,
    308   'SUBLANG_PASHTO_AFGHANISTAN' : 0x01,
    309   'SUBLANG_PERSIAN_IRAN' : 0x01,
    310   'SUBLANG_POLISH_POLAND' : 0x01,
    311   'SUBLANG_PORTUGUESE' : 0x02,
    312   'SUBLANG_PORTUGUESE_BRAZILIAN' : 0x01,
    313   'SUBLANG_PUNJABI_INDIA' : 0x01,
    314   'SUBLANG_QUECHUA_BOLIVIA' : 0x01,
    315   'SUBLANG_QUECHUA_ECUADOR' : 0x02,
    316   'SUBLANG_QUECHUA_PERU' : 0x03,
    317   'SUBLANG_ROMANIAN_ROMANIA' : 0x01,
    318   'SUBLANG_ROMANSH_SWITZERLAND' : 0x01,
    319   'SUBLANG_RUSSIAN_RUSSIA' : 0x01,
    320   'SUBLANG_SAMI_NORTHERN_NORWAY' : 0x01,
    321   'SUBLANG_SAMI_NORTHERN_SWEDEN' : 0x02,
    322   'SUBLANG_SAMI_NORTHERN_FINLAND' : 0x03,
    323   'SUBLANG_SAMI_LULE_NORWAY' : 0x04,
    324   'SUBLANG_SAMI_LULE_SWEDEN' : 0x05,
    325   'SUBLANG_SAMI_SOUTHERN_NORWAY' : 0x06,
    326   'SUBLANG_SAMI_SOUTHERN_SWEDEN' : 0x07,
    327   'SUBLANG_SAMI_SKOLT_FINLAND' : 0x08,
    328   'SUBLANG_SAMI_INARI_FINLAND' : 0x09,
    329   'SUBLANG_SANSKRIT_INDIA' : 0x01,
    330   'SUBLANG_SCOTTISH_GAELIC' : 0x01,
    331   'SUBLANG_SERBIAN_BOSNIA_HERZEGOVINA_LATIN' : 0x06,
    332   'SUBLANG_SERBIAN_BOSNIA_HERZEGOVINA_CYRILLIC' : 0x07,
    333   'SUBLANG_SERBIAN_MONTENEGRO_LATIN' : 0x0b,
    334   'SUBLANG_SERBIAN_MONTENEGRO_CYRILLIC' : 0x0c,
    335   'SUBLANG_SERBIAN_SERBIA_LATIN' : 0x09,
    336   'SUBLANG_SERBIAN_SERBIA_CYRILLIC' : 0x0a,
    337   'SUBLANG_SERBIAN_CROATIA' : 0x01,
    338   'SUBLANG_SERBIAN_LATIN' : 0x02,
    339   'SUBLANG_SERBIAN_CYRILLIC' : 0x03,
    340   'SUBLANG_SINDHI_INDIA' : 0x01,
    341   'SUBLANG_SINDHI_PAKISTAN' : 0x02,
    342   'SUBLANG_SINDHI_AFGHANISTAN' : 0x02,
    343   'SUBLANG_SINHALESE_SRI_LANKA' : 0x01,
    344   'SUBLANG_SOTHO_NORTHERN_SOUTH_AFRICA' : 0x01,
    345   'SUBLANG_SLOVAK_SLOVAKIA' : 0x01,
    346   'SUBLANG_SLOVENIAN_SLOVENIA' : 0x01,
    347   'SUBLANG_SPANISH' : 0x01,
    348   'SUBLANG_SPANISH_MEXICAN' : 0x02,
    349   'SUBLANG_SPANISH_MODERN' : 0x03,
    350   'SUBLANG_SPANISH_GUATEMALA' : 0x04,
    351   'SUBLANG_SPANISH_COSTA_RICA' : 0x05,
    352   'SUBLANG_SPANISH_PANAMA' : 0x06,
    353   'SUBLANG_SPANISH_DOMINICAN_REPUBLIC' : 0x07,
    354   'SUBLANG_SPANISH_VENEZUELA' : 0x08,
    355   'SUBLANG_SPANISH_COLOMBIA' : 0x09,
    356   'SUBLANG_SPANISH_PERU' : 0x0a,
    357   'SUBLANG_SPANISH_ARGENTINA' : 0x0b,
    358   'SUBLANG_SPANISH_ECUADOR' : 0x0c,
    359   'SUBLANG_SPANISH_CHILE' : 0x0d,
    360   'SUBLANG_SPANISH_URUGUAY' : 0x0e,
    361   'SUBLANG_SPANISH_PARAGUAY' : 0x0f,
    362   'SUBLANG_SPANISH_BOLIVIA' : 0x10,
    363   'SUBLANG_SPANISH_EL_SALVADOR' : 0x11,
    364   'SUBLANG_SPANISH_HONDURAS' : 0x12,
    365   'SUBLANG_SPANISH_NICARAGUA' : 0x13,
    366   'SUBLANG_SPANISH_PUERTO_RICO' : 0x14,
    367   'SUBLANG_SPANISH_US' : 0x15,
    368   'SUBLANG_SWAHILI_KENYA' : 0x01,
    369   'SUBLANG_SWEDISH' : 0x01,
    370   'SUBLANG_SWEDISH_FINLAND' : 0x02,
    371   'SUBLANG_SYRIAC_SYRIA' : 0x01,
    372   'SUBLANG_TAJIK_TAJIKISTAN' : 0x01,
    373   'SUBLANG_TAMAZIGHT_ALGERIA_LATIN' : 0x02,
    374   'SUBLANG_TAMIL_INDIA' : 0x01,
    375   'SUBLANG_TATAR_RUSSIA' : 0x01,
    376   'SUBLANG_TELUGU_INDIA' : 0x01,
    377   'SUBLANG_THAI_THAILAND' : 0x01,
    378   'SUBLANG_TIBETAN_PRC' : 0x01,
    379   'SUBLANG_TIGRIGNA_ERITREA' : 0x02,
    380   'SUBLANG_TSWANA_SOUTH_AFRICA' : 0x01,
    381   'SUBLANG_TURKISH_TURKEY' : 0x01,
    382   'SUBLANG_TURKMEN_TURKMENISTAN' : 0x01,
    383   'SUBLANG_UIGHUR_PRC' : 0x01,
    384   'SUBLANG_UKRAINIAN_UKRAINE' : 0x01,
    385   'SUBLANG_UPPER_SORBIAN_GERMANY' : 0x01,
    386   'SUBLANG_URDU_PAKISTAN' : 0x01,
    387   'SUBLANG_URDU_INDIA' : 0x02,
    388   'SUBLANG_UZBEK_LATIN' : 0x01,
    389   'SUBLANG_UZBEK_CYRILLIC' : 0x02,
    390   'SUBLANG_VIETNAMESE_VIETNAM' : 0x01,
    391   'SUBLANG_WELSH_UNITED_KINGDOM' : 0x01,
    392   'SUBLANG_WOLOF_SENEGAL' : 0x01,
    393   'SUBLANG_XHOSA_SOUTH_AFRICA' : 0x01,
    394   'SUBLANG_YAKUT_RUSSIA' : 0x01,
    395   'SUBLANG_YI_PRC' : 0x01,
    396   'SUBLANG_YORUBA_NIGERIA' : 0x01,
    397   'SUBLANG_ZULU_SOUTH_AFRICA' : 0x01,
    398 }
    399 
    400 
    401 '''
    402 This dictionary defines the language lookup table. The key is the language ISO
    403 country code, and the value specifies the corresponding code page, primary
    404 language and sublanguage.
    405 
    406 LCID resource: http://msdn.microsoft.com/en-us/library/ms776294.aspx
    407 Codepage resource: http://www.science.co.il/language/locale-codes.asp
    408 Language ID resource: http://msdn.microsoft.com/en-us/library/ms776294.aspx
    409 
    410 There is no appropriate sublang for Spanish (Latin America) [es-419], so we
    411 use Mexico. SUBLANG_DEFAULT would incorrectly map to Spain. Unlike other
    412 Latin American countries, Mexican Spanish is supported by VERSIONINFO:
    413 http://msdn.microsoft.com/en-us/library/aa381058.aspx
    414 
    415 '''
    416 _LANGUAGE_MAP = {
    417   # Language neutral LCID, unicode(1200) code page.
    418   'neutral' : [ 1200, 'LANG_NEUTRAL', 'SUBLANG_NEUTRAL' ],
    419   # LANG_USER_DEFAULT LCID, unicode(1200) code page.
    420   'userdefault' : [ 1200, 'LANG_NEUTRAL', 'SUBLANG_DEFAULT' ],
    421   'fake-bidi' : [ 1255, 'LANG_HEBREW', 'SUBLANG_DEFAULT' ],
    422   'af' : [ 1252, 'LANG_AFRIKAANS', 'SUBLANG_DEFAULT' ],
    423   'am' : [ 1200, 'LANG_AMHARIC', 'SUBLANG_DEFAULT' ],
    424   'ar' : [ 1256, 'LANG_ARABIC', 'SUBLANG_DEFAULT' ],
    425   'bg' : [ 1251, 'LANG_BULGARIAN', 'SUBLANG_DEFAULT' ],
    426   'bn' : [ 1200, 'LANG_BENGALI', 'SUBLANG_DEFAULT' ],
    427   'ca' : [ 1252, 'LANG_CATALAN', 'SUBLANG_DEFAULT' ],
    428   'cs' : [ 1250, 'LANG_CZECH', 'SUBLANG_DEFAULT' ],
    429   'da' : [ 1252, 'LANG_DANISH', 'SUBLANG_DEFAULT' ],
    430   'de' : [ 1252, 'LANG_GERMAN', 'SUBLANG_GERMAN' ],
    431   'el' : [ 1253, 'LANG_GREEK', 'SUBLANG_DEFAULT' ],
    432   'en' : [ 1200, 'LANG_ENGLISH', 'SUBLANG_ENGLISH_US' ],
    433   'en-GB' : [ 1038, 'LANG_ENGLISH', 'SUBLANG_ENGLISH_UK' ],
    434   'es' : [ 1252, 'LANG_SPANISH', 'SUBLANG_SPANISH_MODERN' ],
    435   # LCID for Mexico; Windows does not support L.A. LCID.
    436   'es-419' : [ 1252, 'LANG_SPANISH', 'SUBLANG_SPANISH_MEXICAN' ],
    437   'et' : [ 1257, 'LANG_ESTONIAN', 'SUBLANG_DEFAULT' ],
    438   'eu' : [ 1252, 'LANG_BASQUE', 'SUBLANG_DEFAULT' ],
    439   'fa' : [ 1256, 'LANG_PERSIAN', 'SUBLANG_DEFAULT' ],
    440   'fi' : [ 1252, 'LANG_FINNISH', 'SUBLANG_DEFAULT' ],
    441   'fil' : [ 1252, 'LANG_FILIPINO', 'SUBLANG_DEFAULT' ],
    442   'fr' : [ 1252, 'LANG_FRENCH', 'SUBLANG_FRENCH' ],
    443   'fr-CA' : [ 1252, 'LANG_FRENCH', 'SUBLANG_FRENCH_CANADIAN' ],
    444   'gl' : [ 1252, 'LANG_GALICIAN', 'SUBLANG_DEFAULT' ],
    445   'gu' : [ 1200, 'LANG_GUJARATI', 'SUBLANG_DEFAULT' ],
    446   'he' : [ 1255, 'LANG_HEBREW', 'SUBLANG_DEFAULT' ],
    447   'hi' : [ 1200, 'LANG_HINDI', 'SUBLANG_DEFAULT' ],
    448   'hr' : [ 1252, 'LANG_CROATIAN', 'SUBLANG_DEFAULT' ],
    449   'hu' : [ 1250, 'LANG_HUNGARIAN', 'SUBLANG_DEFAULT' ],
    450   'id' : [ 1252, 'LANG_INDONESIAN', 'SUBLANG_DEFAULT' ],
    451   'is' : [ 1252, 'LANG_ICELANDIC', 'SUBLANG_DEFAULT' ],
    452   'it' : [ 1252, 'LANG_ITALIAN', 'SUBLANG_DEFAULT' ],
    453   'iw' : [ 1255, 'LANG_HEBREW', 'SUBLANG_DEFAULT' ],
    454   'ja' : [ 932, 'LANG_JAPANESE', 'SUBLANG_DEFAULT' ],
    455   'kn' : [ 1200, 'LANG_KANNADA', 'SUBLANG_DEFAULT' ],
    456   'ko' : [ 949, 'LANG_KOREAN', 'SUBLANG_KOREAN' ],
    457   'lt' : [ 1257, 'LANG_LITHUANIAN', 'SUBLANG_LITHUANIAN' ],
    458   'lv' : [ 1257, 'LANG_LATVIAN', 'SUBLANG_DEFAULT' ],
    459   'ml' : [ 1200, 'LANG_MALAYALAM', 'SUBLANG_DEFAULT' ],
    460   'mr' : [ 1200, 'LANG_MARATHI', 'SUBLANG_DEFAULT' ],
    461   # Malay (Malaysia) [ms-MY]
    462   'ms' : [ 1252, 'LANG_MALAY', 'SUBLANG_DEFAULT' ],
    463   'nb' : [ 1252, 'LANG_NORWEGIAN', 'SUBLANG_NORWEGIAN_BOKMAL' ],
    464   'ne' : [ 1200, 'LANG_NEPALI', 'SUBLANG_NEPALI_NEPAL' ],
    465   'nl' : [ 1252, 'LANG_DUTCH', 'SUBLANG_DEFAULT' ],
    466   'nn' : [ 1252, 'LANG_NORWEGIAN', 'SUBLANG_NORWEGIAN_NYNORSK' ],
    467   'no' : [ 1252, 'LANG_NORWEGIAN', 'SUBLANG_DEFAULT' ],
    468   'or' : [ 1200, 'LANG_ORIYA', 'SUBLANG_DEFAULT' ],
    469   'pa' : [ 1200, 'LANG_PUNJABI', 'SUBLANG_PUNJABI_INDIA' ],
    470   'pl' : [ 1250, 'LANG_POLISH', 'SUBLANG_DEFAULT' ],
    471   'pt-BR' : [ 1252, 'LANG_PORTUGUESE', 'SUBLANG_DEFAULT' ],
    472   'pt-PT' : [ 1252, 'LANG_PORTUGUESE', 'SUBLANG_PORTUGUESE' ],
    473   'ro' : [ 1250, 'LANG_ROMANIAN', 'SUBLANG_DEFAULT' ],
    474   'ru' : [ 1251, 'LANG_RUSSIAN', 'SUBLANG_DEFAULT' ],
    475   'sa' : [ 1200, 'LANG_SANSKRIT', 'SUBLANG_SANSKRIT_INDIA' ],
    476   'si' : [ 1200, 'LANG_SINHALESE', 'SUBLANG_SINHALESE_SRI_LANKA' ],
    477   'sk' : [ 1250, 'LANG_SLOVAK', 'SUBLANG_DEFAULT' ],
    478   'sl' : [ 1250, 'LANG_SLOVENIAN', 'SUBLANG_DEFAULT' ],
    479   'sr' : [ 1250, 'LANG_SERBIAN', 'SUBLANG_SERBIAN_LATIN' ],
    480   'sv' : [ 1252, 'LANG_SWEDISH', 'SUBLANG_SWEDISH' ],
    481   'sw' : [ 1252, 'LANG_SWAHILI', 'SUBLANG_DEFAULT' ],
    482   'ta' : [ 1200, 'LANG_TAMIL', 'SUBLANG_DEFAULT' ],
    483   'te' : [ 1200, 'LANG_TELUGU', 'SUBLANG_DEFAULT' ],
    484   'th' : [ 874, 'LANG_THAI', 'SUBLANG_DEFAULT' ],
    485   'ti' : [ 1200, 'LANG_TIGRIGNA', 'SUBLANG_TIGRIGNA_ERITREA' ],
    486   'tr' : [ 1254, 'LANG_TURKISH', 'SUBLANG_DEFAULT' ],
    487   'uk' : [ 1251, 'LANG_UKRAINIAN', 'SUBLANG_DEFAULT' ],
    488   'ur' : [ 1200, 'LANG_URDU', 'SUBLANG_DEFAULT' ],
    489   'vi' : [ 1258, 'LANG_VIETNAMESE', 'SUBLANG_DEFAULT' ],
    490   'zh-CN' : [ 936, 'LANG_CHINESE', 'SUBLANG_CHINESE_SIMPLIFIED' ],
    491   'zh-HK' : [ 950, 'LANG_CHINESE', 'SUBLANG_CHINESE_HONGKONG' ],
    492   'zh-TW' : [ 950, 'LANG_CHINESE', 'SUBLANG_CHINESE_TRADITIONAL' ],
    493   'zu' : [ 1200, 'LANG_ZULU', 'SUBLANG_DEFAULT' ],
    494 }
    495 
    496 
    497 # Right-To-Left languages
    498 _RTL_LANGUAGES = (
    499   'ar',  # Arabic
    500   'fa',  # Farsi
    501   'iw',  # Hebrew
    502   'ks',  # Kashmiri
    503   'ku',  # Kurdish
    504   'ps',  # Pashto
    505   'ur',  # Urdu
    506   'yi',  # Yiddish
    507 )
    508 
    509 
    510 def GetCodepage(language):
    511   """ Returns the codepage for the given |language|. """
    512   lang = _LANGUAGE_MAP[language]
    513   return "%04x" % lang[0]
    514 
    515 
    516 def GetCodepageDecimal(language):
    517   """ Returns the codepage for the given |language| as a decimal value. """
    518   lang = _LANGUAGE_MAP[language]
    519   return "%d" % lang[0]
    520 
    521 
    522 def GetLangId(language):
    523   """ Returns the language id for the given |language|. """
    524   lang = _LANGUAGE_MAP[language]
    525   return "%04x" % (_LANGUAGE_PRIMARY[lang[1]] | (_LANGUAGE_SUB[lang[2]] << 10))
    526 
    527 
    528 def GetPrimaryLanguage(language):
    529   """ Returns the primary language ID for the given |language|. """
    530   lang = _LANGUAGE_MAP[language]
    531   return _LANGUAGE_PRIMARY[lang[1]]
    532 
    533 
    534 def GetSublanguage(language):
    535   """ Returns the sublanguage ID for the given |language|. """
    536   lang = _LANGUAGE_MAP[language]
    537   return _LANGUAGE_SUB[lang[2]]
    538 
    539 
    540 def IsRtlLanguage(language):
    541   return language in _RTL_LANGUAGES;
    542 
    543 
    544 def NormalizeLanguageCode(language):
    545   lang = language.replace('_', '-', 1)
    546   if lang == 'en-US':
    547     lang = 'en'
    548   return lang
    549 
    550 
    551 def GetDataPackageSuffix(language):
    552   lang = NormalizeLanguageCode(language)
    553   if lang == 'en':
    554     lang = 'en-US'
    555   return lang
    556 
    557 
    558 def GetJsonSuffix(language):
    559   return language.replace('-', '_', 1)
    560 
    561 
    562 def ReadValuesFromFile(values_dict, file_name):
    563   """
    564   Reads NAME=VALUE settings from the specified file.
    565 
    566   Everything to the left of the first '=' is the keyword,
    567   everything to the right is the value.  No stripping of
    568   white space, so beware.
    569 
    570   The file must exist, otherwise you get the Python exception from open().
    571   """
    572   for line in open(file_name, 'r').readlines():
    573     key, val = line.rstrip('\r\n').split('=', 1)
    574     values_dict[key] = val
    575 
    576 
    577 def ReadMessagesFromFile(file_name):
    578   """
    579   Reads messages from a 'chrome_messages_json' file.
    580 
    581   The file must exist, otherwise you get the Python exception from open().
    582   """
    583   messages_file = io.open(file_name, encoding='utf-8-sig')
    584   messages = json.load(messages_file)
    585   messages_file.close()
    586 
    587   values = {}
    588   for key in messages.keys():
    589     values[key] = unicode(messages[key]['message']);
    590   return values
    591 
    592 
    593 def WriteIfChanged(file_name, contents, encoding):
    594   """
    595   Writes the specified contents to the specified file_name
    596   iff the contents are different than the current contents.
    597   """
    598   try:
    599     target = io.open(file_name, 'r')
    600     old_contents = target.read()
    601   except EnvironmentError:
    602     pass
    603   except UnicodeDecodeError:
    604     target.close()
    605     os.unlink(file_name)
    606   else:
    607     if contents == old_contents:
    608       return
    609     target.close()
    610     os.unlink(file_name)
    611   io.open(file_name, 'w', encoding=encoding).write(contents)
    612 
    613 
    614 class MessageMap:
    615   """ Provides a dictionary of localized messages for each language."""
    616   def __init__(self, languages, locale_dir):
    617     self.language = None
    618     self.message_map = {}
    619 
    620     # Populate the message map
    621     if locale_dir:
    622       for language in languages:
    623         file_name = os.path.join(locale_dir,
    624                                  GetJsonSuffix(language),
    625                                  'messages.json')
    626         self.message_map[language] = ReadMessagesFromFile(file_name)
    627 
    628   def GetText(self, message):
    629     """ Returns a localized message for the current language. """
    630     return self.message_map[self.language][message]
    631 
    632   def SelectLanguage(self, language):
    633     """ Selects the language to be used when retrieving localized messages. """
    634     self.language = language
    635 
    636   def MakeSelectLanguage(self):
    637     """ Returns a function that can be used to select the current language. """
    638     return lambda language: self.SelectLanguage(language)
    639 
    640   def MakeGetText(self):
    641     """ Returns a function that can be used to retrieve a localized message. """
    642     return lambda message: self.GetText(message)
    643 
    644 
    645 # Use '@' as a delimiter for string templates instead of '$' to avoid unintended
    646 # expansion when passing the string from GYP.
    647 class GypTemplate(Template):
    648     delimiter = '@'
    649 
    650 
    651 def Localize(source, locales, options):
    652   # Set the list of languages to use.
    653   languages = map(NormalizeLanguageCode, locales)
    654   context = { 'languages' : languages }
    655 
    656   # Load the localized messages.
    657   message_map = MessageMap(languages, options.locale_dir)
    658 
    659   # Add OFFICIAL_BUILD variable the same way build/util/version.py
    660   # does.
    661   if os.environ.get('CHROME_BUILD_TYPE') == '_official':
    662     context['official_build'] = '1'
    663   else:
    664     context['official_build'] = '0'
    665 
    666   # Add all variables defined in the command line.
    667   if options.define:
    668     for define in options.define:
    669       context.update(dict([define.split('=', 1)]));
    670 
    671   # Read NAME=VALUE variables from file.
    672   if options.variables:
    673     for file_name in options.variables:
    674       ReadValuesFromFile(context, file_name)
    675 
    676   env = None
    677   template = None
    678 
    679   if source:
    680     # Load jinja2 library.
    681     if options.jinja2:
    682       jinja2_path = os.path.normpath(options.jinja2)
    683     else:
    684       jinja2_path = os.path.normpath(
    685           os.path.join(os.path.abspath(__file__),
    686                        '../../../../third_party/jinja2'))
    687     sys.path.append(os.path.split(jinja2_path)[0])
    688     from jinja2 import Environment, FileSystemLoader
    689 
    690     # Create jinja2 environment.
    691     (template_path, template_name) = os.path.split(source)
    692     env = Environment(loader=FileSystemLoader(template_path),
    693                       extensions=['jinja2.ext.do', 'jinja2.ext.i18n'])
    694 
    695     # Register custom filters.
    696     env.filters['GetCodepage'] = GetCodepage
    697     env.filters['GetCodepageDecimal'] = GetCodepageDecimal
    698     env.filters['GetLangId'] = GetLangId
    699     env.filters['GetPrimaryLanguage'] = GetPrimaryLanguage
    700     env.filters['GetSublanguage'] = GetSublanguage
    701 
    702     # Register the message map with jinja2.i18n extension.
    703     env.globals['IsRtlLanguage'] = IsRtlLanguage
    704     env.globals['SelectLanguage'] = message_map.MakeSelectLanguage()
    705     env.install_gettext_callables(message_map.MakeGetText(),
    706                                   message_map.MakeGetText());
    707 
    708     template = env.get_template(template_name)
    709 
    710   # Generate a separate file per each locale if requested.
    711   outputs = []
    712   if options.locale_output:
    713     target = GypTemplate(options.locale_output)
    714     for lang in languages:
    715       context['languages'] = [ lang ]
    716       context['language'] = lang
    717       context['pak_suffix'] = GetDataPackageSuffix(lang)
    718       context['json_suffix'] = GetJsonSuffix(lang)
    719       message_map.SelectLanguage(lang)
    720 
    721       template_file_name = target.safe_substitute(context)
    722       outputs.append(template_file_name)
    723       if not options.print_only:
    724         WriteIfChanged(template_file_name, template.render(context),
    725                        options.encoding)
    726   else:
    727     outputs.append(options.output)
    728     if not options.print_only:
    729       WriteIfChanged(options.output, template.render(context), options.encoding)
    730 
    731   if options.print_only:
    732     # Quote each element so filename spaces don't mess up gyp's attempt to parse
    733     # it into a list.
    734     return " ".join(['"%s"' % x for x in outputs])
    735 
    736   return
    737 
    738 
    739 def DoMain(argv):
    740   usage = "Usage: localize [options] locales"
    741   parser = OptionParser(usage=usage)
    742   parser.add_option(
    743       '-d', '--define', dest='define', action='append', type='string',
    744       help='define a variable (NAME=VALUE).')
    745   parser.add_option(
    746       '--encoding', dest='encoding', type='string', default='utf-8',
    747       help="set the encoding of <output>. 'utf-8' is the default.")
    748   parser.add_option(
    749       '--jinja2', dest='jinja2', type='string',
    750       help="specifies path to the jinja2 library.")
    751   parser.add_option(
    752       '--locale_dir', dest='locale_dir', type='string',
    753       help="set path to localized message files.")
    754   parser.add_option(
    755       '--locale_output', dest='locale_output',  type='string',
    756       help='specify the per-locale output file name.')
    757   parser.add_option(
    758       '-o', '--output', dest='output', type='string',
    759       help="specify the output file name.")
    760   parser.add_option(
    761       '--print_only', dest='print_only', action='store_true',
    762       default=False, help='print the output file names only.')
    763   parser.add_option(
    764       '-t', '--template', dest='template', type='string',
    765       help="specify the template file name.")
    766   parser.add_option(
    767       '--variables', dest='variables', action='append', type='string',
    768       help='read variables (NAME=VALUE) from file.')
    769 
    770   options, locales = parser.parse_args(argv)
    771   if not locales:
    772     parser.error('At least one locale must be specified')
    773   if bool(options.output) == bool(options.locale_output):
    774     parser.error(
    775         'Either --output or --locale_output must be specified but not both')
    776   if not options.template and not options.print_only:
    777     parser.error('The template name is required unless --print_only is used')
    778 
    779   return Localize(options.template, locales, options)
    780 
    781 if __name__ == '__main__':
    782   sys.exit(DoMain(sys.argv[1:]))
    783 
    784