#!/usr/bin/env python3 """ Convert the X11 locale.alias file into a mapping dictionary suitable for locale.py. Written by Marc-Andre Lemburg , 2004-12-10. """ import locale import sys _locale = locale # Location of the X11 alias file. LOCALE_ALIAS = '/usr/share/X11/locale/locale.alias' # Location of the glibc SUPPORTED locales file. SUPPORTED = '/usr/share/i18n/SUPPORTED' def parse(filename): with open(filename, encoding='latin1') as f: lines = list(f) # Remove mojibake in /usr/share/X11/locale/locale.alias. # b'\xef\xbf\xbd' == '\ufffd'.encode('utf-8') lines = [line for line in lines if '\xef\xbf\xbd' not in line] data = {} for line in lines: line = line.strip() if not line: continue if line[:1] == '#': continue locale, alias = line.split() # Fix non-standard locale names, e.g. ks_IN@devanagari.UTF-8 if '@' in alias: alias_lang, _, alias_mod = alias.partition('@') if '.' in alias_mod: alias_mod, _, alias_enc = alias_mod.partition('.') alias = alias_lang + '.' + alias_enc + '@' + alias_mod # Strip ':' if locale[-1] == ':': locale = locale[:-1] # Lower-case locale locale = locale.lower() # Ignore one letter locale mappings (except for 'c') if len(locale) == 1 and locale != 'c': continue # Normalize encoding, if given if '.' in locale: lang, encoding = locale.split('.')[:2] encoding = encoding.replace('-', '') encoding = encoding.replace('_', '') locale = lang + '.' + encoding data[locale] = alias return data def parse_glibc_supported(filename): with open(filename, encoding='latin1') as f: lines = list(f) data = {} for line in lines: line = line.strip() if not line: continue if line[:1] == '#': continue line = line.replace('/', ' ').strip() line = line.rstrip('\\').rstrip() words = line.split() if len(words) != 2: continue alias, alias_encoding = words # Lower-case locale locale = alias.lower() # Normalize encoding, if given if '.' in locale: lang, encoding = locale.split('.')[:2] encoding = encoding.replace('-', '') encoding = encoding.replace('_', '') locale = lang + '.' + encoding # Add an encoding to alias alias, _, modifier = alias.partition('@') alias = _locale._replace_encoding(alias, alias_encoding) if modifier and not (modifier == 'euro' and alias_encoding == 'ISO-8859-15'): alias += '@' + modifier data[locale] = alias return data def pprint(data): items = sorted(data.items()) for k, v in items: print(' %-40s%a,' % ('%a:' % k, v)) def print_differences(data, olddata): items = sorted(olddata.items()) for k, v in items: if k not in data: print('# removed %a' % k) elif olddata[k] != data[k]: print('# updated %a -> %a to %a' % \ (k, olddata[k], data[k])) # Additions are not mentioned def optimize(data): locale_alias = locale.locale_alias locale.locale_alias = data.copy() for k, v in data.items(): del locale.locale_alias[k] if locale.normalize(k) != v: locale.locale_alias[k] = v newdata = locale.locale_alias errors = check(data) locale.locale_alias = locale_alias if errors: sys.exit(1) return newdata def check(data): # Check that all alias definitions from the X11 file # are actually mapped to the correct alias locales. errors = 0 for k, v in data.items(): if locale.normalize(k) != v: print('ERROR: %a -> %a != %a' % (k, locale.normalize(k), v), file=sys.stderr) errors += 1 return errors if __name__ == '__main__': import argparse parser = argparse.ArgumentParser() parser.add_argument('--locale-alias', default=LOCALE_ALIAS, help='location of the X11 alias file ' '(default: %a)' % LOCALE_ALIAS) parser.add_argument('--glibc-supported', default=SUPPORTED, help='location of the glibc SUPPORTED locales file ' '(default: %a)' % SUPPORTED) args = parser.parse_args() data = locale.locale_alias.copy() data.update(parse_glibc_supported(args.glibc_supported)) data.update(parse(args.locale_alias)) while True: # Repeat optimization while the size is decreased. n = len(data) data = optimize(data) if len(data) == n: break print_differences(data, locale.locale_alias) print() print('locale_alias = {') pprint(data) print('}')