babel/old/mirror: scripts/import

comparison scripts/import_cldr.py @ 28:695884591af6

* Reduce size of locale data pickles by only storing the data provided by each locale itself, and merging inherited data at runtime. * Move locale data loading from `babel.core` into a separate `babel.localedata` module. * Add currency names and symbols to locale data.

author	cmlenz
date	Sun, 03 Jun 2007 15:27:27 +0000
parents	6c2c9fc7d787
children	9a00ac84004c

comparison

equal deleted inserted replaced

-:8d4cd0856f69
+:695884591af6
 any
 except NameError:
 def any(iterable):
 return filter(None, list(iterable))
-def _parent(locale):
-parts = locale.split('_')
-if len(parts) == 1:
-return 'root'
-else:
-return '_'.join(parts[:-1])
 def _text(elem):
 buf = [elem.text or '']
 for child in elem:
 buf.append(_text(child))
 buf.append(elem.tail or '')
 # build a territory containment mapping for inheritance
 regions = {}
 for elem in sup.findall('//territoryContainment/group'):
 regions[elem.attrib['type']] = elem.attrib['contains'].split()
-from pprint import pprint
 # Resolve territory containment
 territory_containment = {}
 region_items = regions.items()
 region_items.sort()
 print>>sys.stderr, 'Processing input file %r' % filename
 stem, ext = os.path.splitext(filename)
 if ext != '.xml':
 continue
+tree = parse(os.path.join(srcdir, 'main', filename))
 data = {}
-if stem != 'root':
-data.update(copy.deepcopy(dicts[_parent(stem)]))
-tree = parse(os.path.join(srcdir, 'main', filename))
 language = None
 elem = tree.find('//identity/language')
 if elem is not None:
 language = elem.attrib['type']
 continue
 try:
 date_formats[elem.attrib.get('type')] = \
 dates.parse_pattern(unicode(elem.findtext('dateFormat/pattern')))
 except ValueError, e:
-print e
+print>>sys.stderr, 'ERROR: %s' % e
 time_formats = data.setdefault('time_formats', {})
 for elem in calendar.findall('timeFormats/timeFormatLength'):
 if 'draft' in elem.attrib and elem.attrib.get('type') in time_formats:
 continue
 try:
 time_formats[elem.attrib.get('type')] = \
 dates.parse_pattern(unicode(elem.findtext('timeFormat/pattern')))
 except ValueError, e:
-print e
+print>>sys.stderr, 'ERROR: %s' % e
 # <numbers>
 number_symbols = data.setdefault('number_symbols', {})
 for elem in tree.findall('//numbers/symbols/*'):
 decimal_formats = data.setdefault('decimal_formats', {})
 for elem in tree.findall('//decimalFormats/decimalFormatLength'):
 if 'draft' in elem.attrib and elem.attrib.get('type') in decimal_formats:
 continue
-decimal_formats[elem.attrib.get('type')] = numbers.parse_pattern(unicode(elem.findtext('decimalFormat/pattern')))
+pattern = unicode(elem.findtext('decimalFormat/pattern'))
+decimal_formats[elem.attrib.get('type')] = numbers.parse_pattern(pattern)
 scientific_formats = data.setdefault('scientific_formats', {})
 for elem in tree.findall('//scientificFormats/scientificFormatLength'):
 if 'draft' in elem.attrib and elem.attrib.get('type') in scientific_formats:
 continue
+# FIXME: should use numbers.parse_pattern
 scientific_formats[elem.attrib.get('type')] = unicode(elem.findtext('scientificFormat/pattern'))
 currency_formats = data.setdefault('currency_formats', {})
 for elem in tree.findall('//currencyFormats/currencyFormatLength'):
 if 'draft' in elem.attrib and elem.attrib.get('type') in currency_formats:
 continue
+# FIXME: should use numbers.parse_pattern
 currency_formats[elem.attrib.get('type')] = unicode(elem.findtext('currencyFormat/pattern'))
 percent_formats = data.setdefault('percent_formats', {})
 for elem in tree.findall('//percentFormats/percentFormatLength'):
 if 'draft' in elem.attrib and elem.attrib.get('type') in percent_formats:
 continue
-percent_formats[elem.attrib.get('type')] = numbers.parse_pattern(unicode(elem.findtext('percentFormat/pattern')))
+pattern = unicode(elem.findtext('percentFormat/pattern'))
+percent_formats[elem.attrib.get('type')] = numbers.parse_pattern(pattern)
-currencies = data.setdefault('currencies', {})
+currency_names = data.setdefault('currency_names', {})
+currency_symbols = data.setdefault('currency_symbols', {})
 for elem in tree.findall('//currencies/currency'):
-currencies[elem.attrib['type']] = {
+name = elem.findtext('displayName')
-'display_name': unicode(elem.findtext('displayName')),
+if name:
-'symbol': unicode(elem.findtext('symbol'))
+currency_names[elem.attrib['type']] = unicode(name)
-}
+symbol = elem.findtext('symbol')
+if symbol:
+currency_symbols[elem.attrib['type']] = unicode(symbol)
 dicts[stem] = data
 outfile = open(os.path.join(destdir, stem + '.dat'), 'wb')
 try:
 pickle.dump(data, outfile, 2)

Mercurial > babel > old > mirror

comparison scripts/import_cldr.py @ 28:695884591af6