annotate 0.8.x/scripts/import_cldr.py @ 557:3c590f6f5dfa stable tip

Merged revisions 607 via svnmerge from http://svn.edgewall.org/repos/babel/trunk ........ r607 | pjenvey | 2011-04-24 21:41:23 -0700 (Sun, 24 Apr 2011) | 3 lines keywords only support space separated values, not comma separated thanks agronholm ........
author pjenvey
date Mon, 25 Apr 2011 04:44:13 +0000
parents 4a7af44e6695
children
rev   line source
142
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
1 #!/usr/bin/env python
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
2 # -*- coding: utf-8 -*-
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
3 #
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
4 # Copyright (C) 2007 Edgewall Software
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
5 # All rights reserved.
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
6 #
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
7 # This software is licensed as described in the file COPYING, which
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
8 # you should have received as part of this distribution. The terms
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
9 # are also available at http://babel.edgewall.org/wiki/License.
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
10 #
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
11 # This software consists of voluntary contributions made by many
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
12 # individuals. For the exact contribution history, see the revision
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
13 # history and logs, available at http://babel.edgewall.org/log/.
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
14
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
15 import copy
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
16 from optparse import OptionParser
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
17 import os
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
18 import pickle
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
19 import sys
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
20 try:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
21 from xml.etree.ElementTree import parse
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
22 except ImportError:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
23 from elementtree.ElementTree import parse
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
24
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
25 # Make sure we're using Babel source, and not some previously installed version
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
26 sys.path.insert(0, os.path.join(os.path.dirname(sys.argv[0]), '..'))
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
27
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
28 from babel import dates, numbers
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
29
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
30 weekdays = {'mon': 0, 'tue': 1, 'wed': 2, 'thu': 3, 'fri': 4, 'sat': 5,
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
31 'sun': 6}
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
32
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
33 try:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
34 any
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
35 except NameError:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
36 def any(iterable):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
37 return filter(None, list(iterable))
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
38
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
39 def _text(elem):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
40 buf = [elem.text or '']
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
41 for child in elem:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
42 buf.append(_text(child))
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
43 buf.append(elem.tail or '')
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
44 return u''.join(filter(None, buf)).strip()
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
45
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
46 def main():
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
47 parser = OptionParser(usage='%prog path/to/cldr')
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
48 options, args = parser.parse_args()
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
49 if len(args) != 1:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
50 parser.error('incorrect number of arguments')
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
51
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
52 srcdir = args[0]
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
53 destdir = os.path.join(os.path.dirname(os.path.abspath(sys.argv[0])),
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
54 '..', 'babel', 'localedata')
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
55
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
56 sup = parse(os.path.join(srcdir, 'supplemental', 'supplementalData.xml'))
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
57
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
58 # build a territory containment mapping for inheritance
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
59 regions = {}
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
60 for elem in sup.findall('//territoryContainment/group'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
61 regions[elem.attrib['type']] = elem.attrib['contains'].split()
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
62
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
63 # Resolve territory containment
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
64 territory_containment = {}
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
65 region_items = regions.items()
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
66 region_items.sort()
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
67 for group, territory_list in region_items:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
68 for territory in territory_list:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
69 containers = territory_containment.setdefault(territory, set([]))
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
70 if group in territory_containment:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
71 containers |= territory_containment[group]
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
72 containers.add(group)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
73
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
74 filenames = os.listdir(os.path.join(srcdir, 'main'))
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
75 filenames.remove('root.xml')
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
76 filenames.sort(lambda a,b: len(a)-len(b))
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
77 filenames.insert(0, 'root.xml')
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
78
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
79 dicts = {}
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
80
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
81 for filename in filenames:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
82 print>>sys.stderr, 'Processing input file %r' % filename
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
83 stem, ext = os.path.splitext(filename)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
84 if ext != '.xml':
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
85 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
86
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
87 tree = parse(os.path.join(srcdir, 'main', filename))
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
88 data = {}
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
89
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
90 language = None
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
91 elem = tree.find('//identity/language')
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
92 if elem is not None:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
93 language = elem.attrib['type']
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
94 print>>sys.stderr, ' Language: %r' % language
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
95
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
96 territory = None
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
97 elem = tree.find('//identity/territory')
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
98 if elem is not None:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
99 territory = elem.attrib['type']
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
100 else:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
101 territory = '001' # world
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
102 print>>sys.stderr, ' Territory: %r' % territory
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
103 regions = territory_containment.get(territory, [])
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
104 print>>sys.stderr, ' Regions: %r' % regions
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
105
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
106 # <localeDisplayNames>
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
107
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
108 territories = data.setdefault('territories', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
109 for elem in tree.findall('//territories/territory'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
110 if 'draft' in elem.attrib and elem.attrib['type'] in territories:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
111 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
112 territories[elem.attrib['type']] = _text(elem)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
113
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
114 languages = data.setdefault('languages', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
115 for elem in tree.findall('//languages/language'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
116 if 'draft' in elem.attrib and elem.attrib['type'] in languages:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
117 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
118 languages[elem.attrib['type']] = _text(elem)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
119
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
120 variants = data.setdefault('variants', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
121 for elem in tree.findall('//variants/variant'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
122 if 'draft' in elem.attrib and elem.attrib['type'] in variants:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
123 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
124 variants[elem.attrib['type']] = _text(elem)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
125
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
126 scripts = data.setdefault('scripts', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
127 for elem in tree.findall('//scripts/script'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
128 if 'draft' in elem.attrib and elem.attrib['type'] in scripts:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
129 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
130 scripts[elem.attrib['type']] = _text(elem)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
131
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
132 # <dates>
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
133
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
134 week_data = data.setdefault('week_data', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
135 supelem = sup.find('//weekData')
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
136
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
137 for elem in supelem.findall('minDays'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
138 territories = elem.attrib['territories'].split()
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
139 if territory in territories or any([r in territories for r in regions]):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
140 week_data['min_days'] = int(elem.attrib['count'])
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
141
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
142 for elem in supelem.findall('firstDay'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
143 territories = elem.attrib['territories'].split()
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
144 if territory in territories or any([r in territories for r in regions]):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
145 week_data['first_day'] = weekdays[elem.attrib['day']]
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
146
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
147 for elem in supelem.findall('weekendStart'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
148 territories = elem.attrib['territories'].split()
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
149 if territory in territories or any([r in territories for r in regions]):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
150 week_data['weekend_start'] = weekdays[elem.attrib['day']]
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
151
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
152 for elem in supelem.findall('weekendEnd'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
153 territories = elem.attrib['territories'].split()
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
154 if territory in territories or any([r in territories for r in regions]):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
155 week_data['weekend_end'] = weekdays[elem.attrib['day']]
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
156
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
157 time_zones = data.setdefault('time_zones', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
158 for elem in tree.findall('//timeZoneNames/zone'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
159 info = {}
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
160 city = elem.findtext('exemplarCity')
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
161 if city:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
162 info['city'] = unicode(city)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
163 for child in elem.findall('long/*'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
164 info.setdefault('long', {})[child.tag] = unicode(child.text)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
165 for child in elem.findall('short/*'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
166 info.setdefault('short', {})[child.tag] = unicode(child.text)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
167 time_zones[elem.attrib['type']] = info
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
168
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
169 zone_aliases = data.setdefault('zone_aliases', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
170 if stem == 'root':
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
171 for elem in sup.findall('//timezoneData/zoneFormatting/zoneItem'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
172 if 'aliases' in elem.attrib:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
173 canonical_id = elem.attrib['type']
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
174 for alias in elem.attrib['aliases'].split():
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
175 zone_aliases[alias] = canonical_id
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
176
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
177 for calendar in tree.findall('//calendars/calendar'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
178 if calendar.attrib['type'] != 'gregorian':
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
179 # TODO: support other calendar types
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
180 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
181
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
182 months = data.setdefault('months', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
183 for ctxt in calendar.findall('months/monthContext'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
184 ctxts = months.setdefault(ctxt.attrib['type'], {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
185 for width in ctxt.findall('monthWidth'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
186 widths = ctxts.setdefault(width.attrib['type'], {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
187 for elem in width.findall('month'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
188 if 'draft' in elem.attrib and int(elem.attrib['type']) in widths:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
189 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
190 widths[int(elem.attrib.get('type'))] = unicode(elem.text)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
191
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
192 days = data.setdefault('days', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
193 for ctxt in calendar.findall('days/dayContext'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
194 ctxts = days.setdefault(ctxt.attrib['type'], {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
195 for width in ctxt.findall('dayWidth'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
196 widths = ctxts.setdefault(width.attrib['type'], {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
197 for elem in width.findall('day'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
198 dtype = weekdays[elem.attrib['type']]
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
199 if 'draft' in elem.attrib and dtype in widths:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
200 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
201 widths[dtype] = unicode(elem.text)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
202
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
203 quarters = data.setdefault('quarters', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
204 for ctxt in calendar.findall('quarters/quarterContext'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
205 ctxts = quarters.setdefault(ctxt.attrib['type'], {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
206 for width in ctxt.findall('quarterWidth'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
207 widths = ctxts.setdefault(width.attrib['type'], {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
208 for elem in width.findall('quarter'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
209 if 'draft' in elem.attrib and int(elem.attrib['type']) in widths:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
210 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
211 widths[int(elem.attrib.get('type'))] = unicode(elem.text)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
212
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
213 eras = data.setdefault('eras', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
214 for width in calendar.findall('eras/*'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
215 ewidth = {'eraNames': 'wide', 'eraAbbr': 'abbreviated'}[width.tag]
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
216 widths = eras.setdefault(ewidth, {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
217 for elem in width.findall('era'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
218 if 'draft' in elem.attrib and int(elem.attrib['type']) in widths:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
219 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
220 widths[int(elem.attrib.get('type'))] = unicode(elem.text)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
221
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
222 # AM/PM
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
223 periods = data.setdefault('periods', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
224 for elem in calendar.findall('am'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
225 if 'draft' in elem.attrib and elem.tag in periods:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
226 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
227 periods[elem.tag] = unicode(elem.text)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
228 for elem in calendar.findall('pm'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
229 if 'draft' in elem.attrib and elem.tag in periods:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
230 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
231 periods[elem.tag] = unicode(elem.text)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
232
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
233 date_formats = data.setdefault('date_formats', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
234 for elem in calendar.findall('dateFormats/dateFormatLength'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
235 if 'draft' in elem.attrib and elem.attrib.get('type') in date_formats:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
236 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
237 try:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
238 date_formats[elem.attrib.get('type')] = \
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
239 dates.parse_pattern(unicode(elem.findtext('dateFormat/pattern')))
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
240 except ValueError, e:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
241 print>>sys.stderr, 'ERROR: %s' % e
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
242
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
243 time_formats = data.setdefault('time_formats', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
244 for elem in calendar.findall('timeFormats/timeFormatLength'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
245 if 'draft' in elem.attrib and elem.attrib.get('type') in time_formats:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
246 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
247 try:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
248 time_formats[elem.attrib.get('type')] = \
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
249 dates.parse_pattern(unicode(elem.findtext('timeFormat/pattern')))
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
250 except ValueError, e:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
251 print>>sys.stderr, 'ERROR: %s' % e
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
252
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
253 datetime_formats = data.setdefault('datetime_formats', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
254 for elem in calendar.findall('dateTimeFormats/dateTimeFormatLength'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
255 if 'draft' in elem.attrib and elem.attrib.get('type') in datetime_formats:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
256 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
257 try:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
258 datetime_formats[elem.attrib.get('type')] = \
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
259 unicode(elem.findtext('dateTimeFormat/pattern'))
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
260 except ValueError, e:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
261 print>>sys.stderr, 'ERROR: %s' % e
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
262
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
263 # <numbers>
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
264
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
265 number_symbols = data.setdefault('number_symbols', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
266 for elem in tree.findall('//numbers/symbols/*'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
267 number_symbols[elem.tag] = unicode(elem.text)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
268
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
269 decimal_formats = data.setdefault('decimal_formats', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
270 for elem in tree.findall('//decimalFormats/decimalFormatLength'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
271 if 'draft' in elem.attrib and elem.attrib.get('type') in decimal_formats:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
272 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
273 pattern = unicode(elem.findtext('decimalFormat/pattern'))
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
274 decimal_formats[elem.attrib.get('type')] = numbers.parse_pattern(pattern)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
275
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
276 scientific_formats = data.setdefault('scientific_formats', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
277 for elem in tree.findall('//scientificFormats/scientificFormatLength'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
278 if 'draft' in elem.attrib and elem.attrib.get('type') in scientific_formats:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
279 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
280 pattern = unicode(elem.findtext('scientificFormat/pattern'))
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
281 scientific_formats[elem.attrib.get('type')] = numbers.parse_pattern(pattern)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
282
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
283 currency_formats = data.setdefault('currency_formats', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
284 for elem in tree.findall('//currencyFormats/currencyFormatLength'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
285 if 'draft' in elem.attrib and elem.attrib.get('type') in currency_formats:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
286 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
287 pattern = unicode(elem.findtext('currencyFormat/pattern'))
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
288 currency_formats[elem.attrib.get('type')] = numbers.parse_pattern(pattern)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
289
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
290 percent_formats = data.setdefault('percent_formats', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
291 for elem in tree.findall('//percentFormats/percentFormatLength'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
292 if 'draft' in elem.attrib and elem.attrib.get('type') in percent_formats:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
293 continue
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
294 pattern = unicode(elem.findtext('percentFormat/pattern'))
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
295 percent_formats[elem.attrib.get('type')] = numbers.parse_pattern(pattern)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
296
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
297 currency_names = data.setdefault('currency_names', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
298 currency_symbols = data.setdefault('currency_symbols', {})
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
299 for elem in tree.findall('//currencies/currency'):
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
300 name = elem.findtext('displayName')
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
301 if name:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
302 currency_names[elem.attrib['type']] = unicode(name)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
303 symbol = elem.findtext('symbol')
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
304 if symbol:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
305 currency_symbols[elem.attrib['type']] = unicode(symbol)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
306
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
307 dicts[stem] = data
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
308 outfile = open(os.path.join(destdir, stem + '.dat'), 'wb')
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
309 try:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
310 pickle.dump(data, outfile, 2)
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
311 finally:
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
312 outfile.close()
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
313
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
314 if __name__ == '__main__':
4a7af44e6695 Create branch for 0.8.x releases.
cmlenz
parents:
diff changeset
315 main()
Copyright (C) 2012-2017 Edgewall Software