1
|
|
|
#! /usr/bin/env python2 |
2
|
|
|
# -*- coding: utf-8 -*- |
3
|
|
|
|
4
|
|
|
# Written by Martin v. Löwis <[email protected]> |
5
|
|
|
|
6
|
|
|
"""Generate binary message catalog from textual translation description. |
7
|
|
|
|
8
|
|
|
This program converts a textual Uniforum-style message catalog (.po file) into |
9
|
|
|
a binary GNU catalog (.mo file). This is essentially the same function as the |
10
|
|
|
GNU msgfmt program, however, it is a simpler implementation. |
11
|
|
|
|
12
|
|
|
Usage: msgfmt.py [OPTIONS] filename.po |
13
|
|
|
|
14
|
|
|
Options: |
15
|
|
|
-o file |
16
|
|
|
--output-file=file |
17
|
|
|
Specify the output file to write to. If omitted, output will go to a |
18
|
|
|
file named filename.mo (based off the input file name). |
19
|
|
|
|
20
|
|
|
-h |
21
|
|
|
--help |
22
|
|
|
Print this message and exit. |
23
|
|
|
|
24
|
|
|
-V |
25
|
|
|
--version |
26
|
|
|
Display version information and exit. |
27
|
|
|
""" |
28
|
|
|
|
29
|
|
|
import sys |
30
|
|
|
import os |
31
|
|
|
import getopt |
32
|
|
|
import struct |
33
|
|
|
import array |
34
|
|
|
|
35
|
|
|
# Version string printed by the -V / --version command-line option.
__version__ = "1.1"

# Catalog being built: maps each msgid to its msgstr.  add() inserts into it
# and generate() reads it to produce the binary output.
MESSAGES = {}
38
|
|
|
|
39
|
|
|
|
40
|
|
|
|
41
|
|
|
def usage(code, msg=''):
    """Write the module help text to stderr and terminate the program.

    code -- exit status passed to sys.exit().
    msg  -- optional extra message; when truthy it is formatted with %s and
            written on its own line after the help text.
    """
    # sys.stderr.write() is used instead of the Python 2 only
    # "print >> sys.stderr, ..." statement: it emits the same text and also
    # runs on Python 3, where the old spelling raises TypeError.
    sys.stderr.write('%s\n' % (__doc__,))
    if msg:
        sys.stderr.write('%s\n' % (msg,))
    sys.exit(code)
46
|
|
|
|
47
|
|
|
|
48
|
|
|
|
49
|
|
|
def add(id, str, fuzzy):
    """Store the translation *str* for *id* in MESSAGES.

    Nothing is stored when the entry is marked fuzzy or when the
    translation is empty.
    """
    if fuzzy or not str:
        return
    MESSAGES[id] = str
54
|
|
|
|
55
|
|
|
|
56
|
|
|
|
57
|
|
|
def generate():
    """Return the binary .mo catalog for the entries stored in MESSAGES.

    The returned byte string is laid out as:

      1. a header of seven integers: magic number, format version, number
         of entries, offset of the key index, offset of the value index,
         and the size and offset of the hash table (both 0: none is
         written);
      2. the key index, one (length, file offset) pair per msgid;
      3. the value index, one (length, file offset) pair per msgstr;
      4. all msgids, each followed by a NUL byte;
      5. all msgstrs, each followed by a NUL byte.

    Integers are packed with struct in native byte order.  The offset
    arithmetic below assumes each one occupies 4 bytes.
    """
    # The keys are sorted in the .mo file.
    keys = sorted(MESSAGES)

    # For each string we need its size and its offset inside its own blob.
    # Each string is NUL terminated; the NUL does not count into the size.
    offsets = []
    id_parts = []
    str_parts = []
    id_pos = str_pos = 0
    for key in keys:
        value = MESSAGES[key]
        offsets.append((id_pos, len(key), str_pos, len(value)))
        id_parts.append(key)
        str_parts.append(value)
        id_pos += len(key) + 1
        str_pos += len(value) + 1
    # Join once instead of growing two strings with += inside the loop.
    ids = b''.join(part + b'\0' for part in id_parts)
    strs = b''.join(part + b'\0' for part in str_parts)

    # The header is 7 integers of 4 bytes.  We don't use hash tables, so the
    # keys start right after the two index tables (2 * 8 bytes per entry).
    keystart = 7 * 4 + 16 * len(keys)
    # ... and the values start after the keys.
    valuestart = keystart + len(ids)

    # The string table first has the list of keys, then the list of values.
    # Each entry has first the size of the string, then the file offset.
    koffsets = []
    voffsets = []
    for id_off, id_len, str_off, str_len in offsets:
        koffsets += [id_len, id_off + keystart]
        voffsets += [str_len, str_off + valuestart]
    index = koffsets + voffsets

    # The magic number is larger than the biggest signed 32-bit value, so it
    # has to be packed as unsigned ("I"); a signed "i" is rejected by struct
    # as out of range.
    header = struct.pack("Iiiiiii",
                         0x950412de,              # Magic
                         0,                       # Version
                         len(keys),               # # of entries
                         7 * 4,                   # start of key index
                         7 * 4 + len(keys) * 8,   # start of value index
                         0, 0)                    # size and offset of hash table
    # Same native "i" encoding the index had before, without relying on
    # array.tostring().
    table = struct.pack("%di" % len(index), *index)
    return header + table + ids + strs
97
|
|
|
|
98
|
|
|
|
99
|
|
|
|
100
|
|
|
def make(filename, outfile):
    """Compile the .po catalog *filename* into a binary .mo file.

    filename -- path of the textual catalog; '.po' is appended when the
                name does not already end with it.
    outfile  -- path of the file to write, or None to use the input path
                with its extension replaced by '.mo'.

    Each parsed (msgid, msgstr, fuzzy) entry is handed to add(); the bytes
    returned by generate() are then written to the output file.

    The program exits with status 1 when the input cannot be read or when
    a quoted string appears before any msgid/msgstr keyword.  A failure to
    write the output is only reported on stderr.

    Note: this function does not empty MESSAGES, so entries added by an
    earlier call are still present when generate() runs.
    """
    ID = 1
    STR = 2

    # Compute .mo name from .po name and arguments
    if filename.endswith('.po'):
        infile = filename
    else:
        infile = filename + '.po'
    if outfile is None:
        outfile = os.path.splitext(infile)[0] + '.mo'

    try:
        # "with" closes the file even when reading fails part-way.
        with open(infile) as po_file:
            lines = po_file.readlines()
    except IOError as msg:
        sys.stderr.write('%s\n' % (msg,))
        sys.exit(1)

    section = None
    fuzzy = False

    # Parse the catalog
    for lno, line in enumerate(lines, 1):
        # If we get a comment line after a msgstr, this is a new entry
        if line[0] == '#' and section == STR:
            add(msgid, msgstr, fuzzy)
            section = None
            fuzzy = False
        # Record a fuzzy mark.  A membership test is required here:
        # str.find() returns -1 (which is true) when the word is absent, so
        # using it as a condition flagged every "#," line as fuzzy.
        if line[:2] == '#,' and 'fuzzy' in line:
            fuzzy = True
        # Skip comments
        if line[0] == '#':
            continue
        # Now we are in a msgid section, output previous section
        if line.startswith('msgid'):
            if section == STR:
                add(msgid, msgstr, fuzzy)
                # The mark belonged to the entry just flushed; without this
                # reset it would leak onto an entry that has no comment
                # line of its own.
                fuzzy = False
            section = ID
            line = line[5:]
            msgid = msgstr = ''
        # Now we are in a msgstr section
        elif line.startswith('msgstr'):
            section = STR
            line = line[6:]
        # Skip empty lines
        line = line.strip()
        if not line:
            continue
        # NOTE(security): eval() executes whatever expression the catalog
        # contains, so only compile .po files from a trusted source.
        # XXX: Does this always follow Python escape semantics?
        text = eval(line)
        if section == ID:
            msgid += text
        elif section == STR:
            msgstr += text
        else:
            sys.stderr.write('Syntax error on %s:%d before:\n' % (infile, lno))
            sys.stderr.write('%s\n' % (text,))
            sys.exit(1)
    # Add last entry
    if section == STR:
        add(msgid, msgstr, fuzzy)

    # Compute output
    output = generate()

    try:
        with open(outfile, "wb") as mo_file:
            mo_file.write(output)
    except IOError as msg:
        sys.stderr.write('%s\n' % (msg,))
173
|
|
|
|
174
|
|
|
|
175
|
|
|
|
176
|
|
|
def main():
    """Command-line entry point.

    Parses sys.argv, handles -h/--help, -V/--version and -o/--output-file,
    then calls make() once for every remaining argument, passing the same
    output file name each time.  An option error is reported through
    usage() with exit status 1.  When no input file is given, a hint is
    written to stderr and the function returns without exiting.
    """
    # "except ... as" and sys.stderr.write() replace the Python 2 only
    # "except X, e" and "print >> file" spellings; the text written and the
    # exit codes are unchanged.
    try:
        opts, args = getopt.getopt(sys.argv[1:], 'hVo:',
                                   ['help', 'version', 'output-file='])
    except getopt.error as msg:
        usage(1, msg)

    outfile = None
    # parse options
    for opt, arg in opts:
        if opt in ('-h', '--help'):
            usage(0)
        elif opt in ('-V', '--version'):
            sys.stderr.write('msgfmt.py %s\n' % (__version__,))
            sys.exit(0)
        elif opt in ('-o', '--output-file'):
            outfile = arg
    # do it
    if not args:
        sys.stderr.write('No input file given\n')
        sys.stderr.write("Try `msgfmt --help' for more information.\n")
        return

    for filename in args:
        make(filename, outfile)
201
|
|
|
|
202
|
|
|
|
203
|
|
|
# Run the command-line interface only when this file is executed as a
# script, not when it is imported as a module.
if __name__ == '__main__':
    main()
205
|
|
|
|