3 # Written by Martin v. Löwis <loewis@informatik.hu-berlin.de>
5 """Generate binary message catalog from textual translation description.
7 This program converts a textual Uniforum-style message catalog (.po file) into
8 a binary GNU catalog (.mo file). This is essentially the same function as the
9 GNU msgfmt program, however, it is a simpler implementation.
11 Usage: msgfmt.py [OPTIONS] filename.po
16 Print this message and exit.
20 Display version information and exit.
35 def usage(code
, msg
=''):
36 print >> sys
.stderr
, __doc__
38 print >> sys
.stderr
, msg
43 def add(id, str, fuzzy
):
44 "Add a non-fuzzy translation to the dictionary."
52 "Return the generated output."
54 keys
= MESSAGES
.keys()
55 # the keys are sorted in the .mo file
60 # For each string, we need size and file offset. Each string is NUL
61 # terminated; the NUL does not count into the size.
62 offsets
.append((len(ids
), len(id), len(strs
), len(MESSAGES
[id])))
64 strs
+= MESSAGES
[id] + '\0'
66 # The header is 7 32-bit unsigned integers. We don't use hash tables, so
67 # the keys start right after the index tables.
69 keystart
= 7*4+16*len(keys
)
70 # and the values start after the keys
71 valuestart
= keystart
+ len(ids
)
74 # The string table first has the list of keys, then the list of values.
75 # Each entry has first the size of the string, then the file offset.
76 for o1
, l1
, o2
, l2
in offsets
:
77 koffsets
+= [l1
, o1
+keystart
]
78 voffsets
+= [l2
, o2
+valuestart
]
79 offsets
= koffsets
+ voffsets
80 output
= struct
.pack("iiiiiii",
83 len(keys
), # # of entries
84 7*4, # start of key index
85 7*4+len(keys
)*8, # start of value index
86 0, 0) # size and offset of hash table
87 output
+= array
.array("i", offsets
).tostring()
98 # Compute .mo name from .po name
99 if filename
.endswith('.po'):
101 outfile
= filename
[:-2] + 'mo'
103 infile
= filename
+ '.po'
104 outfile
= filename
+ '.mo'
106 lines
= open(infile
).readlines()
108 print >> sys
.stderr
, msg
118 # If we get a comment line after a msgstr, this is a new entry
119 if l
[0] == '#' and section
== STR
:
120 add(msgid
, msgstr
, fuzzy
)
123 # Record a fuzzy mark
124 if l
[:2] == '#,' and l
.find('fuzzy'):
129 # Now we are in a msgid section, output previous section
130 if l
.startswith('msgid'):
132 add(msgid
, msgstr
, fuzzy
)
136 # Now we are in a msgstr section
137 elif l
.startswith('msgstr'):
144 # XXX: Does this always follow Python escape semantics?
151 print >> sys
.stderr
, 'Syntax error on %s:%d' % (infile
, lno
), \
153 print >> sys
.stderr
, l
157 add(msgid
, msgstr
, fuzzy
)
164 open(outfile
,"wb").write(output
)
166 print >> sys
.stderr
, msg
172 opts
, args
= getopt
.getopt(sys
.argv
[1:], 'hV', ['help','version'])
173 except getopt
.error
, msg
:
177 for opt
, arg
in opts
:
178 if opt
in ('-h', '--help'):
180 elif opt
in ('-V', '--version'):
181 print >> sys
.stderr
, "msgfmt.py", __version__
185 print >> sys
.stderr
, 'No input file given'
186 print >> sys
.stderr
, "Try `msgfmt --help' for more information."
189 for filename
in args
:
193 if __name__
== '__main__':