posplit
81 lines
| 2.8 KiB
| text/plain
|
TextLexer
/ i18n / posplit
Wagner Bruna
|
r11389 | #!/usr/bin/env python | ||
# | ||||
# posplit - split messages in paragraphs on .po/.pot files | ||||
# | ||||
# license: MIT/X11/Expat | ||||
# | ||||
Pulkit Goyal
|
r29153 | from __future__ import absolute_import, print_function | ||
Pulkit Goyal
|
r29152 | |||
import polib | ||||
Simon Heimberg
|
r20359 | import re | ||
Wagner Bruna
|
r11389 | import sys | ||
def addentry(po, entry, cache):
    """Add ``entry`` to ``po`` unless its msgid was already added.

    po    -- catalog being rebuilt; only its append() method is used
    entry -- entry to add; its msgid and occurrences attributes are used
    cache -- dict mapping each msgid to the entry already added for it;
             updated in place

    When an entry with the same msgid is already in ``cache``, only the
    occurrences of ``entry`` are appended to the existing entry; ``entry``
    itself is not added to ``po``.
    """
    known = cache.get(entry.msgid)
    if known is None:
        # first time this msgid is seen: it becomes the canonical entry
        po.append(entry)
        cache[entry.msgid] = entry
    else:
        known.occurrences.extend(entry.occurrences)
def mkentry(orig, delta, msgid, msgstr):
    """Return a new entry for one paragraph of ``orig``.

    The new entry is seeded from ``orig`` through POEntry.merge() and then
    gets its own msgid, msgstr and shifted occurrences.

    orig   -- entry the paragraph was taken from
    delta  -- number of lines added to each line number in orig.occurrences
    msgid  -- source text of the paragraph; orig.msgid is used when empty
    msgstr -- translation of the paragraph; orig.msgstr is used when empty
    """
    entry = polib.POEntry()
    entry.merge(orig)
    entry.msgid = msgid or orig.msgid
    entry.msgstr = msgstr or orig.msgstr
    shifted = []
    for path, line in orig.occurrences:
        # a reference without a line number (polib stores it with an empty
        # line field) cannot be shifted, so it is kept unchanged instead
        # of failing in int()
        if line not in ('', None):
            line = int(line) + delta
        shifted.append((path, line))
    entry.occurrences = shifted
    return entry
if __name__ == "__main__":
    # Split every message of the catalog given as first argument into one
    # entry per paragraph (paragraphs are separated by a blank line), then
    # save the catalog with po.save().
    if len(sys.argv) < 2:
        sys.exit('usage: %s FILE' % sys.argv[0])
    po = polib.pofile(sys.argv[1])

    cache = {}  # msgid -> entry already added, used to merge duplicates
    entries = po[:]
    po[:] = []  # the catalog is refilled below, paragraph by paragraph
    findd = re.compile(r' *\.\. (\w+)::')  # for finding directives
    for entry in entries:
        msgids = entry.msgid.split(u'\n\n')
        if entry.msgstr:
            msgstrs = entry.msgstr.split(u'\n\n')
        else:
            msgstrs = [u''] * len(msgids)

        if len(msgids) != len(msgstrs):
            # places the whole existing translation as a fuzzy
            # translation for each paragraph, to give the
            # translator a chance to recover part of the old
            # translation - erasing extra paragraphs is
            # probably better than retranslating all from start
            if 'fuzzy' not in entry.flags:
                entry.flags.append('fuzzy')
            msgstrs = [entry.msgstr] * len(msgids)

        # line offset of the current paragraph inside the original message
        delta = 0
        for msgid, msgstr in zip(msgids, msgstrs):
            # empty paragraphs and a lone '::' produce no entry, but they
            # still advance delta at the end of the loop body
            if msgid and msgid != '::':
                newentry = mkentry(entry, delta, msgid, msgstr)
                mdirective = findd.match(msgid)
                if mdirective:
                    if not msgid[mdirective.end():].rstrip():
                        # only directive, nothing to translate here
                        # ('continue' skips the update at the end of the
                        # loop, so the offset is advanced here)
                        delta += 2
                        continue
                    directive = mdirective.group(1)
                    if directive in ('container', 'include'):
                        if msgid.rstrip('\n').count('\n') == 0:
                            # only rst syntax, nothing to translate
                            delta += 2
                            continue
                        else:
                            # lines following directly, unexpected
                            print('Warning: text follows line with directive'
                                  ' %s' % directive)
                    # tell the translator to leave the directive untouched
                    comment = 'do not translate: .. %s::' % directive
                    if not newentry.comment:
                        newentry.comment = comment
                    elif comment not in newentry.comment:
                        newentry.comment += '\n' + comment
                addentry(po, newentry, cache)
            # lines of this paragraph plus the blank separator line
            delta += 2 + msgid.count('\n')
    po.save()