X-Git-Url: https://git.lyx.org/gitweb/?a=blobdiff_plain;f=po%2Flyx_pot.py;h=3da45a5a931aa39600aacf2b38adbd4f2a400497;hb=ec7f1239486c40ffd853549a0d03c9ebbaab7164;hp=6119ee6c067790ed678e0321c33693bf92366b4a;hpb=4ec7b36ab7fa34c3b646616ec67cdc1982519d12;p=lyx.git diff --git a/po/lyx_pot.py b/po/lyx_pot.py index 6119ee6c06..3da45a5a93 100755 --- a/po/lyx_pot.py +++ b/po/lyx_pot.py @@ -17,6 +17,8 @@ # to output in gettext .pot format. # import sys, os, re, getopt +if sys.version_info < (2, 4, 0): + from sets import Set as set def relativePath(path, base): '''return relative path from top source dir''' @@ -31,13 +33,23 @@ def relativePath(path, base): return path3 +def writeString(outfile, infile, basefile, lineno, string): + string = string.replace('\\', '\\\\').replace('"', '') + if string == "": + return + print >> outfile, '#: %s:%d\nmsgid "%s"\nmsgstr ""\n' % \ + (relativePath(infile, basefile), lineno, string) + + def ui_l10n(input_files, output, base): '''Generate pot file from lib/ui/*''' output = open(output, 'w') Submenu = re.compile(r'^[^#]*Submenu\s+"([^"]*)"') Popupmenu = re.compile(r'^[^#]*PopupMenu\s+"[^"]+"\s+"([^"]*)"') + IconPalette = re.compile(r'^[^#]*IconPalette\s+"[^"]+"\s+"([^"]*)"') Toolbar = re.compile(r'^[^#]*Toolbar\s+"[^"]+"\s+"([^"]*)"') Item = re.compile(r'[^#]*Item\s+"([^"]*)"') + TableInsert = re.compile(r'[^#]*TableInsert\s+"([^"]*)"') for src in input_files: input = open(src) for lineno, line in enumerate(input.readlines()): @@ -46,10 +58,14 @@ def ui_l10n(input_files, output, base): string = string.replace('_', ' ') elif Popupmenu.match(line): (string,) = Popupmenu.match(line).groups() + elif IconPalette.match(line): + (string,) = IconPalette.match(line).groups() elif Toolbar.match(line): (string,) = Toolbar.match(line).groups() elif Item.match(line): (string,) = Item.match(line).groups() + elif TableInsert.match(line): + (string,) = TableInsert.match(line).groups() else: continue string = string.replace('"', '') @@ -60,34 +76,263 @@ def ui_l10n(input_files, output, base): output.close() -def layouts_l10n(input_files, output, base): - '''Generate pot file from lib/layouts/*.layout and *.inc''' - output = open(output, 'w') - Style = re.compile(r'^Style\s+(.*)') +def layouts_l10n(input_files, output, base, layouttranslations): + '''Generate pot file from lib/layouts/*.{layout,inc,module}''' + Style = re.compile(r'^Style\s+(.*)', re.IGNORECASE) # include ???LabelString???, but exclude comment lines LabelString = re.compile(r'^[^#]*LabelString\S*\s+(.*)') GuiName = re.compile(r'\s*GuiName\s+(.*)') ListName = re.compile(r'\s*ListName\s+(.*)') + CategoryName = re.compile(r'\s*Category\s+(.*)') + NameRE = re.compile(r'DeclareLyXModule.*{(.*)}') + InsetLayout = re.compile(r'^InsetLayout\s+\"?(.*)\"?') + FlexCheck = re.compile(r'^Flex:(.*)') + DescBegin = re.compile(r'#+\s*DescriptionBegin\s*$') + DescEnd = re.compile(r'#+\s*DescriptionEnd\s*$') + Category = re.compile(r'#Category: (.*)$') + I18nPreamble = re.compile(r'\s*(Lang)|(Babel)Preamble\s*$') + EndI18nPreamble = re.compile(r'\s*End(Lang)|(Babel)Preamble\s*$') + I18nString = re.compile(r'_\(([^\)]+)\)') + CounterFormat = re.compile(r'\s*PrettyFormat\s+"?(.*)"?') + CiteFormat = re.compile(r'\s*CiteFormat') + KeyVal = re.compile(r'^\s*_\w+\s+(.*)$') + Float = re.compile(r'\s*Float') + End = re.compile(r'\s*End') + Comment = re.compile(r'\s*#') + Translation = re.compile(r'\s*Translation\s+(.*)\s*$') + KeyValPair = re.compile(r'\s*"(.*)"\s+"(.*)"') + + oldlanguages = [] + languages = [] + keyset = set() + oldtrans = dict() + if layouttranslations: + linguas_file = os.path.join(base, 'po/LINGUAS') + for line in open(linguas_file).readlines(): + if Comment.search(line) == None: + languages.extend(line.split()) + + # read old translations if available + try: + input = open(output) + lang = '' + for line in input.readlines(): + res = Comment.search(line) + if res: + continue + if line.strip() == '': + continue + res = Translation.search(line) + if res: + lang = res.group(1) + if lang not in languages: + oldlanguages.append(lang) + languages.append(lang) + oldtrans[lang] = dict() + continue + res = End.search(line) + if res: + lang = '' + continue + res = KeyValPair.search(line) + if res and lang != '': + key = res.group(1).decode('utf-8') + val = res.group(2).decode('utf-8') + key = key.replace('\\"', '"').replace('\\\\', '\\') + val = val.replace('\\"', '"').replace('\\\\', '\\') + oldtrans[lang][key] = val + keyset.add(key) + continue + print "Error: Unable to handle line:" + print line + except IOError: + pass + + # walon is not a known document language + # FIXME: Do not hardcode, read from lib/languages! + if 'wa' in languages: + languages.remove('wa') + + out = open(output, 'w') for src in input_files: - input = open(src) - for lineno, line in enumerate(input.readlines()): - if Style.match(line): - (string,) = Style.match(line).groups() + readingDescription = False + readingI18nPreamble = False + readingFloat = False + readingCiteFormats = False + descStartLine = -1 + descLines = [] + lineno = 0 + for line in open(src).readlines(): + lineno += 1 + if readingDescription: + res = DescEnd.search(line) + if res != None: + readingDescription = False + desc = " ".join(descLines) + if not layouttranslations: + writeString(out, src, base, lineno + 1, desc) + continue + descLines.append(line[1:].strip()) + continue + res = DescBegin.search(line) + if res != None: + readingDescription = True + descStartLine = lineno + continue + if readingI18nPreamble: + res = EndI18nPreamble.search(line) + if res != None: + readingI18nPreamble = False + continue + res = I18nString.search(line) + if res != None: + string = res.group(1) + if layouttranslations: + keyset.add(string) + else: + writeString(out, src, base, lineno, string) + continue + res = I18nPreamble.search(line) + if res != None: + readingI18nPreamble = True + continue + res = NameRE.search(line) + if res != None: + string = res.group(1) + if not layouttranslations: + writeString(out, src, base, lineno + 1, string) + continue + res = Style.search(line) + if res != None: + string = res.group(1) string = string.replace('_', ' ') - elif LabelString.match(line): - (string,) = LabelString.match(line).groups() - elif GuiName.match(line): - (string,) = GuiName.match(line).groups() - elif ListName.match(line): - (string,) = ListName.match(line).groups() - else: + if not layouttranslations: + writeString(out, src, base, lineno, string) continue - string = string.replace('\\', '\\\\').replace('"', '') - if string != "": - print >> output, '#: %s:%d\nmsgid "%s"\nmsgstr ""\n' % \ - (relativePath(src, base), lineno+1, string) - input.close() - output.close() + res = LabelString.search(line) + if res != None: + string = res.group(1) + if not layouttranslations: + writeString(out, src, base, lineno, string) + continue + res = GuiName.search(line) + if res != None: + string = res.group(1) + if layouttranslations: + # gui name must only be added for floats + if readingFloat: + keyset.add(string) + else: + writeString(out, src, base, lineno, string) + continue + res = CategoryName.search(line) + if res != None: + string = res.group(1) + if not layouttranslations: + writeString(out, src, base, lineno, string) + continue + res = ListName.search(line) + if res != None: + string = res.group(1) + if layouttranslations: + keyset.add(string.strip('"')) + else: + writeString(out, src, base, lineno, string) + continue + res = InsetLayout.search(line) + if res != None: + string = res.group(1) + string = string.replace('_', ' ') + #Flex:xxx is not used in translation + #if not layouttranslations: + # writeString(out, src, base, lineno, string) + m = FlexCheck.search(string) + if m: + if not layouttranslations: + writeString(out, src, base, lineno, m.group(1)) + continue + res = Category.search(line) + if res != None: + string = res.group(1) + if not layouttranslations: + writeString(out, src, base, lineno, string) + continue + res = CounterFormat.search(line) + if res != None: + string = res.group(1) + if not layouttranslations: + writeString(out, src, base, lineno, string) + continue + res = Float.search(line) + if res != None: + readingFloat = True + continue + res = CiteFormat.search(line) + if res != None: + readingCiteFormats = True + res = End.search(line) + if res != None: + readingCiteFormats = False + readingFloat = False + if readingCiteFormats: + res = KeyVal.search(line) + if res != None: + val = res.group(1) + if not layouttranslations: + writeString(out, src, base, lineno, val) + + if layouttranslations: + # Extract translations of layout files + import polib + + # Sort languages and key to minimize the diff between different runs + # with changed translations + languages.sort() + keys = [] + for key in keyset: + keys.append(key) + keys.sort() + + print >> out, '''# This file has been automatically generated by po/lyx_pot.py. +# PLEASE MODIFY ONLY THE LAGUAGES HAVING NO .po FILE! If you want to regenerate +# this file from the translations, run `make ../lib/layouttranslations' in po. +# Python polib library is needed for building the output file. +# +# This file should remain fixed during minor LyX releases.''' + for lang in languages: + print >> out, '\nTranslation %s' % lang + if lang in oldtrans.keys(): + trans = oldtrans[lang] + else: + trans = dict() + if not lang in oldlanguages: + poname = os.path.join(base, 'po/' + lang + '.po') + po = polib.pofile(poname) + # Iterate through po entries and not keys for speed reasons. + # FIXME: The code is still too slow + for entry in po: + if not entry.translated(): + continue + if entry.msgid in keys: + key = entry.msgid + val = entry.msgstr + # some translators keep untranslated entries + if val != key: + trans[key] = val + for key in keys: + if key in trans.keys(): + val = trans[key].replace('\\', '\\\\').replace('"', '\\"') + key = key.replace('\\', '\\\\').replace('"', '\\"') + print >> out, '\t"%s" "%s"' % \ + (key.encode('utf-8'), val.encode('utf-8')) + # to print untranslated entries, uncomment the following lines + #else: + # key = key.replace('\\', '\\\\').replace('"', '\\"') + # print >> out, '\t"%s" "%s"' % \ + # (key.encode('utf-8'), key.encode('utf-8')) + print >> out, 'End' + + out.close() def qt4_l10n(input_files, output, base): @@ -109,61 +354,167 @@ def qt4_l10n(input_files, output, base): # get lines that match ... if pat.match(line): (string,) = pat.match(line).groups() - string = string.replace('&', '&').replace('<', '<').replace('>', '>').replace('"', r'\"') + string = string.replace('&', '&').replace('"', '"') + string = string.replace('<', '<').replace('>', '>') + string = string.replace('\\', '\\\\').replace('"', r'\"') + string = string.replace(' ', r'\n') print >> output, '#: %s:%d\nmsgid "%s"\nmsgstr ""\n' % \ - (relativePath(src, base), lineno+1, string) + (relativePath(src, base), lineno+1, string) input.close() output.close() def languages_l10n(input_files, output, base): - '''Generate pot file from lib/language''' + '''Generate pot file from lib/languages''' + out = open(output, 'w') + GuiName = re.compile(r'^[^#]*GuiName\s+(.*)') + + for src in input_files: + descStartLine = -1 + descLines = [] + lineno = 0 + for line in open(src).readlines(): + lineno += 1 + res = GuiName.search(line) + if res != None: + string = res.group(1) + writeString(out, src, base, lineno, string) + continue + + out.close() + + +def external_l10n(input_files, output, base): + '''Generate pot file from lib/external_templates''' output = open(output, 'w') - # assuming only one language file - reg = re.compile('[\w-]+\s+[\w"]+\s+"([\w \-\(\)]+)"\s+(true|false)\s+[\w-]+\s+\w+\s+"[^"]*"') + Template = re.compile(r'^Template\s+(.*)') + GuiName = re.compile(r'\s*GuiName\s+(.*)') + HelpTextStart = re.compile(r'\s*HelpText\s') + HelpTextSection = re.compile(r'\s*(\S.*)\s*$') + HelpTextEnd = re.compile(r'\s*HelpTextEnd\s') + i = -1 + for src in input_files: + input = open(src) + inHelp = False + hadHelp = False + prev_help_string = '' + for lineno, line in enumerate(input.readlines()): + if Template.match(line): + (string,) = Template.match(line).groups() + elif GuiName.match(line): + (string,) = GuiName.match(line).groups() + elif inHelp: + if HelpTextEnd.match(line): + if hadHelp: + print >> output, '\nmsgstr ""\n' + inHelp = False + hadHelp = False + prev_help_string = '' + elif HelpTextSection.match(line): + (help_string,) = HelpTextSection.match(line).groups() + help_string = help_string.replace('"', '') + if help_string != "" and prev_help_string == '': + print >> output, '#: %s:%d\nmsgid ""\n"%s\\n"' % \ + (relativePath(src, base), lineno+1, help_string) + hadHelp = True + elif help_string != "": + print >> output, '"%s\\n"' % help_string + prev_help_string = help_string + elif HelpTextStart.match(line): + inHelp = True + prev_help_string = '' + else: + continue + string = string.replace('"', '') + if string != "" and not inHelp: + print >> output, '#: %s:%d\nmsgid "%s"\nmsgstr ""\n' % \ + (relativePath(src, base), lineno+1, string) + input.close() + output.close() + + +def formats_l10n(input_files, output, base): + '''Generate pot file from configure.py''' + output = open(output, 'w') + GuiName = re.compile(r'.*\Format\s+\S+\s+\S+\s+"([^"]*)"\s+(\S*)\s+.*') + GuiName2 = re.compile(r'.*\Format\s+\S+\s+\S+\s+([^"]\S+)\s+(\S*)\s+.*') + input = open(input_files[0]) + for lineno, line in enumerate(input.readlines()): + label = "" + labelsc = "" + if GuiName.match(line): + label = GuiName.match(line).group(1) + shortcut = GuiName.match(line).group(2).replace('"', '') + elif GuiName2.match(line): + label = GuiName2.match(line).group(1) + shortcut = GuiName2.match(line).group(2).replace('"', '') + else: + continue + label = label.replace('\\', '\\\\').replace('"', '') + if shortcut != "": + labelsc = label + "|" + shortcut + if label != "": + print >> output, '#: %s:%d\nmsgid "%s"\nmsgstr ""\n' % \ + (relativePath(input_files[0], base), lineno+1, label) + if labelsc != "": + print >> output, '#: %s:%d\nmsgid "%s"\nmsgstr ""\n' % \ + (relativePath(input_files[0], base), lineno+1, labelsc) + input.close() + output.close() + + +def encodings_l10n(input_files, output, base): + '''Generate pot file from lib/encodings''' + output = open(output, 'w') + # assuming only one encodings file + # Encoding utf8 utf8 "Unicode (utf8)" UTF-8 variable inputenc + reg = re.compile('Encoding [\w-]+\s+[\w-]+\s+"([\w \-\(\)]+)"\s+[\w-]+\s+(fixed|variable)\s+\w+.*') input = open(input_files[0]) for lineno, line in enumerate(input.readlines()): - if line[0] == '#': + if not line.startswith('Encoding'): continue - # From: - # afrikaans afrikaans "Afrikaans" false iso8859-15 af_ZA "" - # To: - # #: lib/languages:2 - # msgid "Afrikaans" - # msgstr "" if reg.match(line): print >> output, '#: %s:%d\nmsgid "%s"\nmsgstr ""\n' % \ (relativePath(input_files[0], base), lineno+1, reg.match(line).groups()[0]) else: print "Error: Unable to handle line:" print line - sys.exit(1) + # No need to abort if the parsing fails + # sys.exit(1) input.close() output.close() + Usage = ''' -lyx_pot.py [-b|--base top_src_dir] [-o|--output output_file] [-h|--help] -t|--type input_type input_files +lyx_pot.py [-b|--base top_src_dir] [-o|--output output_file] [-h|--help] [-s|src_file filename] -t|--type input_type input_files -where +where --base: path to the top source directory. default to '.' --output: output pot file, default to './lyx.pot' + --src_file + filename that contains a list of input files in each line --input_type can be ui: lib/ui/* layouts: lib/layouts/* + layouttranslations: create lib/layouttranslations from po/*.po and lib/layouts/* qt4: qt4 ui files languages: file lib/languages + encodings: file lib/encodings + external: external templates file + formats: formats predefined in lib/configure.py ''' if __name__ == '__main__': input_type = None output = 'lyx.pot' base = '.' + input_files = [] # - optlist, args = getopt.getopt(sys.argv[1:], 'ht:o:b:', - ['help', 'type=', 'output=', 'base=']) + optlist, args = getopt.getopt(sys.argv[1:], 'ht:o:b:s:', + ['help', 'type=', 'output=', 'base=', 'src_file=']) for (opt, value) in optlist: if opt in ['-h', '--help']: print Usage @@ -174,15 +525,30 @@ if __name__ == '__main__': base = value elif opt in ['-t', '--type']: input_type = value - if input_type not in ['ui', 'layouts', 'qt4', 'languages'] or output is None: + elif opt in ['-s', '--src_file']: + input_files = [f.strip() for f in open(value)] + + if input_type not in ['ui', 'layouts', 'layouttranslations', 'qt4', 'languages', 'encodings', 'external', 'formats'] or output is None: print 'Wrong input type or output filename.' sys.exit(1) + + input_files += args + if input_type == 'ui': - ui_l10n(args, output, base) + ui_l10n(input_files, output, base) elif input_type == 'layouts': - layouts_l10n(args, output, base) + layouts_l10n(input_files, output, base, False) + elif input_type == 'layouttranslations': + layouts_l10n(input_files, output, base, True) elif input_type == 'qt4': - qt4_l10n(args, output, base) + qt4_l10n(input_files, output, base) + elif input_type == 'external': + external_l10n(input_files, output, base) + elif input_type == 'formats': + formats_l10n(input_files, output, base) + elif input_type == 'encodings': + encodings_l10n(input_files, output, base) else: - languages_l10n(args, output, base) + languages_l10n(input_files, output, base) +