]> git.lyx.org Git - lyx.git/blobdiff - po/lyx_pot.py
Add comment
[lyx.git] / po / lyx_pot.py
index 2dd883aec5fd0fc5e45fd8df6b26ee59c9cae824..3da45a5a931aa39600aacf2b38adbd4f2a400497 100755 (executable)
@@ -17,6 +17,8 @@
 # to output in gettext .pot format.
 #
 import sys, os, re, getopt
+if sys.version_info < (2, 4, 0):
+    from sets import Set as set
 
 def relativePath(path, base):
     '''return relative path from top source dir'''
@@ -25,28 +27,48 @@ def relativePath(path, base):
     path2 = os.path.normpath(os.path.realpath(base)).split(os.sep)
     if path1[:len(path2)] != path2:
         print "Path %s is not under top source directory" % path
-    return os.path.join(*path1[len(path2):])
+    path3 = os.path.join(*path1[len(path2):]);
+    # replace all \ by / such that we get the same comments on Windows and *nix
+    path3 = path3.replace('\\', '/')
+    return path3
+
+
+def writeString(outfile, infile, basefile, lineno, string):
+    string = string.replace('\\', '\\\\').replace('"', '')
+    if string == "":
+        return
+    print >> outfile, '#: %s:%d\nmsgid "%s"\nmsgstr ""\n' % \
+        (relativePath(infile, basefile), lineno, string)
 
 
 def ui_l10n(input_files, output, base):
     '''Generate pot file from lib/ui/*'''
     output = open(output, 'w')
     Submenu = re.compile(r'^[^#]*Submenu\s+"([^"]*)"')
+    Popupmenu = re.compile(r'^[^#]*PopupMenu\s+"[^"]+"\s+"([^"]*)"')
+    IconPalette = re.compile(r'^[^#]*IconPalette\s+"[^"]+"\s+"([^"]*)"')
     Toolbar = re.compile(r'^[^#]*Toolbar\s+"[^"]+"\s+"([^"]*)"')
     Item = re.compile(r'[^#]*Item\s+"([^"]*)"')
+    TableInsert = re.compile(r'[^#]*TableInsert\s+"([^"]*)"')
     for src in input_files:
         input = open(src)
         for lineno, line in enumerate(input.readlines()):
             if Submenu.match(line):
                 (string,) = Submenu.match(line).groups()
                 string = string.replace('_', ' ')
+            elif Popupmenu.match(line):
+                (string,) = Popupmenu.match(line).groups()
+            elif IconPalette.match(line):
+                (string,) = IconPalette.match(line).groups()
             elif Toolbar.match(line):
                 (string,) = Toolbar.match(line).groups()
             elif Item.match(line):
                 (string,) = Item.match(line).groups()
+            elif TableInsert.match(line):
+                (string,) = TableInsert.match(line).groups()
             else:
                 continue
-            string = string.replace('\\', '\\\\').replace('"', '')
+            string = string.replace('"', '')
             if string != "":
                 print >> output, '#: %s:%d\nmsgid "%s"\nmsgstr ""\n' % \
                     (relativePath(src, base), lineno+1, string)
@@ -54,34 +76,263 @@ def ui_l10n(input_files, output, base):
     output.close()
 
 
-def layouts_l10n(input_files, output, base):
-    '''Generate pot file from lib/layouts/*.layout and *.inc'''
-    output = open(output, 'w')
-    Style = re.compile(r'^Style\s+(.*)')
+def layouts_l10n(input_files, output, base, layouttranslations):
+    '''Generate pot file from lib/layouts/*.{layout,inc,module}'''
+    Style = re.compile(r'^Style\s+(.*)', re.IGNORECASE)
     # include ???LabelString???, but exclude comment lines
     LabelString = re.compile(r'^[^#]*LabelString\S*\s+(.*)')
     GuiName = re.compile(r'\s*GuiName\s+(.*)')
     ListName = re.compile(r'\s*ListName\s+(.*)')
+    CategoryName = re.compile(r'\s*Category\s+(.*)')
+    NameRE = re.compile(r'DeclareLyXModule.*{(.*)}')
+    InsetLayout = re.compile(r'^InsetLayout\s+\"?(.*)\"?')
+    FlexCheck = re.compile(r'^Flex:(.*)')
+    DescBegin = re.compile(r'#+\s*DescriptionBegin\s*$')
+    DescEnd = re.compile(r'#+\s*DescriptionEnd\s*$')
+    Category = re.compile(r'#Category: (.*)$')
+    I18nPreamble = re.compile(r'\s*(Lang)|(Babel)Preamble\s*$')
+    EndI18nPreamble = re.compile(r'\s*End(Lang)|(Babel)Preamble\s*$')
+    I18nString = re.compile(r'_\(([^\)]+)\)')
+    CounterFormat = re.compile(r'\s*PrettyFormat\s+"?(.*)"?')
+    CiteFormat = re.compile(r'\s*CiteFormat')
+    KeyVal = re.compile(r'^\s*_\w+\s+(.*)$')
+    Float = re.compile(r'\s*Float')
+    End = re.compile(r'\s*End')
+    Comment = re.compile(r'\s*#')
+    Translation = re.compile(r'\s*Translation\s+(.*)\s*$')
+    KeyValPair = re.compile(r'\s*"(.*)"\s+"(.*)"')
+
+    oldlanguages = []
+    languages = []
+    keyset = set()
+    oldtrans = dict()
+    if layouttranslations:
+        linguas_file = os.path.join(base, 'po/LINGUAS')
+        for line in open(linguas_file).readlines():
+            if Comment.search(line) == None:
+                languages.extend(line.split())
+
+        # read old translations if available
+        try:
+            input = open(output)
+            lang = ''
+            for line in input.readlines():
+                res = Comment.search(line)
+                if res:
+                    continue
+                if line.strip() == '':
+                    continue
+                res = Translation.search(line)
+                if res:
+                    lang = res.group(1)
+                    if lang not in languages:
+                        oldlanguages.append(lang)
+                        languages.append(lang)
+                    oldtrans[lang] = dict()
+                    continue
+                res = End.search(line)
+                if res:
+                    lang = ''
+                    continue
+                res = KeyValPair.search(line)
+                if res and lang != '':
+                    key = res.group(1).decode('utf-8')
+                    val = res.group(2).decode('utf-8')
+                    key = key.replace('\\"', '"').replace('\\\\', '\\')
+                    val = val.replace('\\"', '"').replace('\\\\', '\\')
+                    oldtrans[lang][key] = val
+                    keyset.add(key)
+                    continue
+                print "Error: Unable to handle line:"
+                print line
+        except IOError:
+            pass
+
+        # walon is not a known document language
+        # FIXME: Do not hardcode, read from lib/languages!
+        if 'wa' in languages:
+            languages.remove('wa')
+
+    out = open(output, 'w')
     for src in input_files:
-        input = open(src)
-        for lineno, line in enumerate(input.readlines()):
-            if Style.match(line):
-                (string,) = Style.match(line).groups()
+        readingDescription = False
+        readingI18nPreamble = False
+        readingFloat = False
+        readingCiteFormats = False
+        descStartLine = -1
+        descLines = []
+        lineno = 0
+        for line in open(src).readlines():
+            lineno += 1
+            if readingDescription:
+                res = DescEnd.search(line)
+                if res != None:
+                    readingDescription = False
+                    desc = " ".join(descLines)
+                    if not layouttranslations:
+                        writeString(out, src, base, lineno + 1, desc)
+                    continue
+                descLines.append(line[1:].strip())
+                continue
+            res = DescBegin.search(line)
+            if res != None:
+                readingDescription = True
+                descStartLine = lineno
+                continue
+            if readingI18nPreamble:
+                res = EndI18nPreamble.search(line)
+                if res != None:
+                    readingI18nPreamble = False
+                    continue
+                res = I18nString.search(line)
+                if res != None:
+                    string = res.group(1)
+                    if layouttranslations:
+                        keyset.add(string)
+                    else:
+                        writeString(out, src, base, lineno, string)
+                continue
+            res = I18nPreamble.search(line)
+            if res != None:
+                readingI18nPreamble = True
+                continue
+            res = NameRE.search(line)
+            if res != None:
+                string = res.group(1)
+                if not layouttranslations:
+                    writeString(out, src, base, lineno + 1, string)
+                continue
+            res = Style.search(line)
+            if res != None:
+                string = res.group(1)
                 string = string.replace('_', ' ')
-            elif LabelString.match(line):
-                (string,) = LabelString.match(line).groups()
-            elif GuiName.match(line):
-                (string,) = GuiName.match(line).groups()
-            elif ListName.match(line):
-                (string,) = ListName.match(line).groups()
-            else:
+                if not layouttranslations:
+                    writeString(out, src, base, lineno, string)
                 continue
-            string = string.replace('\\', '\\\\').replace('"', '')
-            if string != "":
-                print >> output, '#: %s:%d\nmsgid "%s"\nmsgstr ""\n' % \
-                    (relativePath(src, base), lineno+1, string)
-        input.close()
-    output.close()
+            res = LabelString.search(line)
+            if res != None:
+                string = res.group(1)
+                if not layouttranslations:
+                    writeString(out, src, base, lineno, string)
+                continue
+            res = GuiName.search(line)
+            if res != None:
+                string = res.group(1)
+                if layouttranslations:
+                    # gui name must only be added for floats
+                    if readingFloat:
+                        keyset.add(string)
+                else:
+                    writeString(out, src, base, lineno, string)
+                continue
+            res = CategoryName.search(line)
+            if res != None:
+                string = res.group(1)
+                if not layouttranslations:
+                    writeString(out, src, base, lineno, string)
+                continue
+            res = ListName.search(line)
+            if res != None:
+                string = res.group(1)
+                if layouttranslations:
+                    keyset.add(string.strip('"'))
+                else:
+                    writeString(out, src, base, lineno, string)
+                continue
+            res = InsetLayout.search(line)
+            if res != None:
+                string = res.group(1)
+                string = string.replace('_', ' ')
+                #Flex:xxx is not used in translation
+                #if not layouttranslations:
+                #    writeString(out, src, base, lineno, string)
+                m = FlexCheck.search(string)
+                if m:
+                    if not layouttranslations:
+                        writeString(out, src, base, lineno, m.group(1))
+                continue
+            res = Category.search(line)
+            if res != None:
+                string = res.group(1)
+                if not layouttranslations:
+                    writeString(out, src, base, lineno, string)
+                continue
+            res = CounterFormat.search(line)
+            if res != None:
+                string = res.group(1)
+                if not layouttranslations:
+                    writeString(out, src, base, lineno, string)
+                continue
+            res = Float.search(line)
+            if res != None:
+                readingFloat = True
+                continue
+            res = CiteFormat.search(line)
+            if res != None:
+                readingCiteFormats = True
+            res = End.search(line)
+            if res != None:
+                readingCiteFormats = False
+                readingFloat = False
+            if readingCiteFormats:
+                res = KeyVal.search(line)
+                if res != None:
+                    val = res.group(1)
+                    if not layouttranslations:
+                        writeString(out, src, base, lineno, val)
+
+    if layouttranslations:
+        # Extract translations of layout files
+        import polib
+
+        # Sort languages and key to minimize the diff between different runs
+        # with changed translations
+        languages.sort()
+        keys = []
+        for key in keyset:
+            keys.append(key)
+        keys.sort()
+
+        print >> out, '''# This file has been automatically generated by po/lyx_pot.py.
+# PLEASE MODIFY ONLY THE LAGUAGES HAVING NO .po FILE! If you want to regenerate
+# this file from the translations, run `make ../lib/layouttranslations' in po.
+# Python polib library is needed for building the output file.
+#
+# This file should remain fixed during minor LyX releases.'''
+        for lang in languages:
+            print >> out, '\nTranslation %s' % lang
+            if lang in oldtrans.keys():
+                trans = oldtrans[lang]
+            else:
+                trans = dict()
+            if not lang in oldlanguages:
+                poname = os.path.join(base, 'po/' + lang + '.po')
+                po = polib.pofile(poname)
+                # Iterate through po entries and not keys for speed reasons.
+                # FIXME: The code is still too slow
+                for entry in po:
+                    if not entry.translated():
+                        continue
+                    if entry.msgid in keys:
+                        key = entry.msgid
+                        val = entry.msgstr
+                        # some translators keep untranslated entries
+                        if val != key:
+                            trans[key] = val
+            for key in keys:
+                if key in trans.keys():
+                    val = trans[key].replace('\\', '\\\\').replace('"', '\\"')
+                    key = key.replace('\\', '\\\\').replace('"', '\\"')
+                    print >> out, '\t"%s" "%s"' % \
+                             (key.encode('utf-8'), val.encode('utf-8'))
+                # to print untranslated entries, uncomment the following lines
+                #else:
+                #    key = key.replace('\\', '\\\\').replace('"', '\\"')
+                #    print >> out, '\t"%s" "%s"' % \
+                #             (key.encode('utf-8'), key.encode('utf-8'))
+            print >> out, 'End'
+
+    out.close()
 
 
 def qt4_l10n(input_files, output, base):
@@ -103,59 +354,167 @@ def qt4_l10n(input_files, output, base):
             # get lines that match <string>...</string>
             if pat.match(line):
                 (string,) = pat.match(line).groups()
-                string = string.replace('&amp;', '&').replace('&lt;', '<').replace('&gt;', '>').replace('"', r'\"')
+                string = string.replace('&amp;', '&').replace('&quot;', '"')
+                string = string.replace('&lt;', '<').replace('&gt;', '>')
+                string = string.replace('\\', '\\\\').replace('"', r'\"')
+                string = string.replace('&#x0a;', r'\n')
                 print >> output, '#: %s:%d\nmsgid "%s"\nmsgstr ""\n' % \
-                    (relativePath(src, base), lineno+1, string) 
+                    (relativePath(src, base), lineno+1, string)
         input.close()
     output.close()
 
 
 def languages_l10n(input_files, output, base):
-    '''Generate pot file from lib/language'''
+    '''Generate pot file from lib/languages'''
+    out = open(output, 'w')
+    GuiName = re.compile(r'^[^#]*GuiName\s+(.*)')
+    
+    for src in input_files:
+        descStartLine = -1
+        descLines = []
+        lineno = 0
+        for line in open(src).readlines():
+            lineno += 1
+            res = GuiName.search(line)
+            if res != None:
+                string = res.group(1)
+                writeString(out, src, base, lineno, string)
+                continue
+               
+    out.close()
+
+
+def external_l10n(input_files, output, base):
+    '''Generate pot file from lib/external_templates'''
+    output = open(output, 'w')
+    Template = re.compile(r'^Template\s+(.*)')
+    GuiName = re.compile(r'\s*GuiName\s+(.*)')
+    HelpTextStart = re.compile(r'\s*HelpText\s')
+    HelpTextSection = re.compile(r'\s*(\S.*)\s*$')
+    HelpTextEnd = re.compile(r'\s*HelpTextEnd\s')
+    i = -1
+    for src in input_files:
+        input = open(src)
+        inHelp = False
+        hadHelp = False
+        prev_help_string = ''
+        for lineno, line in enumerate(input.readlines()):
+            if Template.match(line):
+                (string,) = Template.match(line).groups()
+            elif GuiName.match(line):
+                (string,) = GuiName.match(line).groups()
+            elif inHelp:
+                if HelpTextEnd.match(line):
+                    if hadHelp:
+                        print >> output, '\nmsgstr ""\n'
+                    inHelp = False
+                    hadHelp = False
+                    prev_help_string = ''
+                elif HelpTextSection.match(line):
+                    (help_string,) = HelpTextSection.match(line).groups()
+                    help_string = help_string.replace('"', '')
+                    if help_string != "" and prev_help_string == '':
+                        print >> output, '#: %s:%d\nmsgid ""\n"%s\\n"' % \
+                            (relativePath(src, base), lineno+1, help_string)
+                        hadHelp = True
+                    elif help_string != "":
+                        print >> output, '"%s\\n"' % help_string
+                    prev_help_string = help_string
+            elif HelpTextStart.match(line):
+                inHelp = True
+                prev_help_string = ''
+            else:
+                continue
+            string = string.replace('"', '')
+            if string != "" and not inHelp:
+                print >> output, '#: %s:%d\nmsgid "%s"\nmsgstr ""\n' % \
+                    (relativePath(src, base), lineno+1, string)
+        input.close()
+    output.close()
+
+
+def formats_l10n(input_files, output, base):
+    '''Generate pot file from configure.py'''
     output = open(output, 'w')
-    # assuming only one language file
+    GuiName = re.compile(r'.*\Format\s+\S+\s+\S+\s+"([^"]*)"\s+(\S*)\s+.*')
+    GuiName2 = re.compile(r'.*\Format\s+\S+\s+\S+\s+([^"]\S+)\s+(\S*)\s+.*')
     input = open(input_files[0])
     for lineno, line in enumerate(input.readlines()):
-        if line[0] == '#':
+        label = ""
+        labelsc = ""
+        if GuiName.match(line):
+            label = GuiName.match(line).group(1)
+            shortcut = GuiName.match(line).group(2).replace('"', '')
+        elif GuiName2.match(line):
+            label = GuiName2.match(line).group(1)
+            shortcut = GuiName2.match(line).group(2).replace('"', '')
+        else:
             continue
-        items = line.split('"')
-        # empty lines?
-        if len(items) < 3:
+        label = label.replace('\\', '\\\\').replace('"', '')
+        if shortcut != "":
+            labelsc = label + "|" + shortcut
+        if label != "":
+            print >> output, '#: %s:%d\nmsgid "%s"\nmsgstr ""\n' % \
+                (relativePath(input_files[0], base), lineno+1, label)
+        if labelsc != "":
+            print >> output, '#: %s:%d\nmsgid "%s"\nmsgstr ""\n' % \
+                (relativePath(input_files[0], base), lineno+1, labelsc)
+    input.close()
+    output.close()
+
+
+def encodings_l10n(input_files, output, base):
+    '''Generate pot file from lib/encodings'''
+    output = open(output, 'w')
+    # assuming only one encodings file
+    #                 Encoding utf8      utf8    "Unicode (utf8)" UTF-8    variable inputenc
+    reg = re.compile('Encoding [\w-]+\s+[\w-]+\s+"([\w \-\(\)]+)"\s+[\w-]+\s+(fixed|variable)\s+\w+.*')
+    input = open(input_files[0])
+    for lineno, line in enumerate(input.readlines()):
+        if not line.startswith('Encoding'):
             continue
-        # From:
-        #   afrikaans   afrikaans      "Afrikaans"     false  iso8859-15 af_ZA  ""
-        # To:
-        #   #: lib/languages:2
-        #   msgid "Afrikaans"
-        #   msgstr ""
-        # I do not care extra "s like "af_ZA"
-        print >> output, '#: %s:%d\nmsgid "%s"\nmsgstr ""\n' % (relativePath(input_files[0], base), lineno+1, items[1])
+        if reg.match(line):
+            print >> output, '#: %s:%d\nmsgid "%s"\nmsgstr ""\n' % \
+                (relativePath(input_files[0], base), lineno+1, reg.match(line).groups()[0])
+        else:
+            print "Error: Unable to handle line:"
+            print line
+            # No need to abort if the parsing fails
+            # sys.exit(1)
     input.close()
     output.close()
 
 
+
 Usage = '''
-lyx_pot.py [-b|--base top_src_dir] [-o|--output output_file] [-h|--help] -t|--type input_type input_files
+lyx_pot.py [-b|--base top_src_dir] [-o|--output output_file] [-h|--help] [-s|src_file filename] -t|--type input_type input_files
 
-where 
+where
     --base:
         path to the top source directory. default to '.'
     --output:
         output pot file, default to './lyx.pot'
+    --src_file
+        filename that contains a list of input files in each line
     --input_type can be
         ui: lib/ui/*
         layouts: lib/layouts/*
+        layouttranslations: create lib/layouttranslations from po/*.po and lib/layouts/*
         qt4: qt4 ui files
         languages: file lib/languages
+        encodings: file lib/encodings
+        external: external templates file
+        formats: formats predefined in lib/configure.py
 '''
 
 if __name__ == '__main__':
     input_type = None
     output = 'lyx.pot'
     base = '.'
+    input_files = []
     #
-    optlist, args = getopt.getopt(sys.argv[1:], 'ht:o:b:',
-        ['help', 'type=', 'output=', 'base='])
+    optlist, args = getopt.getopt(sys.argv[1:], 'ht:o:b:s:',
+        ['help', 'type=', 'output=', 'base=', 'src_file='])
     for (opt, value) in optlist:
         if opt in ['-h', '--help']:
             print Usage
@@ -166,15 +525,30 @@ if __name__ == '__main__':
             base = value
         elif opt in ['-t', '--type']:
             input_type = value
-    if input_type not in ['ui', 'layouts', 'qt4', 'languages'] or output is None:
+        elif opt in ['-s', '--src_file']:
+            input_files = [f.strip() for f in open(value)]
+
+    if input_type not in ['ui', 'layouts', 'layouttranslations', 'qt4', 'languages', 'encodings', 'external', 'formats'] or output is None:
         print 'Wrong input type or output filename.'
         sys.exit(1)
+
+    input_files += args
+
     if input_type == 'ui':
-        ui_l10n(args, output, base)
+        ui_l10n(input_files, output, base)
     elif input_type == 'layouts':
-        layouts_l10n(args, output, base)
+        layouts_l10n(input_files, output, base, False)
+    elif input_type == 'layouttranslations':
+        layouts_l10n(input_files, output, base, True)
     elif input_type == 'qt4':
-        qt4_l10n(args, output, base)
+        qt4_l10n(input_files, output, base)
+    elif input_type == 'external':
+        external_l10n(input_files, output, base)
+    elif input_type == 'formats':
+        formats_l10n(input_files, output, base)
+    elif input_type == 'encodings':
+        encodings_l10n(input_files, output, base)
     else:
-        languages_l10n(args, output, base)
+        languages_l10n(input_files, output, base)
+