Fix the configure script. Python apparently does not like tabs as much as spaces.

[lyx.git] / lib / lyx2lyx / lyx_1_6.py
diff --git a/lib/lyx2lyx/lyx_1_6.py b/lib/lyx2lyx/lyx_1_6.py

index 21c3c26d264cdf9193093c7560899f88ed5813be..562f32946bcef81216f61757e8e2d703b472b5d1 100644 (file)
--- a/lib/lyx2lyx/lyx_1_6.py
+++ b/lib/lyx2lyx/lyx_1_6.py
@@ -50,6 +50,8 @@ def wrap_into_ert(string, src, dst):
        + dst + '\n\\end_layout\n\\end_inset\n')
  
  def put_cmd_in_ert(string):
+    for rep in unicode_reps:
+        string = string.replace(rep[1], rep[0].replace('\\\\', '\\'))
      string = string.replace('\\', "\\backslash\n")
      string = "\\begin_inset ERT\nstatus collapsed\n\\begin_layout Standard\n" \
        + string + "\n\\end_layout\n\\end_inset"
@@ -64,6 +66,11 @@ def add_to_preamble(document, text):
  
      document.preamble.extend(text)
  
+def insert_to_preamble(index, document, text):
+    """ Insert text to the preamble at a given line"""
+
+    document.preamble.insert(index, text)
+
  # Convert a LyX length into a LaTeX length
  def convert_len(len):
      units = {"text%":"\\backslash\ntextwidth", "col%":"\\backslash\ncolumnwidth",
@@ -130,7 +137,7 @@ def read_unicodesymbols():
      # Two backslashes, followed by some non-word character, and then a character
      # in brackets. The idea is to check for constructs like: \"{u}, which is how
      # they are written in the unicodesymbols file; but they can also be written
-    # as: \"u.
+    # as: \"u or even \" u.
      r = re.compile(r'\\\\(\W)\{(\w)\}')
      for line in fp.readlines():
          if line[0] != '#' and line.strip() != "":
@@ -151,8 +158,11 @@ def read_unicodesymbols():
                  # since it is done that way in the LyX file.
                  if m.group(1) == "\"":
                      command += "\\"
+                commandbl = command
                  command += m.group(1) + m.group(2)
+                commandbl += m.group(1) + ' ' + m.group(2)
                  spec_chars.append([command, unichr(eval(ucs4))])
+                spec_chars.append([commandbl, unichr(eval(ucs4))])
      fp.close()
      return spec_chars
  
@@ -199,7 +209,7 @@ def extract_argument(line):
      return (line[:pos + 1], line[pos + 1:])
  
  
-def latex2ert(line):
+def latex2ert(line, isindex):
      '''Converts LaTeX commands into ERT. line may well be a multi-line
         string when it is returned.'''
      if not line:
@@ -207,7 +217,11 @@ def latex2ert(line):
  
      retval = ""
      ## FIXME Escaped \ ??
-    labelre = re.compile(r'(.*?)\\(\\(?:[a-zA-Z]+|.))(.*)')
+    # This regex looks for a LaTeX command---i.e., something of the form
+    # "\alPhaStuFF", or "\X", where X is any character---where the command
+    # may also be preceded by an additional backslash, which is how it would
+    # appear (e.g.) in an InsetIndex.
+    labelre = re.compile(r'(.*?)\\?(\\(?:[a-zA-Z]+|.))(.*)')
  
      m = labelre.match(line)
      while m != None:
@@ -221,28 +235,48 @@ def latex2ert(line):
                  break
              cmd += arg
              end = rest
+        # If we wanted to put labels into an InsetLabel, for example, then we
+        # would just need to test here for cmd == "label" and then take some
+        # appropriate action, i.e., to use arg to get the content and then
+        # wrap it appropriately.
          cmd = put_cmd_in_ert(cmd)
          retval += "\n" + cmd + "\n"
          line = end
          m = labelre.match(line)
+    # put all remaining braces in ERT
+    line = wrap_into_ert(line, '}', '}')
+    line = wrap_into_ert(line, '{', '{')
+    if isindex:
+        # active character that is not available in all font encodings
+        line = wrap_into_ert(line, '|', '|')
      retval += line
      return retval
  
  
-def latex2lyx(data):
-    '''Takes a string, possibly multi-line, and returns the result of 
+unicode_reps = read_unicodesymbols()
+
+#Bug 5022....
+#We should probably do latex2ert first, then deal with stuff that DOESN'T
+#end up inside ERT. That routine could be modified so that it returned
+#a list of lines, and we could then skip ERT bits and only deal with
+#the other bits.
+def latex2lyx(data, isindex):
+    '''Takes a string, possibly multi-line, and returns the result of
      converting LaTeX constructs into LyX constructs. Returns a list of
-    lines, suitable for insertion into document.body.'''
+    lines, suitable for insertion into document.body.
+    The bool isindex specifies whether we are in an index macro (which
+    has some specific active characters that need to be ERTed).'''
  
+    if not data:
+        return [""]
      retval = []
  
      # Convert LaTeX to Unicode
-    reps = read_unicodesymbols()
      # Commands of this sort need to be checked to make sure they are
      # followed by a non-alpha character, lest we replace too much.
      hardone = re.compile(r'^\\\\[a-zA-Z]+$')
-    
-    for rep in reps:
+
+    for rep in unicode_reps:
          if hardone.match(rep[0]):
              pos = 0
              while True:
@@ -259,8 +293,11 @@ def latex2lyx(data):
          else:
              data = data.replace(rep[0], rep[1])
  
-    # Generic, \" -> ":
+    # Generic
+    # \" -> ":
      data = wrap_into_ert(data, r'\"', '"')
+    # \\ -> \:
+    data = data.replace('\\\\', '\\')
  
      # Math:
      mathre = re.compile('^(.*?)(\$.*?\$)(.*)')
@@ -277,83 +314,100 @@ def latex2lyx(data):
              g = m.group(3)
              if s:
                  # this is non-math!
-                s = latex2ert(s)
+                s = latex2ert(s, isindex)
                  subst = s.split('\n')
                  retval += subst
              retval.append("\\begin_inset Formula " + f)
              retval.append("\\end_inset")
              m = mathre.match(g)
          # Handle whatever is left, which is just text
-        g = latex2ert(g)
+        g = latex2ert(g, isindex)
          subst = g.split('\n')
          retval += subst
      return retval
  
  
-def lyx2latex(lines):
+def lyxline2latex(document, line, inert):
+    'Convert some LyX stuff into corresponding LaTeX stuff line-wise, as best we can.'
+    if line.startswith("\\begin_inset Formula"):
+        line = line[20:]
+    elif line.startswith("\\begin_inset Quotes"):
+        # For now, we do a very basic reversion. Someone who understands
+        # quotes is welcome to fix it up.
+        qtype = line[20:].strip()
+        # lang = qtype[0]
+        side = qtype[1]
+        dbls = qtype[2]
+        if side == "l":
+            if dbls == "d":
+                line = "``"
+            else:
+                line = "`"
+        else:
+            if dbls == "d":
+                line = "''"
+            else:
+                line = "'"
+    elif line.isspace() or \
+          line.startswith("\\begin_layout") or \
+          line.startswith("\\end_layout") or \
+          line.startswith("\\begin_inset") or \
+          line.startswith("\\end_inset") or \
+          line.startswith("\\lang") or \
+          line.strip() == "status collapsed" or \
+          line.strip() == "status open":
+        #skip all that stuff
+        return ""
+
+    # this needs to be added to the preamble because of cases like
+    # \textmu, \textbackslash, etc.
+    add_to_preamble(document, ['% added by lyx2lyx for converted entries',
+                               '\\@ifundefined{textmu}',
+                               ' {\\usepackage{textcomp}}{}'])
+    # a lossless reversion is not possible
+    # try at least to handle some common insets and settings
+    if inert:
+        line = line.replace(r'\backslash', '\\')
+    else:
+        line = line.replace('&', '\\&{}')
+        line = line.replace('#', '\\#{}')
+        line = line.replace('^', '\\^{}')
+        line = line.replace('%', '\\%{}')
+        line = line.replace('_', '\\_{}')
+        line = line.replace('$', '\\${}')
+
+        # Do the LyX text --> LaTeX conversion
+        for rep in unicode_reps:
+            line = line.replace(rep[1], rep[0].replace('\\\\', '\\') + "{}")
+            line = line.replace(r'\backslash', r'\textbackslash{}')
+            line = line.replace(r'\series bold', r'\bfseries{}').replace(r'\series default', r'\mdseries{}')
+            line = line.replace(r'\shape italic', r'\itshape{}').replace(r'\shape smallcaps', r'\scshape{}')
+            line = line.replace(r'\shape slanted', r'\slshape{}').replace(r'\shape default', r'\upshape{}')
+            line = line.replace(r'\emph on', r'\em{}').replace(r'\emph default', r'\em{}')
+            line = line.replace(r'\noun on', r'\scshape{}').replace(r'\noun default', r'\upshape{}')
+            line = line.replace(r'\bar under', r'\underbar{').replace(r'\bar default', r'}')
+            line = line.replace(r'\family sans', r'\sffamily{}').replace(r'\family default', r'\normalfont{}')
+            line = line.replace(r'\family typewriter', r'\ttfamily{}').replace(r'\family roman', r'\rmfamily{}')
+            line = line.replace(r'\InsetSpace ', r'').replace(r'\SpecialChar ', r'')
+    return line
+
+
+def lyx2latex(document, lines):
      'Convert some LyX stuff into corresponding LaTeX stuff, as best we can.'
      # clean up multiline stuff
      content = ""
      ert_end = 0
-    reps = read_unicodesymbols()
-  
+
      for curline in range(len(lines)):
-      line = lines[curline]
-      if line.startswith("\\begin_inset ERT"):
-          # We don't want to replace things inside ERT, so figure out
-          # where the end of the inset is.
-          ert_end = find_end_of_inset(lines, curline + 1)
-          continue
-      elif line.startswith("\\begin_inset Formula"):
-          line = line[20:]
-      elif line.startswith("\\begin_inset Quotes"):
-          # For now, we do a very basic reversion. Someone who understands
-          # quotes is welcome to fix it up.
-          qtype = line[20:].strip()
-          # lang = qtype[0]
-          side = qtype[1]
-          dbls = qtype[2]
-          if side == "l":
-              if dbls == "d":
-                  line = "``"
-              else:
-                  line = "`"
-          else:
-              if dbls == "d":
-                  line = "''"
-              else:
-                  line = "'"
-      elif line.isspace() or \
-            line.startswith("\\begin_layout") or \
-            line.startswith("\\end_layout") or \
-            line.startswith("\\begin_inset") or \
-            line.startswith("\\end_inset") or \
-            line.startswith("\\lang") or \
-            line.strip() == "status collapsed" or \
-            line.strip() == "status open":
-          #skip all that stuff
-          continue
-  
-      # a lossless reversion is not possible
-      # try at least to handle some common insets and settings
-      # do not replace inside ERTs
-      if ert_end >= curline:
-          line = line.replace(r'\backslash', r'\\')
-      else:
-          # Do the LyX text --> LaTeX conversion
-          for rep in reps:
-            line = line.replace(rep[1], rep[0])
-          line = line.replace(r'\backslash', r'\textbackslash{}')
-          line = line.replace(r'\series bold', r'\bfseries{}').replace(r'\series default', r'\mdseries{}')
-          line = line.replace(r'\shape italic', r'\itshape{}').replace(r'\shape smallcaps', r'\scshape{}')
-          line = line.replace(r'\shape slanted', r'\slshape{}').replace(r'\shape default', r'\upshape{}')
-          line = line.replace(r'\emph on', r'\em{}').replace(r'\emph default', r'\em{}')
-          line = line.replace(r'\noun on', r'\scshape{}').replace(r'\noun default', r'\upshape{}')
-          line = line.replace(r'\bar under', r'\underbar{').replace(r'\bar default', r'}')
-          line = line.replace(r'\family sans', r'\sffamily{}').replace(r'\family default', r'\normalfont{}')
-          line = line.replace(r'\family typewriter', r'\ttfamily{}').replace(r'\family roman', r'\rmfamily{}')
-          line = line.replace(r'\InsetSpace ', r'').replace(r'\SpecialChar ', r'')
-      content += line
+        line = lines[curline]
+        if line.startswith("\\begin_inset ERT"):
+            # We don't want to replace things inside ERT, so figure out
+            # where the end of the inset is.
+            ert_end = find_end_of_inset(lines, curline + 1)
+            continue
+        inert = ert_end >= curline
+        content += lyxline2latex(document, lines[curline], inert)
+      
      return content
  
  
@@ -655,7 +709,7 @@ def revert_long_charstyle_names(document):
          i = find_token(document.body, "\\begin_inset CharStyle", i)
          if i == -1:
              return
-        document.body[i] = document.body[i].replace("CharStyle CharStyle:", "CharStyle")
+        document.body[i] = document.body[i].replace("CharStyle CharStyle:", "CharStyle ")
          i += 1
  
  
@@ -727,7 +781,6 @@ def revert_flex(document):
          document.body[i] = document.body[i].replace('\\begin_inset Flex', '\\begin_inset CharStyle')
  
  
-#  Discard PDF options for hyperref
  def revert_pdf_options(document):
          "Revert PDF options for hyperref."
          # store the PDF options and delete the entries from the Lyx file
@@ -864,9 +917,12 @@ def revert_pdf_options(document):
                  setupstart = ""
                  setupend = ""
              # write the preamble
-            add_to_preamble(document,
-                                ['% Commands inserted by lyx2lyx for PDF properties',
-                                 '\\usepackage[unicode=true'
+            # babel must be loaded before hyperref, and hyperref must be in the
+            # first part of the preamble, like in LyX 1.6
+            insert_to_preamble(0, document,
+                                 '% Commands inserted by lyx2lyx for PDF properties\n'
+                                 + '\\usepackage{babel}\n'
+                                 + '\\usepackage[unicode=true'
                                   + bookmarks
                                   + breaklinks
                                   + pdfborder
@@ -875,14 +931,14 @@ def revert_pdf_options(document):
                                   + colorlinks
                                   + pagemode
                                   + ']\n'
-                                 ' {hyperref}\n'
+                                 + ' {hyperref}\n'
                                   + setupstart
                                   + title
                                   + author
                                   + subject
                                   + keywords
                                   + otheroptions
-                                 + setupend])
+                                 + setupend)
  
  
  def remove_inzip_options(document):
@@ -962,6 +1018,7 @@ def revert_inset_command(document):
          m = r.match(nextline)
          if not m:
              document.warning("Malformed LyX document: Missing LatexCommand in " + document.body[i] + ".")
+            i += 1
              continue
          cmdName = m.group(1)
          insertion = ["\\begin_inset LatexCommand " + cmdName]
@@ -1030,27 +1087,27 @@ def convert_latexcommand_index(document):
          if i == -1:
              return
          if document.body[i + 1] != "LatexCommand index": # Might also be index_print
-            return
+            i += 1
+            continue
+        j = find_end_of_inset(document.body, i + 1)
+        if j == -1:
+            document.warning("Unable to find end of index inset at line " + str(i) + "!")
+            i += 2
+            continue
          m = r1.match(document.body[i + 2])
          if m == None:
              document.warning("Unable to match: " + document.body[i+2])
-            i += 1
-            continue
-        fullcontent = m.group(1)
+            # this can happen with empty index insets!
+            linelist = [""]
+        else:
+            fullcontent = m.group(1)
+            linelist = latex2lyx(fullcontent, True)
          #document.warning(fullcontent)
-        document.body[i:i + 3] = ["\\begin_inset Index",
-          "status collapsed",
-          "\\begin_layout Standard"]
-        i += 3
-        # We are now on the blank line preceding "\end_inset"
-        # We will write the content here, into the inset.
-
-        linelist = latex2lyx(fullcontent)
-        document.body[i+1:i+1] = linelist
-        i += len(linelist)
-
-        document.body.insert(i + 1, "\\end_layout")
-        i += 1
+
+        linelist = ["\\begin_inset Index", "status collapsed", "\\begin_layout Standard", ""] + \
+                   linelist + ["\\end_layout"]
+        document.body[i : j] = linelist
+        i += len(linelist) - (j - i)
  
  
  def revert_latexcommand_index(document):
@@ -1064,7 +1121,7 @@ def revert_latexcommand_index(document):
          if j == -1:
            return
  
-        content = lyx2latex(document.body[i:j])
+        content = lyx2latex(document, document.body[i:j])
          # escape quotes
          content = content.replace('"', r'\"')
          document.body[i:j] = ["\\begin_inset CommandInset index", "LatexCommand index",
@@ -1187,7 +1244,16 @@ def revert_inset_info(document):
          arg = ''
          for k in range(i, j+1):
              if document.body[k].startswith("arg"):
-                arg = document.body[k][3:].strip().strip('"')
+                arg = document.body[k][3:].strip()
+                # remove enclosing quotation marks
+                if arg[0] == '"':
+                    arg = arg[1:]
+                if arg[len(arg) - 1] == '"':
+                    arg = arg[:len(arg) - 1]
+                # \" to straight quote
+                arg = arg.replace(r'\"', '"')
+                # \\ to \backslash
+                arg = arg.replace(r'\\', "\\backslash\n")
              if document.body[k].startswith("type"):
                  type = document.body[k][4:].strip().strip('"')
          # I think there is a newline after \\end_inset, which should be removed.
@@ -1260,13 +1326,13 @@ def convert_url(document):
        j = find_token(document.body, "target", i)
        if j == -1:
          document.warning("Malformed LyX document: Can't find target for url inset")
-        i = j
+        i += 1
          continue
        target = document.body[j][8:-1]
        k = find_token(document.body, "\\end_inset", j)
        if k == -1:
          document.warning("Malformed LyX document: Can't find end of url inset")
-        i = k
+        i = j
          continue
        newstuff = ["\\begin_inset Flex URL",
          "status collapsed", "",
@@ -1276,7 +1342,7 @@ def convert_url(document):
          "\\end_layout",
          ""]
        document.body[i:k] = newstuff
-      i = k
+      i = i + len(newstuff)
  
  def convert_ams_classes(document):
    tc = document.textclass
@@ -1307,7 +1373,8 @@ def convert_ams_classes(document):
        return
      m = r.match(document.body[i])
      if m == None:
-      document.warning("Weirdly formed \\begin_layout at line %d of body!" % i)
+      # This is an empty layout
+      # document.warning("Weirdly formed \\begin_layout at line %d of body!" % i)
        i += 1
        continue
      m = m.group(1)
@@ -1398,11 +1465,6 @@ def revert_include(document):
      if i == -1:
        return
      nextline = i + 1
-    if r0.match(document.body[nextline]):
-      previewline = document.body[nextline]
-      nextline += 1
-    else:
-      previewline = ""
      m = r1.match(document.body[nextline])
      if m == None:
        document.warning("Malformed LyX document: No LatexCommand line for `" +
@@ -1411,6 +1473,11 @@ def revert_include(document):
        continue
      cmd = m.group(1)
      nextline += 1
+    if r0.match(document.body[nextline]):
+      previewline = document.body[nextline]
+      nextline += 1
+    else:
+      previewline = ""
      m = r2.match(document.body[nextline])
      if m == None:
        document.warning("Malformed LyX document: No filename line for `" + \
@@ -1504,6 +1571,44 @@ def convert_usorbian(document):
          j = j + 1
  
  
+def convert_macro_global(document):
+    "Remove TeX code command \global when it is in front of a macro"
+    # math macros are nowadays already defined \global, so that an additional
+    # \global would make the document uncompilable, see
+    # http://bugzilla.lyx.org/show_bug.cgi?id=5371
+    # We're looking for something like this:
+    # \begin_inset ERT
+    # status collapsed
+    #
+    # \begin_layout Plain Layout
+    #
+    #
+    # \backslash
+    # global
+    # \end_layout
+    #
+    # \end_inset
+    #
+    #
+    # \begin_inset FormulaMacro
+    # \renewcommand{\foo}{123}
+    # \end_inset
+    i = 0
+    while True:
+        i = find_token(document.body, "\\begin_inset FormulaMacro", i)
+        if i == -1:
+            return
+        # if i < 13, then there isn't enough room for the 13-line ERT
+        if i <= 12:
+            i += 1
+            continue
+        if document.body[i-6] == "global":
+            del document.body[i-13 : i]
+            i = i - 12
+        else:
+            i += 1
+
+
  def revert_macro_optional_params(document):
      "Convert macro definitions with optional parameters into ERTs"
      # Stub to convert macro definitions with one or more optional parameters
@@ -1614,7 +1719,7 @@ def convert_framed_notes(document):
                   'position "t"',
                   'hor_pos "c"',
                   'has_inner_box 0',
-                 'inner_pos "t"', 
+                 'inner_pos "t"',
                   'use_parbox 0',
                   'width "100col%"',
                   'special "none"',
@@ -1724,40 +1829,45 @@ def revert_framed_notes(document):
  
  def revert_slash(document):
      'Revert \\SpecialChar \\slash{} to ERT'
-    r = re.compile(r'\\SpecialChar \\slash{}')
      i = 0
      while i < len(document.body):
-        m = r.match(document.body[i])
+        m = re.match(r'(.*)\\SpecialChar \\slash{}(.*)', document.body[i])
          if m:
-          subst = ['\\begin_inset ERT',
-                   'status collapsed', '',
-                   '\\begin_layout Standard',
-                   '', '', '\\backslash',
-                   'slash{}',
-                   '\\end_layout', '',
-                   '\\end_inset', '']
-          document.body[i: i+1] = subst
-          i = i + len(subst)
+            before = m.group(1)
+            after = m.group(2)
+            subst = [before,
+                     '\\begin_inset ERT',
+                     'status collapsed', '',
+                     '\\begin_layout Standard',
+                     '', '', '\\backslash',
+                     'slash{}',
+                     '\\end_layout', '',
+                     '\\end_inset', '',
+                     after]
+            document.body[i: i+1] = subst
+            i = i + len(subst)
          else:
-          i = i + 1
+            i = i + 1
  
  
  def revert_nobreakdash(document):
      'Revert \\SpecialChar \\nobreakdash- to ERT'
      i = 0
      while i < len(document.body):
-        line = document.body[i]
-        r = re.compile(r'\\SpecialChar \\nobreakdash-')
-        m = r.match(line)
+        m = re.match(r'(.*)\\SpecialChar \\nobreakdash-(.*)', document.body[i])
          if m:
-            subst = ['\\begin_inset ERT',
+            before = m.group(1)
+            after = m.group(2)
+            subst = [before,
+                     '\\begin_inset ERT',
                      'status collapsed', '',
                      '\\begin_layout Standard', '', '',
                      '\\backslash',
                      'nobreakdash-',
                      '\\end_layout', '',
-                    '\\end_inset', '']
-            document.body[i:i+1] = subst
+                    '\\end_inset', '',
+                     after]
+            document.body[i: i+1] = subst
              i = i + len(subst)
              j = find_token(document.header, "\\use_amsmath", 0)
              if j == -1:
@@ -1770,7 +1880,7 @@ def revert_nobreakdash(document):
  
  #Returns number of lines added/removed
  def revert_nocite_key(body, start, end):
-    'key "..." -> \nocite{...}' 
+    'key "..." -> \nocite{...}'
      r = re.compile(r'^key "(.*)"')
      i = start
      j = end
@@ -1940,17 +2050,17 @@ def revert_rotfloat(document):
          subst = ['\\begin_layout Standard',
                    '\\begin_inset ERT',
                    'status collapsed', '',
-                  '\\begin_layout Standard', '', '', 
+                  '\\begin_layout Standard', '', '',
                    '\\backslash', '',
                    'end{sideways' + floattype + '}',
                    '\\end_layout', '', '\\end_inset']
          document.body[j : j+1] = subst
          addedLines = len(subst) - 1
          del document.body[i+1 : l]
-        addedLines -= (l-1) - (i+1) 
+        addedLines -= (l-1) - (i+1)
          subst = ['\\begin_inset ERT', 'status collapsed', '',
-                  '\\begin_layout Standard', '', '', '\\backslash', 
-                  'begin{sideways' + floattype + '}', 
+                  '\\begin_layout Standard', '', '', '\\backslash',
+                  'begin{sideways' + floattype + '}',
                    '\\end_layout', '', '\\end_inset', '',
                    '\\end_layout', '']
          document.body[i : i+1] = subst
@@ -1999,10 +2109,10 @@ def revert_widesideways(document):
          if l == -1:
              document.warning("Malformed LyX document: Missing `\\begin_layout' in Float inset.")
              return
-        subst = ['\\begin_layout Standard', '\\begin_inset ERT', 
-                  'status collapsed', '', 
+        subst = ['\\begin_layout Standard', '\\begin_inset ERT',
+                  'status collapsed', '',
                    '\\begin_layout Standard', '', '', '\\backslash',
-                  'end{sideways' + floattype + '*}', 
+                  'end{sideways' + floattype + '*}',
                    '\\end_layout', '', '\\end_inset']
          document.body[j : j+1] = subst
          addedLines = len(subst) - 1
@@ -2047,6 +2157,7 @@ def convert_subfig(document):
      " Convert subfigures to subfloats. "
      i = 0
      while 1:
+        addedLines = 0
          i = find_token(document.body, '\\begin_inset Graphics', i)
          if i == -1:
              return
@@ -2061,17 +2172,17 @@ def convert_subfig(document):
              continue
          l = find_token(document.body, '\tsubcaptionText', i, endInset)
          if l == -1:
-            document.warning("Malformed lyx document: Can't find subcaptionText!")
-            i = endInset
-            continue
-        caption = document.body[l][16:].strip('"')
-        del document.body[l]
+            caption = ""
+        else:
+            caption = document.body[l][16:].strip('"')
+            del document.body[l]
+            addedLines -= 1
          del document.body[k]
-        addedLines = -2
-        subst = ['\\begin_inset Float figure', 'wide false', 'sideways false', 
-                 'status open', '', '\\begin_layout Plain Layout', '\\begin_inset Caption', 
-                 '', '\\begin_layout Plain Layout'] + latex2lyx(caption) + \
-                 [ '\\end_layout', '', '\\end_inset', '', 
+        addedLines -= 1
+        subst = ['\\begin_inset Float figure', 'wide false', 'sideways false',
+                 'status open', '', '\\begin_layout Plain Layout', '\\begin_inset Caption',
+                 '', '\\begin_layout Plain Layout'] + latex2lyx(caption, False) + \
+                 [ '\\end_layout', '', '\\end_inset', '',
                   '\\end_layout', '', '\\begin_layout Plain Layout']
          document.body[i : i] = subst
          addedLines += len(subst)
@@ -2104,11 +2215,25 @@ def revert_subfig(document):
              k = find_token(document.body, '\\begin_inset Float ', i + 1, j)
              if k == -1:
                  break
+            # is the subfloat aligned?
+            al = find_token(document.body, '\\align ', k - 1, j)
+            alignment_beg = ""
+            alignment_end = ""
+            if al != -1:
+                if get_value(document.body, '\\align', al) == "center":
+                    alignment_beg = "\\backslash\nbegin{centering}"
+                    alignment_end = "\\backslash\npar\\backslash\nend{centering}"
+                elif get_value(document.body, '\\align', al) == "left":
+                    alignment_beg = "\\backslash\nbegin{raggedright}"
+                    alignment_end = "\\backslash\npar\\backslash\nend{raggedright}"
+                elif get_value(document.body, '\\align', al) == "right":
+                    alignment_beg = "\\backslash\nbegin{raggedleft}"
+                    alignment_end = "\\backslash\npar\\backslash\nend{raggedleft}"
              l = find_end_of_inset(document.body, k)
              if l == -1:
                  document.warning("Malformed lyx document: Missing '\\end_inset' (embedded float).")
                  i += 1
-                j == -1
+                j = -1
                  continue # escape to the outer loop
              m = find_default_layout(document, k + 1, l)
              # caption?
@@ -2160,13 +2285,15 @@ def revert_subfig(document):
                          continue
                      elif line in document.body[opt:optend]:
                          continue
-                    elif not line.startswith('\\'):
-                        caption += line.strip()
+                    else:
+                        inert = True
+                        caption += lyxline2latex(document, line, inert)
                  if len(label) > 0:
-                    caption += "\\backslash\nlabel{" + label + "}"
-            subst = '\\begin_layout Plain Layout\n\\begin_inset ERT\nstatus collapsed\n\n' \
-                      '\\begin_layout Plain Layout\n\n}\n\\end_layout\n\n\\end_inset\n\n' \
-                      '\\end_layout\n\n\\begin_layout Plain Layout\n'
+                    caption += "\n\\backslash\nlabel{" + label + "}"
+            subst = '\\begin_layout PlainLayout\n\\begin_inset ERT\nstatus collapsed\n\n' \
+                      '\\begin_layout PlainLayout\n\n}' + alignment_end + \
+                      '\n\\end_layout\n\n\\end_inset\n\n' \
+                      '\\end_layout\n\n\\begin_layout PlainLayout\n'
              subst = subst.split('\n')
              document.body[l : l+1] = subst
              addedLines = len(subst) - 1
@@ -2177,7 +2304,7 @@ def revert_subfig(document):
              del document.body[k+1:m-1]
              addedLines -= (m - 1 - (k + 1))
              insertion = '\\begin_inset ERT\nstatus collapsed\n\n' \
-                        '\\begin_layout Plain Layout\n\n\\backslash\n' \
+                        '\\begin_layout PlainLayout\n\n' + alignment_beg + '\n\\backslash\n' \
                          'subfloat'
              if len(shortcap) > 0:
                  insertion = insertion + "[" + shortcap + "]"
@@ -2187,6 +2314,10 @@ def revert_subfig(document):
              insertion = insertion.split('\n')
              document.body[k : k + 1] = insertion
              addedLines += len(insertion) - 1
+            al = find_token(document.body, '\\align ', k - 1, j + addedLines)
+            if al != -1:
+                del document.body[al]
+                addedLines -= 1
              add_to_preamble(document, ['\\usepackage{subfig}\n'])
          i += addedLines + 1
  
@@ -2204,11 +2335,12 @@ def revert_wrapplacement(document):
              document.warning("Malformed LyX document: Couldn't find placement parameter of wrap float.")
              i += 1
              continue
-        r = re.compile("placement (o|i|l|r)")
+        r = re.compile("placement (o|i|l|r|O|I|L|R)")
          m = r.match(document.body[j])
          if m == None:
              document.warning("Malformed LyX document: Placement option isn't O|I|R|L!")
-        document.body[j] = "placement " + m.group(1).lower()
+        else:
+            document.body[j] = "placement " + m.group(1).lower()
          i = j
  
  
@@ -2797,7 +2929,7 @@ def remove_fontsCJK(document):
  
  
  def convert_plain_layout(document):
-    " Convert 'PlainLayout' to 'Plain Layout'" 
+    " Convert 'PlainLayout' to 'Plain Layout'"
      i = 0
      while True:
          i = find_token(document.body, '\\begin_layout PlainLayout', i)
@@ -2809,7 +2941,7 @@ def convert_plain_layout(document):
  
  
  def revert_plain_layout(document):
-    " Convert 'PlainLayout' to 'Plain Layout'" 
+    " Revert 'Plain Layout' to 'PlainLayout'"
      i = 0
      while True:
          i = find_token(document.body, '\\begin_layout Plain Layout', i)
@@ -2821,7 +2953,7 @@ def revert_plain_layout(document):
  
  
  def revert_plainlayout(document):
-    " Convert 'PlainLayout' to 'Plain Layout'" 
+    " Revert 'PlainLayout' to 'Standard'"
      i = 0
      while True:
          i = find_token(document.body, '\\begin_layout PlainLayout', i)
@@ -2852,6 +2984,140 @@ def revert_polytonicgreek(document):
          j = j + 1
  
  
+def revert_removed_modules(document):
+    """ Strip the removed-modules sections from the document header.
+
+    Every line found for the begin token is deleted together with all lines
+    up to and including the end line reported by find_end_of. Processing
+    stops at the first section whose end cannot be located.
+    """
+    opener = "\\begin_remove_modules"
+    closer = "\\end_remove_modules"
+    header = document.header
+    first = find_token(header, opener, 0)
+    while first != -1:
+        last = find_end_of(header, first, opener, closer)
+        if last == -1:
+            # this should not happen
+            return
+        del header[first : last + 1]
+        # the following lines moved up, so search again from the same index
+        first = find_token(header, opener, first)
+
+
+def add_plain_layout(document):
+    " Name every bare begin_layout line in the body 'Plain Layout' "
+    body = document.body
+    pos = find_token(body, "\\begin_layout", 0)
+    while pos != -1:
+        # a single word on the line means no layout name was given
+        words = body[pos].split()
+        if len(words) == 1:
+            body[pos] = "\\begin_layout Plain Layout"
+        pos = find_token(body, "\\begin_layout", pos + 1)
+
+
+def revert_tabulators(document):
+    " Replace the tabulators by 4 spaces in every body line found for a tab token "
+    body = document.body
+    four_spaces = "    "
+    pos = find_token(body, "\t", 0)
+    while pos != -1:
+        # all tabulators of the reported line are expanded at once
+        body[pos] = body[pos].replace("\t", four_spaces)
+        pos = find_token(body, "\t", pos + 1)
+
+
+def revert_tabsize(document):
+    """ Revert the tabsize parameter of listings.
+
+    A body line found for the token 'lstparams "tabsize=4"' (tabsize is the
+    only parameter) is deleted. In every other lstparams line a
+    ',tabsize=...' entry is cut out, keeping the parameters before and
+    after it. Lines without such an entry are left untouched.
+    """
+    body = document.body
+    # either it is the only parameter: drop the whole line
+    only = 'lstparams "tabsize=4"'
+    i = find_token(body, only, 0)
+    while i != -1:
+        del body[i]
+        # search again from the same index, the next line moved into it
+        i = find_token(body, only, i)
+    # or it follows other parameters: remove just that entry
+    # NOTE(review): a tabsize entry that comes first and is followed by
+    # further parameters has no leading comma and stays in place.
+    j = find_token(body, "lstparams", 0)
+    while j != -1:
+        line = body[j]
+        pos = line.find(",tabsize=")
+        # find() returns -1 when absent; slicing with it would chop the line
+        if pos != -1:
+            # the value ends at the next comma or at the closing quote
+            end = pos + 1
+            while end < len(line) and line[end] not in ',"':
+                end += 1
+            # re-add the closing quote if the line ended inside the value
+            body[j] = line[:pos] + (line[end:] or '"')
+        j = find_token(body, "lstparams", j + 1)
+
+
+def revert_mongolian(document):
+    """ Set language Mongolian to English.
+
+    Switches the document language and its header line when the document
+    language is mongolian, then rewrites the language switches in the body.
+    """
+    if document.language == "mongolian":
+        document.language = "english"
+        lang_line = find_token(document.header, "\\language", 0)
+        if lang_line != -1:
+            document.header[lang_line] = "\\language english"
+    old_switch = "\\lang mongolian"
+    new_switch = "\\lang english"
+    body = document.body
+    pos = find_token(body, old_switch, 0)
+    while pos != -1:
+        body[pos] = body[pos].replace(old_switch, new_switch)
+        pos = find_token(body, old_switch, pos + 1)
+
+
+def revert_default_options(document):
+    ' Delete the first use_default_options line of the header, if any '
+    header = document.header
+    pos = find_token(header, "\\use_default_options", 0)
+    if pos == -1:
+        # nothing to remove
+        return
+    del header[pos]
+
+
+def convert_default_options(document):
+    """ Add param use_default_options and set it to false.
+
+    The new line is inserted directly before the textclass line of the
+    header; a warning is issued instead when that line is missing.
+    """
+    header = document.header
+    pos = find_token(header, "\\textclass", 0)
+    if pos != -1:
+        header.insert(pos, '\\use_default_options false')
+    else:
+        document.warning("Malformed LyX document: Missing `\\textclass'.")
+
+
+def revert_backref_options(document):
+    ' Turn the header option pdf_backref page back into pdf_pagebackref true '
+    header = document.header
+    pos = find_token(header, "\\pdf_backref page", 0)
+    if pos == -1:
+        # option not set, the header stays as it is
+        return
+    header[pos] = "\\pdf_pagebackref true"
+
+
+def convert_backref_options(document):
+    """ Replace the header option pdf_pagebackref by pdf_backref.
+
+    'pdf_pagebackref true' becomes 'pdf_backref page' and
+    'pdf_pagebackref false' is removed. An existing 'pdf_backref true' line
+    is then deleted in the first case and set to 'pdf_backref section' in
+    the second one.
+    """
+    header = document.header
+    page_on = find_token(header, "\\pdf_pagebackref true", 0)
+    if page_on != -1:
+        header[page_on] = "\\pdf_backref page"
+    page_off = find_token(header, "\\pdf_pagebackref false", 0)
+    if page_off != -1:
+        del header[page_off]
+    # backref=true was not a valid option, we meant backref=section
+    # (looked up only now, so the index accounts for the deletion above)
+    backref = find_token(header, "\\pdf_backref true", 0)
+    if backref == -1:
+        return
+    if page_on != -1:
+        del header[backref]
+    elif page_off != -1:
+        header[backref] = "\\pdf_backref section"
+
+
+def convert_charstyle_element(document):
+    " Rename Flex CharStyle: insets to Flex Element: (docbook backend only) "
+    if document.backend == "docbook":
+        old_inset = '\\begin_inset Flex CharStyle:'
+        new_inset = '\\begin_inset Flex Element:'
+        body = document.body
+        pos = find_token(body, old_inset, 0)
+        while pos != -1:
+            body[pos] = body[pos].replace(old_inset, new_inset)
+            # search again from the same index: the rewritten line no
+            # longer contains the old token
+            pos = find_token(body, old_inset, pos)
+
+def revert_charstyle_element(document):
+    " Rename Flex Element: insets back to Flex CharStyle: (docbook backend only) "
+    if document.backend == "docbook":
+        old_inset = '\\begin_inset Flex Element:'
+        new_inset = '\\begin_inset Flex CharStyle:'
+        body = document.body
+        pos = find_token(body, old_inset, 0)
+        while pos != -1:
+            body[pos] = body[pos].replace(old_inset, new_inset)
+            # search again from the same index: the rewritten line no
+            # longer contains the old token
+            pos = find_token(body, old_inset, pos)
+
  ##
  # Conversion hub
  #
@@ -2878,7 +3144,7 @@ convert = [[277, [fix_wrong_tables]],
             [295, [convert_htmlurl, convert_url]],
             [296, [convert_include]],
             [297, [convert_usorbian]],
-           [298, []],
+           [298, [convert_macro_global]],
             [299, []],
             [300, []],
             [301, []],
@@ -2919,9 +3185,23 @@ convert = [[277, [fix_wrong_tables]],
             [336, []],
             [337, [convert_display_enum]],
             [338, []],
+           [339, []],
+           [340, [add_plain_layout]],
+           [341, []],
+           [342, []],
+           [343, [convert_default_options]],
+           [344, [convert_backref_options]],
+           [345, [convert_charstyle_element]]
            ]
  
-revert =  [[337, [revert_polytonicgreek]],
+revert =  [[344, [revert_charstyle_element]],
+           [343, [revert_backref_options]],
+           [342, [revert_default_options]],
+           [341, [revert_mongolian]],
+           [340, [revert_tabulators, revert_tabsize]],
+           [339, []],
+           [338, [revert_removed_modules]],
+           [337, [revert_polytonicgreek]],
             [336, [revert_display_enum]],
             [335, [remove_fontsCJK]],
             [334, [revert_InsetSpace]],