lib/lyx2lyx/lyx_2_0.py

   1 # -*- coding: utf-8 -*-
   2 # This file is part of lyx2lyx
   3 # -*- coding: utf-8 -*-
   4 # Copyright (C) 2010 The LyX team
   5 #
   6 # This program is free software; you can redistribute it and/or
   7 # modify it under the terms of the GNU General Public License
   8 # as published by the Free Software Foundation; either version 2
   9 # of the License, or (at your option) any later version.
  10 #
  11 # This program is distributed in the hope that it will be useful,
  12 # but WITHOUT ANY WARRANTY; without even the implied warranty of
  13 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  14 # GNU General Public License for more details.
  15 #
  16 # You should have received a copy of the GNU General Public License
  17 # along with this program; if not, write to the Free Software
  18 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
  19
  20 """ Convert files to the file format generated by lyx 2.0"""
  21
  22 import re, string
  23 import unicodedata
  24 import sys, os
  25
  26 from parser_tools import find_token, find_end_of, find_tokens, \
  27   find_token_exact, find_end_of_inset, find_end_of_layout, \
  28   find_token_backwards, is_in_inset, get_value, get_quoted_value, \
  29   del_token, check_token
  30
  31 from lyx2lyx_tools import add_to_preamble, insert_to_preamble, \
  32   put_cmd_in_ert, lyx2latex, latex_length, revert_flex_inset, \
  33   revert_font_attrs, hex2ratio, str2bool
  34
  35 ####################################################################
  36 # Private helper functions
  37
  38 def remove_option(lines, m, option):
  39     ''' removes option from line m. returns whether we did anything '''
  40     l = lines[m].find(option)
  41     if l == -1:
  42         return False
  43     val = lines[m][l:].split('"')[1]
  44     lines[m] = lines[m][:l - 1] + lines[m][l+len(option + '="' + val + '"'):]
  45     return True
  46
  47
  48 # DO NOT USE THIS ROUTINE ANY MORE. Better yet, replace the uses that
  49 # have been made of it with uses of put_cmd_in_ert.
  50 def old_put_cmd_in_ert(string):
  51     for rep in unicode_reps:
  52         string = string.replace(rep[1], rep[0].replace('\\\\', '\\'))
  53     string = string.replace('\\', "\\backslash\n")
  54     string = "\\begin_inset ERT\nstatus collapsed\n\\begin_layout Plain Layout\n" \
  55       + string + "\n\\end_layout\n\\end_inset"
  56     return string
  57
  58
  59 ###############################################################################
  60 ###
  61 ### Conversion and reversion routines
  62 ###
  63 ###############################################################################
  64
  65 def revert_swiss(document):
  66     " Set language german-ch to ngerman "
  67     i = 0
  68     if document.language == "german-ch":
  69         document.language = "ngerman"
  70         i = find_token(document.header, "\\language", 0)
  71         if i != -1:
  72             document.header[i] = "\\language ngerman"
  73     j = 0
  74     while True:
  75         j = find_token(document.body, "\\lang german-ch", j)
  76         if j == -1:
  77             return
  78         document.body[j] = document.body[j].replace("\\lang german-ch", "\\lang ngerman")
  79         j = j + 1
  80
  81
  82 def revert_tabularvalign(document):
  83    " Revert the tabular valign option "
  84    i = 0
  85    while True:
  86       i = find_token(document.body, "\\begin_inset Tabular", i)
  87       if i == -1:
  88           return
  89       end = find_end_of_inset(document.body, i)
  90       if end == -1:
  91           document.warning("Can't find end of inset at line " + str(i))
  92           i += 1
  93           continue
  94       fline = find_token(document.body, "<features", i, end)
  95       if fline == -1:
  96           document.warning("Can't find features for inset at line " + str(i))
  97           i += 1
  98           continue
  99       p = document.body[fline].find("islongtable")
 100       if p != -1:
 101           q = document.body[fline].find("tabularvalignment")
 102           if q != -1:
 103               # FIXME
 104               # This seems wrong: It removes everything after
 105               # tabularvalignment, too.
 106               document.body[fline] = document.body[fline][:q - 1] + '>'
 107           i += 1
 108           continue
 109
 110        # no longtable
 111       tabularvalignment = 'c'
 112       # which valignment is specified?
 113       m = document.body[fline].find('tabularvalignment="top"')
 114       if m != -1:
 115           tabularvalignment = 't'
 116       m = document.body[fline].find('tabularvalignment="bottom"')
 117       if m != -1:
 118           tabularvalignment = 'b'
 119       # delete tabularvalignment
 120       q = document.body[fline].find("tabularvalignment")
 121       if q != -1:
 122           # FIXME
 123           # This seems wrong: It removes everything after
 124           # tabularvalignment, too.
 125           document.body[fline] = document.body[fline][:q - 1] + '>'
 126
 127       # don't add a box when centered
 128       if tabularvalignment == 'c':
 129           i = end
 130           continue
 131       subst = ['\\end_layout', '\\end_inset']
 132       document.body[end:end] = subst # just inserts those lines
 133       subst = ['\\begin_inset Box Frameless',
 134           'position "' + tabularvalignment +'"',
 135           'hor_pos "c"',
 136           'has_inner_box 1',
 137           'inner_pos "c"',
 138           'use_parbox 0',
 139           # we don't know the width, assume 50%
 140           'width "50col%"',
 141           'special "none"',
 142           'height "1in"',
 143           'height_special "totalheight"',
 144           'status open',
 145           '',
 146           '\\begin_layout Plain Layout']
 147       document.body[i:i] = subst # this just inserts the array at i
 148       # since there could be a tabular inside a tabular, we cannot
 149       # jump to end
 150       i += len(subst)
 151
 152
 153 def revert_phantom_types(document, ptype, cmd):
 154     " Reverts phantom to ERT "
 155     i = 0
 156     while True:
 157       i = find_token(document.body, "\\begin_inset Phantom " + ptype, i)
 158       if i == -1:
 159           return
 160       end = find_end_of_inset(document.body, i)
 161       if end == -1:
 162           document.warning("Can't find end of inset at line " + str(i))
 163           i += 1
 164           continue
 165       blay = find_token(document.body, "\\begin_layout Plain Layout", i, end)
 166       if blay == -1:
 167           document.warning("Can't find layout for inset at line " + str(i))
 168           i = end
 169           continue
 170       bend = find_end_of_layout(document.body, blay)
 171       if bend == -1:
 172           document.warning("Malformed LyX document: Could not find end of Phantom inset's layout.")
 173           i = end
 174           continue
 175       substi = ["\\begin_inset ERT", "status collapsed", "",
 176                 "\\begin_layout Plain Layout", "", "", "\\backslash",
 177                 cmd + "{", "\\end_layout", "", "\\end_inset"]
 178       substj = ["\\size default", "", "\\begin_inset ERT", "status collapsed", "",
 179                 "\\begin_layout Plain Layout", "", "}", "\\end_layout", "", "\\end_inset"]
 180       # do the later one first so as not to mess up the numbering
 181       document.body[bend:end + 1] = substj
 182       document.body[i:blay + 1] = substi
 183       i = end + len(substi) + len(substj) - (end - bend) - (blay - i) - 2
 184
 185
 186 def revert_phantom(document):
 187     revert_phantom_types(document, "Phantom", "phantom")
 188
 189 def revert_hphantom(document):
 190     revert_phantom_types(document, "HPhantom", "hphantom")
 191
 192 def revert_vphantom(document):
 193     revert_phantom_types(document, "VPhantom", "vphantom")
 194
 195
 196 def revert_xetex(document):
 197     " Reverts documents that use XeTeX "
 198
 199     i = find_token(document.header, '\\use_xetex', 0)
 200     if i == -1:
 201         document.warning("Malformed LyX document: Missing \\use_xetex.")
 202         return
 203     if not str2bool(get_value(document.header, "\\use_xetex", i)):
 204         del document.header[i]
 205         return
 206     del document.header[i]
 207
 208     # 1.) set doc encoding to utf8-plain
 209     i = find_token(document.header, "\\inputencoding", 0)
 210     if i == -1:
 211         document.warning("Malformed LyX document: Missing \\inputencoding.")
 212     else:
 213         document.header[i] = "\\inputencoding utf8-plain"
 214
 215     # 2.) check font settings
 216     # defaults
 217     roman = sans = typew = default
 218     osf = False
 219     sf_scale = tt_scale = 100.0
 220
 221     i = find_token(document.header, "\\font_roman", 0)
 222     if i == -1:
 223         document.warning("Malformed LyX document: Missing \\font_roman.")
 224     else:
 225         roman = get_value(document.header, "\\font_roman", i)
 226         document.header[i] = "\\font_roman default"
 227
 228     i = find_token(document.header, "\\font_sans", 0)
 229     if i == -1:
 230         document.warning("Malformed LyX document: Missing \\font_sans.")
 231     else:
 232         sans = get_value(document.header, "\\font_sans", i)
 233         document.header[i] = "\\font_sans default"
 234
 235     i = find_token(document.header, "\\font_typewriter", 0)
 236     if i == -1:
 237         document.warning("Malformed LyX document: Missing \\font_typewriter.")
 238     else:
 239         typew = get_value(document.header, "\\font_typewriter", i)
 240         document.header[i] = "\\font_typewriter default"
 241
 242     i = find_token(document.header, "\\font_osf", 0)
 243     if i == -1:
 244         document.warning("Malformed LyX document: Missing \\font_osf.")
 245     else:
 246         osf = str2bool(get_value(document.header, "\\font_osf", i))
 247         document.header[i] = "\\font_osf false"
 248
 249     i = find_token(document.header, "\\font_sc", 0)
 250     if i == -1:
 251         document.warning("Malformed LyX document: Missing \\font_sc.")
 252     else:
 253         # we do not need this value.
 254         document.header[i] = "\\font_sc false"
 255
 256     i = find_token(document.header, "\\font_sf_scale", 0)
 257     if i == -1:
 258         document.warning("Malformed LyX document: Missing \\font_sf_scale.")
 259     else:
 260       val = get_value(document.header, '\\font_sf_scale', i)
 261       try:
 262         # float() can throw
 263         sf_scale = float(val)
 264       except:
 265         document.warning("Invalid font_sf_scale value: " + val)
 266       document.header[i] = "\\font_sf_scale 100"
 267
 268     i = find_token(document.header, "\\font_tt_scale", 0)
 269     if i == -1:
 270         document.warning("Malformed LyX document: Missing \\font_tt_scale.")
 271     else:
 272         val = get_value(document.header, '\\font_tt_scale', i)
 273         try:
 274           # float() can throw
 275           tt_scale = float(val)
 276         except:
 277           document.warning("Invalid font_tt_scale value: " + val)
 278         document.header[i] = "\\font_tt_scale 100"
 279
 280     # 3.) set preamble stuff
 281     pretext = ['%% This document must be processed with xelatex!']
 282     pretext.append('\\usepackage{fontspec}')
 283     if roman != "default":
 284         pretext.append('\\setmainfont[Mapping=tex-text]{' + roman + '}')
 285     if sans != "default":
 286         sf = '\\setsansfont['
 287         if sf_scale != 100.0:
 288             sf += 'Scale=' + str(sf_scale / 100.0) + ','
 289         sf += 'Mapping=tex-text]{' + sans + '}'
 290         pretext.append(sf)
 291     if typewriter != "default":
 292         tw = '\\setmonofont'
 293         if tt_scale != 100.0:
 294             tw += '[Scale=' + str(tt_scale / 100.0) + ']'
 295         tw += '{' + typewriter + '}'
 296         pretext.append(tw)
 297     if osf:
 298         pretext.append('\\defaultfontfeatures{Numbers=OldStyle}')
 299     pretext.append('\usepackage{xunicode}')
 300     pretext.append('\usepackage{xltxtra}')
 301     insert_to_preamble(document, pretext)
 302
 303
 304 def revert_outputformat(document):
 305     " Remove default output format param "
 306
 307     if not del_token(document.header, '\\default_output_format', 0):
 308         document.warning("Malformed LyX document: Missing \\default_output_format.")
 309
 310
 311 def revert_backgroundcolor(document):
 312     " Reverts background color to preamble code "
 313     i = find_token(document.header, "\\backgroundcolor", 0)
 314     if i == -1:
 315         return
 316     colorcode = get_value(document.header, '\\backgroundcolor', i)
 317     del document.header[i]
 318     # don't clutter the preamble if backgroundcolor is not set
 319     if colorcode == "#ffffff":
 320         return
 321     red   = hex2ratio(colorcode[1:3])
 322     green = hex2ratio(colorcode[3:5])
 323     blue  = hex2ratio(colorcode[5:7])
 324     insert_to_preamble(document, \
 325         ['% To set the background color',
 326         '\\@ifundefined{definecolor}{\\usepackage{color}}{}',
 327         '\\definecolor{page_backgroundcolor}{rgb}{' + red + ',' + green + ',' + blue + '}',
 328         '\\pagecolor{page_backgroundcolor}'])
 329
 330
 331 def revert_splitindex(document):
 332     " Reverts splitindex-aware documents "
 333     i = find_token(document.header, '\\use_indices', 0)
 334     if i == -1:
 335         document.warning("Malformed LyX document: Missing \\use_indices.")
 336         return
 337     useindices = str2bool(get_value(document.header, "\\use_indices", i))
 338     del document.header[i]
 339     preamble = []
 340     if useindices:
 341          preamble.append("\\usepackage{splitidx})")
 342
 343     # deal with index declarations in the preamble
 344     i = 0
 345     while True:
 346         i = find_token(document.header, "\\index", i)
 347         if i == -1:
 348             break
 349         k = find_token(document.header, "\\end_index", i)
 350         if k == -1:
 351             document.warning("Malformed LyX document: Missing \\end_index.")
 352             return
 353         if useindices:
 354           line = document.header[i]
 355           l = re.compile(r'\\index (.*)$')
 356           m = l.match(line)
 357           iname = m.group(1)
 358           ishortcut = get_value(document.header, '\\shortcut', i, k)
 359           if ishortcut != "":
 360               preamble.append("\\newindex[" + iname + "]{" + ishortcut + "}")
 361         del document.header[i:k + 1]
 362     if preamble:
 363         insert_to_preamble(document, preamble)
 364
 365     # deal with index insets
 366     # these need to have the argument removed
 367     i = 0
 368     while True:
 369         i = find_token(document.body, "\\begin_inset Index", i)
 370         if i == -1:
 371             break
 372         line = document.body[i]
 373         l = re.compile(r'\\begin_inset Index (.*)$')
 374         m = l.match(line)
 375         itype = m.group(1)
 376         if itype == "idx" or indices == "false":
 377             document.body[i] = "\\begin_inset Index"
 378         else:
 379             k = find_end_of_inset(document.body, i)
 380             if k == -1:
 381                 document.warning("Can't find end of index inset!")
 382                 i += 1
 383                 continue
 384             content = lyx2latex(document, document.body[i:k])
 385             # escape quotes
 386             content = content.replace('"', r'\"')
 387             subst = put_cmd_in_ert("\\sindex[" + itype + "]{" + content + "}")
 388             document.body[i:k + 1] = subst
 389         i = i + 1
 390
 391     # deal with index_print insets
 392     i = 0
 393     while True:
 394         i = find_token(document.body, "\\begin_inset CommandInset index_print", i)
 395         if i == -1:
 396             return
 397         k = find_end_of_inset(document.body, i)
 398         ptype = get_quoted_value(document.body, 'type', i, k)
 399         if ptype == "idx":
 400             j = find_token(document.body, "type", i, k)
 401             del document.body[j]
 402         elif not useindices:
 403             del document.body[i:k + 1]
 404         else:
 405             subst = put_cmd_in_ert("\\printindex[" + ptype + "]{}")
 406             document.body[i:k + 1] = subst
 407         i = i + 1
 408
 409
 410 def convert_splitindex(document):
 411     " Converts index and printindex insets to splitindex-aware format "
 412     i = 0
 413     while True:
 414         i = find_token(document.body, "\\begin_inset Index", i)
 415         if i == -1:
 416             break
 417         document.body[i] = document.body[i].replace("\\begin_inset Index",
 418             "\\begin_inset Index idx")
 419         i = i + 1
 420     i = 0
 421     while True:
 422         i = find_token(document.body, "\\begin_inset CommandInset index_print", i)
 423         if i == -1:
 424             return
 425         if document.body[i + 1].find('LatexCommand printindex') == -1:
 426             document.warning("Malformed LyX document: Incomplete printindex inset.")
 427             return
 428         subst = ["LatexCommand printindex",
 429             "type \"idx\""]
 430         document.body[i + 1:i + 2] = subst
 431         i = i + 1
 432
 433
 434 def revert_subindex(document):
 435     " Reverts \\printsubindex CommandInset types "
 436     i = find_token(document.header, '\\use_indices', 0)
 437     if i == -1:
 438         document.warning("Malformed LyX document: Missing \\use_indices.")
 439         return
 440     useindices = str2bool(get_value(document.header, "\\use_indices", i))
 441     i = 0
 442     while True:
 443         i = find_token(document.body, "\\begin_inset CommandInset index_print", i)
 444         if i == -1:
 445             return
 446         k = find_end_of_inset(document.body, i)
 447         ctype = get_value(document.body, 'LatexCommand', i, k)
 448         if ctype != "printsubindex":
 449             i = k + 1
 450             continue
 451         ptype = get_quoted_value(document.body, 'type', i, k)
 452         if not useindices:
 453             del document.body[i:k + 1]
 454         else:
 455             subst = put_cmd_in_ert("\\printsubindex[" + ptype + "]{}")
 456             document.body[i:k + 1] = subst
 457         i = i + 1
 458
 459
 460 def revert_printindexall(document):
 461     " Reverts \\print[sub]index* CommandInset types "
 462     i = find_token(document.header, '\\use_indices', 0)
 463     if i == -1:
 464         document.warning("Malformed LyX document: Missing \\use_indices.")
 465         return
 466     useindices = str2bool(get_value(document.header, "\\use_indices", i))
 467     i = 0
 468     while True:
 469         i = find_token(document.body, "\\begin_inset CommandInset index_print", i)
 470         if i == -1:
 471             return
 472         k = find_end_of_inset(document.body, i)
 473         ctype = get_value(document.body, 'LatexCommand', i, k)
 474         if ctype != "printindex*" and ctype != "printsubindex*":
 475             i = k
 476             continue
 477         if not useindices:
 478             del document.body[i:k + 1]
 479         else:
 480             subst = put_cmd_in_ert("\\" + ctype + "{}")
 481             document.body[i:k + 1] = subst
 482         i = i + 1
 483
 484
 485 def revert_strikeout(document):
 486   " Reverts \\strikeout font attribute "
 487   changed = revert_font_attrs(document.body, "\\uuline", "\\uuline")
 488   changed = revert_font_attrs(document.body, "\\uwave", "\\uwave") or changed
 489   changed = revert_font_attrs(document.body, "\\strikeout", "\\sout")  or changed
 490   if changed == True:
 491     insert_to_preamble(document, \
 492         ['%  for proper underlining',
 493         '\\PassOptionsToPackage{normalem}{ulem}',
 494         '\\usepackage{ulem}'])
 495
 496
 497 def revert_ulinelatex(document):
 498     " Reverts \\uline font attribute "
 499     i = find_token(document.body, '\\bar under', 0)
 500     if i == -1:
 501         return
 502     insert_to_preamble(document,\
 503             ['%  for proper underlining',
 504             '\\PassOptionsToPackage{normalem}{ulem}',
 505             '\\usepackage{ulem}',
 506             '\\let\\cite@rig\\cite',
 507             '\\newcommand{\\b@xcite}[2][\\%]{\\def\\def@pt{\\%}\\def\\pas@pt{#1}',
 508             '  \\mbox{\\ifx\\def@pt\\pas@pt\\cite@rig{#2}\\else\\cite@rig[#1]{#2}\\fi}}',
 509             '\\renewcommand{\\underbar}[1]{{\\let\\cite\\b@xcite\\uline{#1}}}'])
 510
 511
 512 def revert_custom_processors(document):
 513     " Remove bibtex_command and index_command params "
 514
 515     if not del_token(document.header, '\\bibtex_command', 0):
 516         document.warning("Malformed LyX document: Missing \\bibtex_command.")
 517
 518     if not del_token(document.header, '\\index_command', 0):
 519         document.warning("Malformed LyX document: Missing \\index_command.")
 520
 521
 522 def convert_nomencl_width(document):
 523     " Add set_width param to nomencl_print "
 524     i = 0
 525     while True:
 526       i = find_token(document.body, "\\begin_inset CommandInset nomencl_print", i)
 527       if i == -1:
 528         break
 529       document.body.insert(i + 2, "set_width \"none\"")
 530       i = i + 1
 531
 532
 533 def revert_nomencl_width(document):
 534     " Remove set_width param from nomencl_print "
 535     i = 0
 536     while True:
 537       i = find_token(document.body, "\\begin_inset CommandInset nomencl_print", i)
 538       if i == -1:
 539         break
 540       j = find_end_of_inset(document.body, i)
 541       if not del_token(document.body, "set_width", i, j):
 542         document.warning("Can't find set_width option for nomencl_print!")
 543       i = j
 544
 545
 546 def revert_nomencl_cwidth(document):
 547     " Remove width param from nomencl_print "
 548     i = 0
 549     while True:
 550       i = find_token(document.body, "\\begin_inset CommandInset nomencl_print", i)
 551       if i == -1:
 552         break
 553       j = find_end_of_inset(document.body, i)
 554       l = find_token(document.body, "width", i, j)
 555       if l == -1:
 556         document.warning("Can't find width option for nomencl_print!")
 557         i = j
 558         continue
 559       width = get_quoted_value(document.body, "width", i, j)
 560       del document.body[l]
 561       insert_to_preamble(document, ["\\setlength{\\nomlabelwidth}{" + width + "}"])
 562       i = j - 1
 563
 564
 565 def revert_applemac(document):
 566     " Revert applemac encoding to auto "
 567     if document.encoding != "applemac":
 568       return
 569     document.encoding = "auto"
 570     i = find_token(document.header, "\\encoding", 0)
 571     if i != -1:
 572         document.header[i] = "\\encoding auto"
 573
 574
 575 def revert_longtable_align(document):
 576     " Remove longtable alignment setting "
 577     i = 0
 578     while True:
 579       i = find_token(document.body, "\\begin_inset Tabular", i)
 580       if i == -1:
 581           break
 582       end = find_end_of_inset(document.body, i)
 583       if end == -1:
 584           document.warning("Can't find end of inset at line " + str(i))
 585           i += 1
 586           continue
 587       fline = find_token(document.body, "<features", i, end)
 588       if fline == -1:
 589           document.warning("Can't find features for inset at line " + str(i))
 590           i += 1
 591           continue
 592       j = document.body[fline].find("longtabularalignment")
 593       if j == -1:
 594           i += 1
 595           continue
 596       # FIXME Is this correct? It wipes out everything after the
 597       # one we found.
 598       document.body[fline] = document.body[fline][:j - 1] + '>'
 599       # since there could be a tabular inside this one, we
 600       # cannot jump to end.
 601       i += 1
 602
 603
 604 def revert_branch_filename(document):
 605     " Remove \\filename_suffix parameter from branches "
 606     i = 0
 607     while True:
 608         i = find_token(document.header, "\\filename_suffix", i)
 609         if i == -1:
 610             return
 611         del document.header[i]
 612
 613
 614 def revert_paragraph_indentation(document):
 615     " Revert custom paragraph indentation to preamble code "
 616     i = find_token(document.header, "\\paragraph_indentation", 0)
 617     if i == -1:
 618       return
 619     length = get_value(document.header, "\\paragraph_indentation", i)
 620     # we need only remove the line if indentation is default
 621     if length != "default":
 622       # handle percent lengths
 623       length = latex_length(length)[1]
 624       insert_to_preamble(document, ["\\setlength{\\parindent}{" + length + "}"])
 625     del document.header[i]
 626
 627
 628 def revert_percent_skip_lengths(document):
 629     " Revert relative lengths for paragraph skip separation to preamble code "
 630     i = find_token(document.header, "\\defskip", 0)
 631     if i == -1:
 632         return
 633     length = get_value(document.header, "\\defskip", i)
 634     # only revert when a custom length was set and when
 635     # it used a percent length
 636     if length in ('smallskip', 'medskip', 'bigskip'):
 637         return
 638     # handle percent lengths
 639     percent, length = latex_length(length)
 640     if percent:
 641         insert_to_preamble(document, ["\\setlength{\\parskip}{" + length + "}"])
 642         # set defskip to medskip as default
 643         document.header[i] = "\\defskip medskip"
 644
 645
 646 def revert_percent_vspace_lengths(document):
 647     " Revert relative VSpace lengths to ERT "
 648     i = 0
 649     while True:
 650       i = find_token(document.body, "\\begin_inset VSpace", i)
 651       if i == -1:
 652           break
 653       # only revert if a custom length was set and if
 654       # it used a percent length
 655       r = re.compile(r'\\begin_inset VSpace (.*)$')
 656       m = r.match(document.body[i])
 657       length = m.group(1)
 658       if length in ('defskip', 'smallskip', 'medskip', 'bigskip', 'vfill'):
 659          i += 1
 660          continue
 661       # check if the space has a star (protected space)
 662       protected = (document.body[i].rfind("*") != -1)
 663       if protected:
 664           length = length.rstrip('*')
 665       # handle percent lengths
 666       percent, length = latex_length(length)
 667       # revert the VSpace inset to ERT
 668       if percent:
 669           if protected:
 670               subst = put_cmd_in_ert("\\vspace*{" + length + "}")
 671           else:
 672               subst = put_cmd_in_ert("\\vspace{" + length + "}")
 673           document.body[i:i + 2] = subst
 674       i += 1
 675
 676
 677 def revert_percent_hspace_lengths(document):
 678     " Revert relative HSpace lengths to ERT "
 679     i = 0
 680     while True:
 681       i = find_token_exact(document.body, "\\begin_inset space \\hspace", i)
 682       if i == -1:
 683           break
 684       j = find_end_of_inset(document.body, i)
 685       if j == -1:
 686           document.warning("Can't find end of inset at line " + str(i))
 687           i += 1
 688           continue
 689       # only revert if a custom length was set...
 690       length = get_value(document.body, '\\length', i + 1, j)
 691       if length == '':
 692           document.warning("Malformed lyx document: Missing '\\length' in Space inset.")
 693           i = j
 694           continue
 695       protected = ""
 696       if document.body[i].find("\\hspace*{}") != -1:
 697           protected = "*"
 698       # ...and if it used a percent length
 699       percent, length = latex_length(length)
 700       # revert the HSpace inset to ERT
 701       if percent:
 702           subst = put_cmd_in_ert("\\hspace" + protected + "{" + length + "}")
 703           document.body[i:j + 1] = subst
 704       # if we did a substitution, this will still be ok
 705       i = j
 706
 707
 708 def revert_hspace_glue_lengths(document):
 709     " Revert HSpace glue lengths to ERT "
 710     i = 0
 711     while True:
 712       i = find_token_exact(document.body, "\\begin_inset space \\hspace", i)
 713       if i == -1:
 714           break
 715       j = find_end_of_inset(document.body, i)
 716       if j == -1:
 717           document.warning("Can't find end of inset at line " + str(i))
 718           i += 1
 719           continue
 720       length = get_value(document.body, '\\length', i + 1, j)
 721       if length == '':
 722           document.warning("Malformed lyx document: Missing '\\length' in Space inset.")
 723           i = j
 724           continue
 725       protected = ""
 726       if document.body[i].find("\\hspace*{}") != -1:
 727           protected = "*"
 728       # only revert if the length contains a plus or minus at pos != 0
 729       if length.find('-',1) != -1 or length.find('+',1) != -1:
 730           # handle percent lengths
 731           length = latex_length(length)[1]
 732           # revert the HSpace inset to ERT
 733           subst = put_cmd_in_ert("\\hspace" + protected + "{" + length + "}")
 734           document.body[i:j+1] = subst
 735       i = j
 736
 737
 738 def convert_author_id(document):
 739     " Add the author_id to the \\author definition and make sure 0 is not used"
 740     i = 0
 741     anum = 1
 742     re_author = re.compile(r'(\\author) (\".*\")\s*(.*)$')
 743
 744     while True:
 745         i = find_token(document.header, "\\author", i)
 746         if i == -1:
 747             break
 748         m = re_author.match(document.header[i])
 749         if m:
 750             name = m.group(2)
 751             email = m.group(3)
 752             document.header[i] = "\\author %i %s %s" % (anum, name, email)
 753         anum += 1
 754         i += 1
 755
 756     i = 0
 757     while True:
 758         i = find_token(document.body, "\\change_", i)
 759         if i == -1:
 760             break
 761         change = document.body[i].split(' ');
 762         if len(change) == 3:
 763             type = change[0]
 764             author_id = int(change[1])
 765             time = change[2]
 766             document.body[i] = "%s %i %s" % (type, author_id + 1, time)
 767         i += 1
 768
 769
 770 def revert_author_id(document):
 771     " Remove the author_id from the \\author definition "
 772     i = 0
 773     anum = 0
 774     rx = re.compile(r'(\\author)\s+(\d+)\s+(\".*\")\s*(.*)$')
 775     idmap = dict()
 776
 777     while True:
 778         i = find_token(document.header, "\\author", i)
 779         if i == -1:
 780             break
 781         m = rx.match(document.header[i])
 782         if m:
 783             author_id = int(m.group(2))
 784             idmap[author_id] = anum
 785             name = m.group(3)
 786             email = m.group(4)
 787             document.header[i] = "\\author %s %s" % (name, email)
 788         i += 1
 789         # FIXME Should this be incremented if we didn't match?
 790         anum += 1
 791
 792     i = 0
 793     while True:
 794         i = find_token(document.body, "\\change_", i)
 795         if i == -1:
 796             break
 797         change = document.body[i].split(' ');
 798         if len(change) == 3:
 799             type = change[0]
 800             author_id = int(change[1])
 801             time = change[2]
 802             document.body[i] = "%s %i %s" % (type, idmap[author_id], time)
 803         i += 1
 804
 805
 806 def revert_suppress_date(document):
 807     " Revert suppressing of default document date to preamble code "
 808     i = find_token(document.header, "\\suppress_date", 0)
 809     if i == -1:
 810         return
 811     # remove the preamble line and write to the preamble
 812     # when suppress_date was true
 813     date = str2bool(get_value(document.header, "\\suppress_date", i))
 814     if date:
 815         add_to_preamble(document, ["\\date{}"])
 816     del document.header[i]
 817
 818
 819 def revert_mhchem(document):
 820     "Revert mhchem loading to preamble code"
 821
 822     mhchem = "off"
 823     i = find_token(document.header, "\\use_mhchem", 0)
 824     if i == -1:
 825         document.warning("Malformed LyX document: Could not find mhchem setting.")
 826         mhchem = "auto"
 827     else:
 828         val = get_value(document.header, "\\use_mhchem", i)
 829         if val == "1":
 830             mhchem = "auto"
 831         elif val == "2":
 832             mhchem = "on"
 833         del document.header[i]
 834
 835     if mhchem == "off":
 836       # don't load case
 837       return
 838
 839     if mhchem == "auto":
 840         i = 0
 841         while True:
 842             i = find_token(document.body, "\\begin_inset Formula", i)
 843             if i == -1:
 844                break
 845             line = document.body[i]
 846             if line.find("\\ce{") != -1 or line.find("\\cf{") != -1:
 847               mhchem = "on"
 848               break
 849             i += 1
 850
 851     if mhchem == "on":
 852         pre = ["\\PassOptionsToPackage{version=3}{mhchem}",
 853           "\\usepackage{mhchem}"]
 854         insert_to_preamble(document, pre)
 855
 856
 857 def revert_fontenc(document):
 858     " Remove fontencoding param "
 859     if not del_token(document.header, '\\fontencoding', 0):
 860         document.warning("Malformed LyX document: Missing \\fontencoding.")
 861
 862
 863 def merge_gbrief(document):
 864     " Merge g-brief-en and g-brief-de to one class "
 865
 866     if document.textclass != "g-brief-de":
 867         if document.textclass == "g-brief-en":
 868             document.textclass = "g-brief"
 869             document.set_textclass()
 870         return
 871
 872     obsoletedby = { "Brieftext":       "Letter",
 873                     "Unterschrift":    "Signature",
 874                     "Strasse":         "Street",
 875                     "Zusatz":          "Addition",
 876                     "Ort":             "Town",
 877                     "Land":            "State",
 878                     "RetourAdresse":   "ReturnAddress",
 879                     "MeinZeichen":     "MyRef",
 880                     "IhrZeichen":      "YourRef",
 881                     "IhrSchreiben":    "YourMail",
 882                     "Telefon":         "Phone",
 883                     "BLZ":             "BankCode",
 884                     "Konto":           "BankAccount",
 885                     "Postvermerk":     "PostalComment",
 886                     "Adresse":         "Address",
 887                     "Datum":           "Date",
 888                     "Betreff":         "Reference",
 889                     "Anrede":          "Opening",
 890                     "Anlagen":         "Encl.",
 891                     "Verteiler":       "cc",
 892                     "Gruss":           "Closing"}
 893     i = 0
 894     while 1:
 895         i = find_token(document.body, "\\begin_layout", i)
 896         if i == -1:
 897             break
 898
 899         layout = document.body[i][14:]
 900         if layout in obsoletedby:
 901             document.body[i] = "\\begin_layout " + obsoletedby[layout]
 902
 903         i += 1
 904
 905     document.textclass = "g-brief"
 906     document.set_textclass()
 907
 908
 909 def revert_gbrief(document):
 910     " Revert g-brief to g-brief-en "
 911     if document.textclass == "g-brief":
 912         document.textclass = "g-brief-en"
 913         document.set_textclass()
 914
 915
 916 def revert_html_options(document):
 917     " Remove html options "
 918     del_token(document.header, '\\html_use_mathml', 0)
 919     del_token(document.header, '\\html_be_strict', 0)
 920
 921
 922 def revert_includeonly(document):
 923     i = 0
 924     while True:
 925         i = find_token(document.header, "\\begin_includeonly", i)
 926         if i == -1:
 927             return
 928         j = find_end_of(document.header, i, "\\begin_includeonly", "\\end_includeonly")
 929         if j == -1:
 930             document.warning("Unable to find end of includeonly section!!")
 931             break
 932         document.header[i : j + 1] = []
 933
 934
 935 def revert_includeall(document):
 936     " Remove maintain_unincluded_children param "
 937     del_token(document.header, '\\maintain_unincluded_children', 0)
 938
 939
 940 def revert_multirow(document):
 941     " Revert multirow cells in tables to TeX-code"
 942     i = 0
 943     begin_table = 0
 944     bottom_index = 0
 945     multirow = False
 946     # cell type 3 is multirow begin cell
 947     i = find_token(document.body, '<cell multirow="3"', i)
 948     if i == -1:
 949       return
 950     # a multirow cell was found
 951     multirow = True
 952     while True:
 953       # find begin/end of table
 954       begin_table = find_token(document.body, '<lyxtabular version=', begin_table)
 955       if begin_table == -1:
 956           break
 957       end_table = find_token(document.body, '</lyxtabular>', begin_table)
 958       if end_table == -1:
 959           document.warning("Malformed LyX document: Could not find end of table.")
 960           break
 961       # store the number of rows
 962       begin = document.body[begin_table].find('rows="')
 963       end = document.body[begin_table].find('" ', begin)
 964       rows = document.body[begin_table][begin + 6:end]
 965       # store the number of columns
 966       begin = document.body[begin_table].find('columns="')
 967       end = document.body[begin_table].find('">', begin)
 968       columns = document.body[begin_table][begin + 9:end]
 969       # find column number of the multirows
 970       begin_row = begin_table
 971       for row in range(int(rows)):
 972         begin_row = find_token(document.body, '<row>', begin_row)
 973         begin_cell = begin_row
 974         for column in range(int(columns)):
 975           begin_cell = find_token(document.body, '<cell ', begin_cell)
 976           i = document.body[begin_cell].find('multirow="3"')
 977           if i <> -1:
 978             # we found a multirow in column number column - 1
 979             # store column width
 980             begin = document.body[begin_table + 2 + column].find('width="')
 981             end = document.body[begin_table + 2 + column].find('">', begin)
 982             col_width = document.body[begin_table + 2 + column][begin + 7:end]
 983             # "0pt" means that no width is specified
 984             if col_width == "0pt":
 985               col_width = "*"
 986             # determine the number of cells that are part of the multirow
 987             begin_row2 = begin_table
 988             # we have the multirow begin cell as minimal span
 989             span = 1
 990             # go one row behind the row where we found the multirow begin
 991             row2 = -1
 992             while row2 < row:
 993               begin_row2 = find_token(document.body, '<row>', begin_row2)
 994               row2 += 1
 995               begin_row2 += 1
 996             # step now through all rows until we reach the last table row
 997             rows2 = row
 998             while row2 < rows:
 999               begin_row2 = find_token(document.body, '<row>', begin_row2)
1000               begin_cell2 = begin_row2
1001               # look now for the column-th cell in the row
1002               column2 = 0
1003               while column2 < column:
1004                 begin_cell2 = find_token(document.body, '<cell ', begin_cell2)
1005                 column2 += 1
1006                 begin_cell2 += 1
1007               # cell type 4 is multirow-part cell
1008               begin_cell2 = find_token(document.body, '<cell ', begin_cell2)
1009               j = document.body[begin_cell2].find('multirow="4"')
1010               if j <> -1:
1011                 span += 1
1012                 # remove bottom line of previous multirow-part cell
1013                 if span > 1:
1014                   document.body[bottom_index] = document.body[bottom_index].replace(' bottomline="true" ', ' ')
1015                 # save index to be later able to remove bottom line
1016                 bottom_index = begin_cell2
1017               else:
1018                 break
1019               begin_row2 = find_token(document.body, '</row>', begin_row2)
1020             # remove the multirow tag, set the valignment to top
1021             # and remove the bottom line
1022             document.body[begin_cell] = document.body[begin_cell].replace(' multirow="3" ', ' ')
1023             document.body[begin_cell] = document.body[begin_cell].replace('valignment="middle"', 'valignment="top"')
1024             # only remove the bottom line if it is not a single cell as multirow
1025             if span > 1:
1026               document.body[begin_cell] = document.body[begin_cell].replace(' bottomline="true" ', ' ')
1027             # write ERT to create the multirow cell
1028             cend = find_token(document.body, "</cell>", begin_cell)
1029             if cend == -1:
1030               document.warning("Malformed LyX document: Could not find end of tabular cell.")
1031               i += 1
1032               continue
1033             blay = find_token(document.body, "\\begin_layout", begin_cell, cend)
1034             if blay == -1:
1035               document.warning("Can't find layout for cell!")
1036               i = j
1037               continue
1038             bend = find_end_of_layout(document.body, blay)
1039             if bend == -1:
1040               document.warning("Can't find end of layout for cell!")
1041               i = cend
1042               continue
1043             # do the later one first, so as not to mess up the numbering
1044             # we are wrapping the whole cell in this ert
1045             # so before the end of the layout...
1046             document.body[bend:bend] = put_cmd_in_ert("}")
1047             # ...and after the beginning
1048             document.body[blay + 1:blay + 1] = put_cmd_in_ert("\\multirow{" + str(span) + "}{" + col_width + "}{")
1049           # set index to end of current cell (that is now much bigger due to the ERT addition)
1050           begin_cell = find_token(document.body, '</cell>', begin_cell) + 1
1051         begin_row = find_token(document.body, '</row>', begin_row) + 1
1052
1053       # revert now all multirow part cells
1054       while True:
1055         # cell type 4 is multirow part cell
1056         k = find_token(document.body, '<cell multirow="4"', begin_table)
1057         if k == -1:
1058           break
1059         # remove the multirow tag, set the valignment to top
1060         # and remove the top line
1061         document.body[k] = document.body[k].replace(' multirow="4" ', ' ')
1062         document.body[k] = document.body[k].replace('valignment="middle"', 'valignment="top"')
1063         document.body[k] = document.body[k].replace(' topline="true" ', ' ')
1064         k += 1
1065       # go to the next table
1066       begin_table = end_table + 1
1067
1068     if multirow == True:
1069         add_to_preamble(document, ["\\usepackage{multirow}"])
1070
1071
def convert_math_output(document):
    """ Convert \\html_use_mathml to \\html_math_output.

    A true value becomes "0" (MathML), a false value becomes "2" (Images).
    A line that cannot be parsed is reported and converted to "0".
    """
    pos = find_token(document.header, "\\html_use_mathml", 0)
    if pos == -1:
        return
    line = document.header[pos]
    match = re.match(r'\\html_use_mathml\s+(\w+)', line)
    if match is None:
        document.warning("Can't match " + line)
        output = "0"
    elif str2bool(match.group(1)):
        output = "0"  # MathML
    else:
        output = "2"  # Images
    document.header[pos] = "\\html_math_output " + output
1087
1088
def revert_math_output(document):
    """ Revert \\html_math_output to \\html_use_mathml.

    Values "1" and "2" become "false"; every other value, and a line that
    cannot be parsed (which is also reported), becomes "true".
    """
    pos = find_token(document.header, "\\html_math_output", 0)
    if pos == -1:
        return
    line = document.header[pos]
    match = re.match(r'\\html_math_output\s+(\d)', line)
    use_mathml = "true"
    if match is None:
        document.warning("Unable to match " + line)
    elif match.group(1) in ("1", "2"):
        use_mathml = "false"
    document.header[pos] = "\\html_use_mathml " + use_mathml
1104
1105
1106
def revert_inset_preview(document):
    """ Dissolves the preview inset.

    For every Preview inset the inset begin/end lines, the first
    \\begin_layout inside it and the last \\end_layout inside it are
    removed, so that the content stays in the surrounding paragraph.
    If no layout (or no closing \\end_layout) is found inside the inset,
    only the inset begin/end lines are removed and a warning is issued.
    """
    i = 0
    while True:
        i = find_token(document.body, "\\begin_inset Preview", i)
        if i == -1:
            return
        iend = find_end_of_inset(document.body, i)
        if iend == -1:
            document.warning("Malformed LyX document: Could not find end of Preview inset.")
            i += 1
            continue

        # This has several issues.
        # We need to do something about the layouts inside InsetPreview.
        # If we just leave the first one, then we have something like:
        # \begin_layout Standard
        # ...
        # \begin_layout Standard
        # and we get a "no \end_layout" error. So something has to be done.
        # Ideally, we would check if it is the same as the layout we are in.
        # If so, we just remove it; if not, we end the active one. But it is
        # not easy to know what layout we are in, due to depth changes, etc,
        # and it is not clear to me how much work it is worth doing. In most
        # cases, the layout will probably be the same.
        #
        # For the same reason, we have to remove the \end_layout tag at the
        # end of the last layout in the inset. Again, that will sometimes be
        # wrong, but it will usually be right. To know what to do, we would
        # again have to know what layout the inset is in.

        blay = find_token(document.body, "\\begin_layout", i, iend)
        if blay == -1:
            document.warning("Can't find layout for preview inset!")
            # always do the later one first...
            del document.body[iend]
            del document.body[i]
            # deletions mean we do not need to reset i
            continue

        # This is where we would check what layout we are in.
        # The check for Standard is definitely wrong.
        #
        # lay = document.body[blay].split(None, 1)[1]
        # if lay != oldlayout:
        #     # record a boolean to tell us what to do later....
        #     # better to do it later, since (a) it won't mess up
        #     # the numbering and (b) we only modify at the end.

        # we want to delete the last \\end_layout in this inset, too.
        # note that this may not be the \\end_layout that goes with blay!!
        bend = find_end_of_layout(document.body, blay)
        if bend == -1 or bend > iend:
            # no usable end for the first layout: search the whole inset
            # after blay, so that we never look at lines outside of it
            bend = blay
        while True:
            tmp = find_token(document.body, "\\end_layout", bend + 1, iend)
            if tmp == -1:
                break
            bend = tmp
        if bend == blay:
            document.warning("Unable to find last layout in preview inset!")
            del document.body[iend]
            del document.body[i]
            # deletions mean we do not need to reset i
            continue
        # always do the later one first...
        del document.body[iend]
        del document.body[bend]
        del document.body[i:blay + 1]
        # we do not need to reset i
1174       # we do not need to reset i
1175
1176
def revert_equalspacing_xymatrix(document):
    """ Revert a Formula with xymatrix@! to an ERT inset.

    Formula insets containing \\xymatrix@! are replaced by ERT holding the
    formula text. \\usepackage[all]{xy} is added to the preamble when at
    least one formula was replaced and no remaining Formula inset that was
    inspected contains \\xymatrix.
    """
    plain_xymatrix_seen = False
    converted_any = False
    pos = 0

    while True:
        pos = find_token(document.body, "\\begin_inset Formula", pos)
        if pos == -1:
            break
        last = find_end_of_inset(document.body, pos)
        if last == -1:
            document.warning("Malformed LyX document: Could not find end of Formula inset.")
            pos += 1
            continue

        formula = document.body[pos:last]
        equal_spacing = False
        for text in formula:
            if "\\xymatrix@!" in text:
                equal_spacing = True
                break

        if equal_spacing:
            converted_any = True
            # 21 == len("\\begin_inset Formula "): keep only the formula text
            ert = put_cmd_in_ert([document.body[pos][21:]] + document.body[pos + 1:last])
            document.body[pos:last + 1] = ert
            pos += len(ert) - (last - pos) + 1
            continue

        for text in formula:
            if "\\xymatrix" in text:
                plain_xymatrix_seen = True
                break
        pos = last + 1

    if converted_any and not plain_xymatrix_seen:
        add_to_preamble(document, ['\\usepackage[all]{xy}'])
1215
1216
def revert_notefontcolor(document):
    """ Reverts greyed-out note font color to preamble code.

    The \\notefontcolor header line is always removed. Preamble code that
    defines the color and redefines the lyxgreyedout environment is only
    written when the body contains a greyed-out note.
    """
    i = find_token(document.header, "\\notefontcolor", 0)
    if i == -1:
        return

    colorcode = get_value(document.header, '\\notefontcolor', i)
    del document.header[i]

    # are there any grey notes?
    if find_token(document.body, "\\begin_inset Note Greyedout", 0) == -1:
        # no need to do anything else, and \renewcommand will throw
        # an error since lyxgreyedout will not exist.
        return

    # the color code is in the form #rrggbb where every character denotes a hex number
    red = hex2ratio(colorcode[1:3])
    green = hex2ratio(colorcode[3:5])
    blue = hex2ratio(colorcode[5:7])
    # write the preamble; every list item is one preamble line
    insert_to_preamble(document,
      ['%  for greyed-out notes',
       '\\@ifundefined{definecolor}{\\usepackage{color}}{}',
       '\\definecolor{note_fontcolor}{rgb}{%s,%s,%s}' % (red, green, blue),
       '\\renewenvironment{lyxgreyedout}',
       ' {\\textcolor{note_fontcolor}\\bgroup}{\\egroup}'])
1244
1245
def revert_turkmen(document):
    """ Set language Turkmen to English, both as the document language
    and in every \\lang switch in the body. """
    if document.language == "turkmen":
        document.language = "english"
        pos = find_token(document.header, "\\language", 0)
        if pos != -1:
            document.header[pos] = "\\language english"

    pos = find_token(document.body, "\\lang turkmen", 0)
    while pos != -1:
        document.body[pos] = document.body[pos].replace("\\lang turkmen", "\\lang english")
        pos = find_token(document.body, "\\lang turkmen", pos + 1)
1262
1263
def revert_fontcolor(document):
    """ Reverts font color to preamble code.

    The \\fontcolor header line is removed; unless the color is #000000,
    the color is defined and activated in the preamble instead.
    """
    pos = find_token(document.header, "\\fontcolor", 0)
    if pos == -1:
        return
    colorcode = get_value(document.header, '\\fontcolor', pos)
    del document.header[pos]
    # don't clutter the preamble if font color is not set
    if colorcode == "#000000":
        return
    # the color code is in the form #rrggbb: convert the three hex pairs
    # (red, green, blue) in that order
    rgb = tuple([hex2ratio(colorcode[k:k + 2]) for k in (1, 3, 5)])
    preamble = [
        '%  Set the font color',
        '\\@ifundefined{definecolor}{\\usepackage{color}}{}',
        '\\definecolor{document_fontcolor}{rgb}{%s,%s,%s}' % rgb,
        '\\color{document_fontcolor}',
    ]
    insert_to_preamble(document, preamble)
1284
1285
def revert_shadedboxcolor(document):
    """ Reverts shaded box color to preamble code.

    The \\boxbgcolor header line is removed and the color is defined as
    "shadecolor" in the preamble.
    """
    pos = find_token(document.header, "\\boxbgcolor", 0)
    if pos == -1:
        return
    colorcode = get_value(document.header, '\\boxbgcolor', pos)
    del document.header[pos]
    # the color code is in the form #rrggbb: convert the three hex pairs
    # (red, green, blue) in that order
    rgb = tuple([hex2ratio(colorcode[k:k + 2]) for k in (1, 3, 5)])
    preamble = [
        '%  Set the color of boxes with shaded background',
        '\\@ifundefined{definecolor}{\\usepackage{color}}{}',
        "\\definecolor{shadecolor}{rgb}{%s,%s,%s}" % rgb,
    ]
    insert_to_preamble(document, preamble)
1302
1303
def revert_lyx_version(document):
    """ Reverts LyX Version information from Inset Info.

    Every Info inset of type "lyxinfo" with arg "version" is replaced by a
    plain text line holding the version taken from the lyx2lyx_version
    module, or the text "LyX version" when that module is not usable.
    """
    version = "LyX version"
    try:
        import lyx2lyx_version
        version = lyx2lyx_version.version
    except (ImportError, AttributeError):
        # best effort: keep the generic placeholder text
        pass

    i = 0
    while True:
        i = find_token(document.body, '\\begin_inset Info', i)
        if i == -1:
            return
        j = find_end_of_inset(document.body, i + 1)
        if j == -1:
            document.warning("Malformed LyX document: Could not find end of Info inset.")
            i += 1
            continue

        # We expect:
        # \begin_inset Info
        # type  "lyxinfo"
        # arg   "version"
        # \end_inset
        typ = get_quoted_value(document.body, "type", i, j)
        arg = get_quoted_value(document.body, "arg", i, j)
        if arg != "version" or typ != "lyxinfo":
            i = j + 1
            continue

        # We do not actually know the version of LyX used to produce the document.
        # But we can use our version, since we are reverting.
        # Now we want to check if the line after "\end_inset" is empty. It normally
        # is, so we want to remove it, too. The inset may end on the very last
        # body line, in which case there is no following line to look at.
        lastline = j + 1
        if lastline < len(document.body) and document.body[lastline].strip() == "":
            lastline = j + 2
        document.body[i:lastline] = [version]
        i += 1
1345
1346
def revert_math_scale(document):
    """ Remove math scaling and LaTeX options from the header. """
    for token in ('\\html_math_img_scale',
                  '\\html_latex_start',
                  '\\html_latex_end'):
        del_token(document.header, token, 0)
1352
1353
def revert_pagesizes(document):
    """ Revert page sizes to default.

    The \\papersize header line is deleted when it names one of the sizes
    listed below.
    """
    reverted_sizes = ("a0paper", "a1paper", "a2paper", "a6paper",
                      "b0paper", "b1paper", "b2paper", "b6paper",
                      "b0j", "b1j", "b2j", "b3j", "b4j", "b5j", "b6j")
    pos = find_token(document.header, '\\papersize', 0)
    if pos == -1:
        return
    # the value follows "\papersize " (11 characters)
    if document.header[pos][11:] in reverted_sizes:
        del document.header[pos]
1365
1366
def revert_DIN_C_pagesizes(document):
    """ Revert DIN C page sizes to default.

    The \\papersize header line is deleted when it names c0paper..c6paper.
    """
    din_c_sizes = ("c0paper", "c1paper", "c2paper", "c3paper",
                   "c4paper", "c5paper", "c6paper")
    pos = find_token(document.header, '\\papersize', 0)
    if pos == -1:
        return
    # the value follows "\papersize " (11 characters)
    if document.header[pos][11:] in din_c_sizes:
        del document.header[pos]
1376
1377
def convert_html_quotes(document):
    """ Remove quotes around html_latex_start and html_latex_end.

    Lines whose value is not enclosed in double quotes are left as is.
    """
    quoted = (('\\html_latex_start', r'\\html_latex_start\s+"(.*)"'),
              ('\\html_latex_end', r'\\html_latex_end\s+"(.*)"'))
    for token, pattern in quoted:
        pos = find_token(document.header, token, 0)
        if pos == -1:
            continue
        match = re.match(pattern, document.header[pos])
        if match:
            document.header[pos] = token + " " + match.group(1)
1396
1397
def revert_html_quotes(document):
    """ Add quotes around the values of html_latex_start and html_latex_end.

    A line that does not match the expected form is reported and deleted.
    """
    unquoted = (('\\html_latex_start', r'\\html_latex_start\s+(.*)'),
                ('\\html_latex_end', r'\\html_latex_end\s+(.*)'))
    for token, pattern in unquoted:
        pos = find_token(document.header, token, 0)
        if pos == -1:
            continue
        line = document.header[pos]
        match = re.match(pattern, line)
        if match:
            document.header[pos] = token + ' "' + match.group(1) + '"'
        else:
            # token[1:] is the token name without the leading backslash
            document.warning("Weird " + token[1:] + " line: " + line)
            del document.header[pos]
1422
1423
def revert_output_sync(document):
    """ Remove forward search options from the header. """
    # keep this order: \output_sync_macro is handled before \output_sync
    for token in ('\\output_sync_macro', '\\output_sync'):
        del_token(document.header, token, 0)
1428
1429
def revert_align_decimal(document):
  """ Revert decimal alignment of table columns to center alignment.

  In every Tabular inset, the <column lines before the first <cell line
  that carry alignment="decimal" lose their decimal_point option and are
  set to alignment="center".
  """
  i = 0
  while True:
    i = find_token(document.body, "\\begin_inset Tabular", i)
    if i == -1:
      return
    j = find_end_of_inset(document.body, i)
    if j == -1:
      document.warning("Unable to find end of Tabular inset at line " + str(i))
      i += 1
      continue
    cell = find_token(document.body, "<cell", i, j)
    if cell == -1:
      document.warning("Can't find any cells in Tabular inset at line " + str(i))
      i = j
      continue
    k = i + 1
    while True:
      k = find_token(document.body, "<column", k, cell)
      if k == -1:
        # done with the columns of this table only; other tables follow
        break
      if document.body[k].find('alignment="decimal"') == -1:
        k += 1
        continue
      remove_option(document.body, k, 'decimal_point')
      document.body[k] = \
        document.body[k].replace('alignment="decimal"', 'alignment="center"')
      k += 1
    # resume behind the column definitions, so that tables nested in the
    # cells of this one are visited as well
    i = cell
1458
1459
def convert_optarg(document):
    """ Convert \\begin_inset OptArg to \\begin_inset Argument. """
    pos = find_token(document.body, '\\begin_inset OptArg', 0)
    while pos != -1:
        document.body[pos] = "\\begin_inset Argument"
        pos = find_token(document.body, '\\begin_inset OptArg', pos + 1)
1469
1470
def revert_argument(document):
    """ Convert \\begin_inset Argument to \\begin_inset OptArg. """
    pos = find_token(document.body, '\\begin_inset Argument', 0)
    while pos != -1:
        document.body[pos] = "\\begin_inset OptArg"
        pos = find_token(document.body, '\\begin_inset Argument', pos + 1)
1480
1481
def revert_makebox(document):
  """ Convert \\makebox to TeX code.

  Frameless boxes with 'use_makebox 1' are replaced by ERT that opens
  \\makebox[<width>][<hor_pos>]{ before the box content and closes it with
  } after the first layout of the box. For all other boxes the use_makebox
  line is simply removed.
  """
  i = 0
  while True:
    i = find_token(document.body, '\\begin_inset Box', i)
    if i == -1:
      break
    z = find_end_of_inset(document.body, i)
    if z == -1:
      document.warning("Malformed LyX document: Can't find end of box inset.")
      i += 1
      continue
    blay = find_token(document.body, "\\begin_layout", i, z)
    if blay == -1:
      document.warning("Malformed LyX document: Can't find layout in box.")
      i = z
      continue
    # by looking before the layout we make sure we're actually finding
    # an option, not text.
    j = find_token(document.body, 'use_makebox', i, blay)
    if j == -1:
      i = z
      continue

    # get_value returns the setting as text, so compare with "1", not 1
    if not check_token(document.body[i], "\\begin_inset Box Frameless") \
      or get_value(document.body, 'use_makebox', j) != "1":
      del document.body[j]
      i = z
      continue
    bend = find_end_of_layout(document.body, blay)
    if bend == -1 or bend > z:
      document.warning("Malformed LyX document: Can't find end of layout in box.")
      i = z
      continue
    # determine the alignment
    align = get_quoted_value(document.body, 'hor_pos', i, blay, "c")
    # determine the width
    length = get_quoted_value(document.body, 'width', i, blay, "50col%")
    length = latex_length(length)[1]
    # remove the \end_layout \end_inset pair
    # (the later replacement is done first, so that i and blay stay valid)
    document.body[bend:z + 1] = put_cmd_in_ert("}")
    subst = "\\makebox[" + length + "][" \
      + align + "]{"
    document.body[i:blay + 1] = put_cmd_in_ert(subst)
    i += 1
1527
1528
def convert_use_makebox(document):
    """ Adds use_makebox option for boxes.

    "use_makebox 0" is inserted right after the use_parbox line of every
    Box inset; boxes without such a line are reported and skipped.
    """
    pos = 0
    while True:
        pos = find_token(document.body, '\\begin_inset Box', pos)
        if pos == -1:
            break
        # all of this is to make sure we actually find the use_parbox
        # that is an option for this box, not some text elsewhere.
        inset_end = find_end_of_inset(document.body, pos)
        if inset_end == -1:
            document.warning("Can't find end of box inset!!")
            pos += 1
            continue
        first_layout = find_token(document.body, "\\begin_layout", pos, inset_end)
        if first_layout == -1:
            document.warning("Can't find layout in box inset!!")
            pos = inset_end
            continue
        # so now we are looking for use_parbox before the box's layout
        parbox = find_token(document.body, 'use_parbox', pos, first_layout)
        if parbox == -1:
            document.warning("Malformed LyX document: Can't find use_parbox statement in box.")
            pos = inset_end
            continue
        document.body.insert(parbox + 1, "use_makebox 0")
        pos = inset_end + 1
1556
1557
def revert_IEEEtran(document):
    """ Convert IEEEtran layouts and styles to TeX code.

    Only applies to the IEEEtran text class. Two flex insets are reverted,
    three layouts are moved to the preamble as LaTeX commands and two
    layouts are renamed.
    """
    if document.textclass != "IEEEtran":
        return
    revert_flex_inset(document.body, "IEEE membership", "\\IEEEmembership")
    revert_flex_inset(document.body, "Lowercase", "\\MakeLowercase")

    # layouts whose content is moved to the preamble: (layout, command)
    to_preamble = (("Special Paper Notice", "\\IEEEspecialpapernotice"),
                   ("After Title Text",     "\\IEEEaftertitletext"),
                   ("Publication ID",       "\\IEEEpubid"))
    # layouts that only get another name: (layout, replacement)
    renamed = (("Page headings",           "MarkBoth"),
               ("Biography without photo", "BiographyNoPhoto"))

    for layout, command in to_preamble:
        pos = 0
        while True:
            pos = find_token(document.body, '\\begin_layout ' + layout, pos)
            if pos == -1:
                break
            last = find_end_of_layout(document.body, pos)
            if last == -1:
                document.warning("Malformed LyX document: Can't find end of " + layout + " layout.")
                pos += 1
                continue
            content = lyx2latex(document, document.body[pos:last + 1])
            add_to_preamble(document, [command + "{" + content + "}"])
            del document.body[pos:last + 1]
            # the layout is gone, so pos already points behind it

    for layout, replacement in renamed:
        pos = 0
        while True:
            pos = find_token(document.body, '\\begin_layout ' + layout, pos)
            if pos == -1:
                break
            last = find_end_of_layout(document.body, pos)
            if last == -1:
                document.warning("Malformed LyX document: Can't find end of " + layout + " layout.")
                pos += 1
                continue
            document.body[pos] = "\\begin_layout " + replacement
            pos = last
1589         # no need to reset i
1590
1591
def convert_prettyref(document):
    """ Converts prettyref references to neutral formatted refs.

    In every ref CommandInset, "LatexCommand prettyref" is replaced by
    "LatexCommand formatted". "\\use_refstyle 0" is then inserted before
    the last header line.
    """
    i = 0
    while True:
        i = find_token(document.body, "\\begin_inset CommandInset ref", i)
        if i == -1:
            break
        j = find_end_of_inset(document.body, i)
        if j == -1:
            document.warning("Malformed LyX document: No end of InsetRef!")
            i += 1
            continue
        k = find_token(document.body, "LatexCommand prettyref", i, j)
        if k != -1:
            document.body[k] = "LatexCommand formatted"
        i = j + 1
    document.header.insert(-1, "\\use_refstyle 0")
1612
1613
def revert_refstyle(document):
    """Revert neutral formatted references to prettyref.

    In every "CommandInset ref" inset the line "LatexCommand formatted" is
    replaced by "LatexCommand prettyref".  The first "\\use_refstyle" line
    of the header, if there is one, is removed.
    """
    i = 0
    while True:
        i = find_token(document.body, "\\begin_inset CommandInset ref", i)
        if i == -1:
            break
        j = find_end_of_inset(document.body, i)
        if j == -1:
            document.warning("Malformed LyX document: No end of InsetRef")
            i += 1
            continue
        # only look for the command inside this inset
        k = find_token(document.body, "LatexCommand formatted", i, j)
        if k != -1:
            document.body[k] = "LatexCommand prettyref"
        i = j + 1
    i = find_token(document.header, "\\use_refstyle", 0)
    if i != -1:
        document.header.pop(i)
1636
1637
def revert_nameref(document):
    """Convert nameref and Nameref reference insets to ERT.

    Every "CommandInset ref" inset whose command is "Nameref" or "nameref"
    is replaced by ERT holding the corresponding TeX command applied to the
    referenced label.  If at least one inset was converted, the nameref
    package is added to the preamble.
    """
    cmds = ["Nameref", "nameref"]
    foundone = False
    rx = re.compile(r'reference "(.*)"')
    for cmd in cmds:
        i = 0
        oldcmd = "LatexCommand " + cmd
        while True:
            # It seems better to look for this, as most of the reference
            # insets won't be ones we care about.
            i = find_token(document.body, oldcmd, i)
            if i == -1:
                break
            cmdloc = i
            i += 1
            # Make sure it is actually in an inset!
            # A normal line could begin with "LatexCommand nameref"!
            val = is_in_inset(document.body, cmdloc,
                              "\\begin_inset CommandInset ref")
            if not val:
                continue
            stins, endins = val

            # ok, so it is in an InsetRef
            refline = find_token(document.body, "reference", stins, endins)
            if refline == -1:
                # stins is a line index, so it has to be converted for the message
                document.warning("Can't find reference for inset at line " + str(stins) + "!!")
                continue
            m = rx.match(document.body[refline])
            if not m:
                document.warning("Can't match reference line: " + document.body[refline])
                continue
            foundone = True
            ref = m.group(1)
            newcontent = put_cmd_in_ert('\\' + cmd + '{' + ref + '}')
            document.body[stins:endins + 1] = newcontent
            # go on right behind the ERT: the lines after the old inset now
            # start there, whatever the length of the replacement is
            i = stins + len(newcontent)

    if foundone:
        add_to_preamble(document, ["\\usepackage{nameref}"])
1678
1679
def remove_Nameref(document):
    """Turn Nameref commands of reference insets into nameref commands.

    A body line starting with "LatexCommand Nameref" is rewritten only if
    is_in_inset reports it to be inside a "CommandInset ref" inset; such a
    line may also occur as ordinary text.
    """
    pos = 0
    while True:
        # Searching for the command itself is cheaper than visiting every
        # reference inset, since most of them are of no interest here.
        hit = find_token(document.body, "LatexCommand Nameref", pos)
        if hit == -1:
            return
        pos = hit + 1
        if is_in_inset(document.body, hit, "\\begin_inset CommandInset ref"):
            document.body[hit] = "LatexCommand nameref"
1698
1699
def revert_mathrsfs(document):
    """Load the mathrsfs package if \\mathscr is used in the document.

    The package is added to the preamble once, as soon as a body line
    containing "\\mathscr{" is found.
    """
    for line in document.body:
        if "\\mathscr{" in line:
            add_to_preamble(document, ["\\usepackage{mathrsfs}"])
            return
1707
1708
def convert_flexnames(document):
    """Drop the type prefix from the names of flex insets.

    "\\begin_inset Flex Custom:Style" becomes "\\begin_inset Flex Style";
    the prefixes "CharStyle:" and "Element:" are removed the same way.
    Flex insets without one of these prefixes are left alone.
    """
    prefixed = re.compile(r'^\\begin_inset Flex (?:Custom|CharStyle|Element):(.+)$')
    pos = find_token(document.body, "\\begin_inset Flex", 0)
    while pos != -1:
        found = prefixed.match(document.body[pos])
        if found is not None:
            document.body[pos] = "\\begin_inset Flex " + found.group(1)
        pos = find_token(document.body, "\\begin_inset Flex", pos + 1)
1722
1723
# Maps the unprefixed name of a flex inset to the prefixed name it is given
# by revert_flexnames when the document backend is "latex".  The table is
# generated from the names, grouped by the prefix they receive.
flex_insets = dict(
    (name, prefix + ":" + name)
    for prefix, names in (
        ("CharStyle", (
            "Alert", "Code", "Concepts", "E-Mail", "Emph", "Expression",
            "Initial", "Institute", "Meaning", "Noun", "Strong",
            "Structure",
        )),
        ("Custom", (
            "ArticleMode", "Endnote", "Glosse", "PresentationMode",
            "Tri-Glosse",
        )),
    )
    for name in names
)
1743
# Maps the unprefixed name of a flex inset to its "Element:" name; used by
# revert_flexnames for every document backend other than "latex".  All
# entries share the prefix, so the table is generated from the names.
flex_elements = dict(
    (name, "Element:" + name)
    for name in (
        "Abbrev", "CCC-Code", "Citation-number", "City", "Code", "CODEN",
        "Country", "Day", "Directory", "Dscr", "Email", "Emph", "Filename",
        "Firstname", "Fname", "GuiButton", "GuiMenu", "GuiMenuItem", "ISSN",
        "Issue-day", "Issue-months", "Issue-number", "KeyCap", "KeyCombo",
        "Keyword", "Literal", "MenuChoice", "Month", "Orgdiv", "Orgname",
        "Postcode", "SS-Code", "SS-Title", "State", "Street", "Surname",
        "Volume", "Year",
    )
)
1784
1785
def revert_flexnames(document):
    """Give flex insets their prefixed names back.

    The name of every flex inset is looked up in flex_insets if the
    document backend is "latex" and in flex_elements otherwise; a name
    found there is replaced by the prefixed name stored in the table.
    Names that are not in the table are left as they are.
    """
    flexlist = flex_elements
    if document.backend == "latex":
        flexlist = flex_insets

    flexname = re.compile(r'^\\begin_inset Flex\s+(.+)$')
    pos = find_token(document.body, "\\begin_inset Flex", 0)
    while pos != -1:
        line = document.body[pos]
        found = flexname.match(line)
        if found is None:
            document.warning("Illegal flex inset: " + line)
        elif found.group(1) in flexlist:
            document.body[pos] = "\\begin_inset Flex " + flexlist[found.group(1)]
        pos = find_token(document.body, "\\begin_inset Flex", pos + 1)
1807
1808
def convert_mathdots(document):
    """Add "\\use_mathdots 1" to the header, right after "\\use_esint".

    Nothing is added if the header has no "\\use_esint" line.
    """
    esint = find_token(document.header, "\\use_esint", 0)
    if esint == -1:
        return
    document.header.insert(esint + 1, "\\use_mathdots 1")
1814
1815
def revert_mathdots(document):
    """Load the mathdots package in the preamble if the document needs it.

    The "\\use_mathdots" header line is removed.  Its value decides what
    happens: 0 never loads the package, 2 always loads it.  Any other
    value, an unparsable value or a missing line is treated as "auto": the
    package is loaded only if "\\iddots" occurs in a Formula inset.
    """
    mathdots = find_token(document.header, "\\use_mathdots", 0)
    if mathdots == -1:
        document.warning("No \\use_mathdots line. Assuming auto.")
    else:
        val = get_value(document.header, "\\use_mathdots", mathdots)
        del document.header[mathdots]
        try:
            usedots = int(val)
        except (TypeError, ValueError):
            document.warning("Invalid \\use_mathdots value: " + str(val) + ". Assuming auto.")
            usedots = 1

        if usedots == 0:
            # do not load case
            return
        if usedots == 2:
            # force load case
            add_to_preamble(document, ["\\usepackage{mathdots}"])
            return

    # so we are in the auto case. we want to load mathdots if \iddots is used.
    i = 0
    while True:
        i = find_token(document.body, '\\begin_inset Formula', i)
        if i == -1:
            return
        j = find_end_of_inset(document.body, i)
        if j == -1:
            document.warning("Malformed LyX document: Can't find end of Formula inset at line " + str(i))
            i += 1
            continue
        code = "\n".join(document.body[i:j])
        if code.find("\\iddots") != -1:
            # NOTE(review): \@ifundefined is normally given three arguments;
            # the preamble line is kept as it was - confirm it is intended.
            add_to_preamble(document, ["\\@ifundefined{iddots}{\\usepackage{mathdots}}"])
            return
        i = j
1856
1857
def convert_rule(document):
    """Convert \\lyxline to a CommandInset line.

    Every "\\lyxline" line of the body is replaced by a line inset with a
    fixed offset, width and height.  If the line is the first content of
    its paragraph and paragraphs are indented, "\\noindent" is added to the
    paragraph; if other content precedes it, a newline inset is put in
    front of the line inset.
    """
    inset = ['\\begin_inset CommandInset line',
             'LatexCommand rule',
             'offset "0.5ex"',
             'width "100line%"',
             'height "1pt"', '',
             '\\end_inset', '', '']
    newline = ["\\begin_inset Newline newline", "\\end_inset", ""]

    # if paragraphs are indented, we may have to unindent to get the
    # line to be full-width.
    indent = get_value(document.header, "\\paragraph_separation", 0)
    have_indent = (indent == "indent")

    i = 0
    while True:
        i = find_token(document.body, "\\lyxline", i)
        if i == -1:
            return

        # we need to find out if this line follows other content
        # in its paragraph. find its layout....
        lastlay = find_token_backwards(document.body, "\\begin_layout", i)
        if lastlay == -1:
            document.warning("Can't find layout for line at " + str(i))
            # do the best we can.
            document.body[i:i + 1] = inset
            i += len(inset)
            continue

        # ...and look for other content before it.
        lineisfirst = True
        for line in document.body[lastlay + 1:i]:
            # is it empty or a paragraph option?
            if not line or line[0] == '\\':
                continue
            lineisfirst = False
            break

        if lineisfirst:
            document.body[i:i + 1] = inset
            i += len(inset)
            if have_indent:
                # we need to unindent, lest the line be too long
                document.body.insert(lastlay + 1, "\\noindent")
                # the insertion moved everything behind it down by one line
                i += 1
        else:
            # so our line is in the middle of a paragraph
            # we need to add a new line, lest this line follow the
            # other content on that line and run off the side of the page
            document.body[i:i + 1] = newline + inset
            i += len(newline) + len(inset)
1911
1912
def revert_rule(document):
    """Revert line insets to TeX code.

    Every "CommandInset line" inset is replaced by ERT holding a \\rule
    command built from the offset, width and height of the inset.  The
    optional offset argument is written only if the inset has an offset.
    Conversion stops at the first inset whose end cannot be found.
    """
    i = 0
    while True:
        i = find_token(document.body, "\\begin_inset CommandInset line", i)
        if i == -1:
            return
        # find end of inset
        j = find_token(document.body, "\\end_inset", i)
        if j == -1:
            document.warning("Malformed LyX document: Can't find end of line inset.")
            return
        # determine the optional offset
        offset = get_quoted_value(document.body, 'offset', i, j)
        if offset:
            offset = '[' + offset + ']'
        else:
            offset = ''
        # determine the width
        width = get_quoted_value(document.body, 'width', i, j, "100col%")
        width = latex_length(width)[1]
        # determine the height
        height = get_quoted_value(document.body, 'height', i, j, "1pt")
        height = latex_length(height)[1]
        # output the \rule command; offset already carries its brackets
        subst = "\\rule" + offset + "{" + width + "}{" + height + "}"
        ert = put_cmd_in_ert(subst)
        document.body[i:j + 1] = ert
        # continue behind the lines that were just inserted
        i += len(ert)
1939
1940
def revert_diagram(document):
    """Add the feyn package to the preamble if \\Diagram is used in math.

    The Formula insets are searched in document order; the package is added
    once, for the first inset containing "\\Diagram".  The search is given
    up at the first Formula inset whose end cannot be found.
    """
    start = find_token(document.body, '\\begin_inset Formula', 0)
    while start != -1:
        stop = find_end_of_inset(document.body, start)
        if stop == -1:
            document.warning("Malformed LyX document: Can't find end of Formula inset.")
            return
        if "\\Diagram" in "\n".join(document.body[start:stop]):
            # one \usepackage is enough, so we are done
            add_to_preamble(document, ["\\usepackage{feyn}"])
            return
        start = find_token(document.body, '\\begin_inset Formula', stop)
1959
1960
def convert_bibtex_clearpage(document):
    """Insert a clear(double)page before bibliographies that use bibtotoc.

    For every bibtex inset whose options contain "bibtotoc", a Standard
    paragraph holding a Newpage inset is inserted in front of the paragraph
    containing the bibliography.  The inset is "clearpage" for single sided
    documents and "cleardoublepage" otherwise; a missing or invalid
    "\\papersides" header value is treated as single sided.
    """
    i = find_token(document.header, '\\papersides', 0)
    sides = 0
    if i == -1:
        document.warning("Malformed LyX document: Can't find papersides definition.")
        document.warning("Assuming single sided.")
        sides = 1
    else:
        val = get_value(document.header, "\\papersides", i)
        try:
            sides = int(val)
        except (TypeError, ValueError):
            # sides keeps the invalid value 0 and is reported right below
            pass
        if sides != 1 and sides != 2:
            document.warning("Invalid papersides value: " + str(val))
            document.warning("Assuming single sided.")
            sides = 1

    j = 0
    while True:
        j = find_token(document.body, "\\begin_inset CommandInset bibtex", j)
        if j == -1:
            return

        k = find_end_of_inset(document.body, j)
        if k == -1:
            document.warning("Can't find end of Bibliography inset at line " + str(j))
            j += 1
            continue

        # only act if there is the option "bibtotoc"
        val = get_value(document.body, 'options', j, k)
        if not val:
            document.warning("Can't find options for bibliography inset at line " + str(j))
            j = k
            continue

        if val.find("bibtotoc") == -1:
            j = k
            continue

        # so we want to insert a new page right before the paragraph that
        # this bibliography thing is in.
        lay = find_token_backwards(document.body, "\\begin_layout", j)
        if lay == -1:
            document.warning("Can't find layout containing bibliography inset at line " + str(j))
            j = k
            continue

        if sides == 1:
            cmd = "clearpage"
        else:
            cmd = "cleardoublepage"
        subst = ['\\begin_layout Standard',
                 '\\begin_inset Newpage ' + cmd,
                 '\\end_inset', '', '',
                 '\\end_layout', '']
        document.body[lay:lay] = subst
        # the inset moved down by the inserted lines; go on at its end
        j = k + len(subst)
2022
2023
def check_passthru(document):
    """Tell whether the document is a literate one.

    Returns True if the text class is one of the literate classes or if the
    module list of the document contains "sweave" or "noweb", and False
    otherwise.  The module list is only requested when the text class does
    not settle the question.
    """
    if document.textclass in ("literate-article", "literate-book",
                              "literate-report"):
        return True
    for module in document.get_module_list():
        if module in ("sweave", "noweb"):
            return True
    return False
2034
2035
def convert_passthru(document):
    """Split Chunk and Scrap layouts at their newline insets.

    Only documents accepted by check_passthru are converted.  Inside every
    Chunk or Scrap layout each newline inset is replaced by the end of the
    layout and the start of a new layout of the same kind.  If the layout
    following the converted one is of the same kind, an empty layout of
    that kind is put between the two.

    See http://www.mail-archive.com/lyx-devel@lists.lyx.org/msg161298.html
    """
    if not check_passthru(document):
        return

    rx = re.compile(r"\\begin_layout \s*(\w+)")
    for lay in ["Chunk", "Scrap"]:
        # every kind of layout is searched for from the top of the body
        beg = 0
        while True:
            beg = find_token(document.body, "\\begin_layout " + lay, beg)
            if beg == -1:
                break
            end = find_end_of_layout(document.body, beg)
            if end == -1:
                document.warning("Can't find end of layout at line " + str(beg))
                beg += 1
                continue
            # we are now going to replace newline insets within this layout
            # by new instances of this layout. so we have repeated layouts
            # instead of newlines.
            ns = beg
            while True:
                ns = find_token(document.body, "\\begin_inset Newline newline", ns, end)
                if ns == -1:
                    break
                ne = find_end_of_inset(document.body, ns)
                if ne == -1 or ne > end:
                    document.warning("Can't find end of inset at line " + str(ns))
                    ns += 1
                    continue
                # swallow the empty line behind the inset, if there is one
                if ne + 1 < len(document.body) and document.body[ne + 1] == "":
                    ne += 1
                subst = ["\\end_layout", "", "\\begin_layout " + lay]
                removed = ne - ns + 1
                document.body[ns:ne + 1] = subst
                # go on behind the new lines and move the end of the layout
                # by the number of lines the body has grown
                ns += len(subst)
                end += len(subst) - removed
            # ok, we now want to find out if the next layout is the
            # same as this one. if so, we will insert an extra copy of it
            didit = False
            nextbeg = find_token(document.body, "\\begin_layout", end)
            if nextbeg != -1:
                m = rx.match(document.body[nextbeg])
                if m and m.group(1) == lay:
                    subst = ["\\begin_layout " + lay, "", "\\end_layout", ""]
                    document.body[nextbeg:nextbeg] = subst
                    didit = True
            beg = end + 1
            if didit:
                beg += 4 # for the extra layout
2090
2091
def revert_passthru(document):
    """Merge adjacent Chunk or Scrap layouts into one layout.

    Only documents accepted by check_passthru are converted.  As long as a
    Chunk or Scrap layout is followed by a layout of the same kind, the two
    are joined by a newline inset.  An empty following layout is removed
    instead, and merging stops there for the layout at hand.

    See http://www.mail-archive.com/lyx-devel@lists.lyx.org/msg161298.html
    """
    if not check_passthru(document):
        return
    rx = re.compile(r"\\begin_layout \s*(\w+)")
    for lay in ["Chunk", "Scrap"]:
        # every kind of layout is searched for from the top of the body
        beg = 0
        while True:
            beg = find_token(document.body, "\\begin_layout " + lay, beg)
            if beg == -1:
                break
            end = find_end_of_layout(document.body, beg)
            if end == -1:
                document.warning("Can't find end of layout at line " + str(beg))
                beg += 1
                continue

            # we now want to find out if the next layout is the
            # same as this one. but we will need to do this over and
            # over again.
            while True:
                nextbeg = find_token(document.body, "\\begin_layout", end)
                if nextbeg == -1:
                    break
                m = rx.match(document.body[nextbeg])
                if not m or m.group(1) != lay:
                    break
                # so it is the same layout again. we now want to know if it
                # is empty. but first let's check and make sure there is no
                # content between the two layouts.
                for idx in range(end + 1, nextbeg):
                    if document.body[idx] != "":
                        document.warning("Found content between adjacent " + lay + " layouts!")
                        break
                nextend = find_end_of_layout(document.body, nextbeg)
                if nextend == -1:
                    document.warning("Can't find end of layout at line " + str(nextbeg))
                    break
                empty = True
                for idx in range(nextbeg + 1, nextend):
                    if document.body[idx] != "":
                        empty = False
                        break
                if empty:
                    # empty layouts just get removed
                    # should we check if it's before yet another such layout?
                    del document.body[nextbeg:nextend + 1]
                    # and we do not want to check again. we know the next
                    # layout should be another Chunk and should be left as is.
                    break
                # if it's not empty, then we want to insert a newline in
                # place of the layout switch
                subst = ["\\begin_inset Newline newline", "\\end_inset", ""]
                document.body[end:nextbeg + 1] = subst
                # and now we have to find the end of the new, larger layout
                newend = find_end_of_layout(document.body, beg)
                if newend == -1:
                    document.warning("Can't find end of new layout at line " + str(beg))
                    break
                end = newend
            beg = end + 1
2159
2160
def _multirow_offset_span(document, begin_table, row, column):
    """Demote the multirow-part cells below a multirow begin cell.

    Starting with the row after row number `row` of the table beginning at
    line `begin_table`, every consecutive cell in column `column` that is
    tagged multirow="4" loses that tag and its top line and is aligned to
    the top; all of these cells but the last also lose their bottom line.
    Returns the number of cells of the multirow, the begin cell included.
    """
    # go just behind the <row> tag of the row holding the begin cell
    begin_row2 = begin_table
    for _ in range(row + 1):
        begin_row2 = find_token(document.body, '<row>', begin_row2) + 1
    # ERT inserted for earlier cells has moved the end of the table, so it
    # is looked up afresh; a multirow cannot reach beyond it.
    table_end = find_token(document.body, '</lyxtabular>', begin_row2)
    # we have the multirow begin cell as minimal span
    span = 1
    previous_part = -1
    while True:
        begin_row2 = find_token(document.body, '<row>', begin_row2)
        if begin_row2 == -1 or (table_end != -1 and begin_row2 > table_end):
            break
        # look now for the column-th cell in the row
        begin_cell2 = begin_row2
        for _ in range(column):
            begin_cell2 = find_token(document.body, '<cell ', begin_cell2) + 1
        begin_cell2 = find_token(document.body, '<cell ', begin_cell2)
        # cell type 4 is multirow-part cell
        if begin_cell2 == -1 or document.body[begin_cell2].find('multirow="4"') == -1:
            break
        span += 1
        # only the last part cell keeps its bottom line
        if previous_part != -1:
            document.body[previous_part] = document.body[previous_part].replace(' bottomline="true" ', ' ')
        previous_part = begin_cell2
        # remove the multirow tag, set the valignment to top
        # and remove the top line
        cell = document.body[begin_cell2]
        cell = cell.replace(' multirow="4" ', ' ')
        cell = cell.replace('valignment="middle"', 'valignment="top"')
        cell = cell.replace(' topline="true" ', ' ')
        document.body[begin_cell2] = cell
        begin_row2 = find_token(document.body, '</row>', begin_row2)
        if begin_row2 == -1:
            break
    return span


def _wrap_cell_in_multirow_ert(document, begin_cell, opening):
    """Wrap the first layout of the cell at `begin_cell` in ERT.

    `opening` is put in ERT at the start of the layout and "}" in ERT at
    its end.  A warning is issued and nothing is changed if the end of the
    cell, its layout or the end of that layout cannot be found.
    """
    cend = find_token(document.body, "</cell>", begin_cell)
    if cend == -1:
        document.warning("Malformed LyX document: Could not find end of tabular cell.")
        return
    blay = find_token(document.body, "\\begin_layout", begin_cell, cend)
    if blay == -1:
        document.warning("Can't find layout for cell!")
        return
    bend = find_end_of_layout(document.body, blay)
    if bend == -1:
        document.warning("Can't find end of layout for cell!")
        return
    # do the later one first, so as not to mess up the numbering
    # we are wrapping the whole cell in this ert
    # so before the end of the layout...
    document.body[bend:bend] = put_cmd_in_ert("}")
    # ...and after the beginning
    document.body[blay + 1:blay + 1] = put_cmd_in_ert(opening)


def revert_multirowOffset(document):
    """Revert multirow cells with an offset in tables to TeX code.

    Nothing is done unless the body contains a multirow begin cell with an
    "mroffset" attribute.  Otherwise every such cell is turned into an
    ordinary cell whose content is wrapped in a \\multirow command written
    as ERT, the multirow-part cells below it become ordinary cells, and the
    multirow package is added to the preamble.

    This routine is the same as the revert_multirow routine except that it
    checks additionally for the offset.
    """
    # cell type 3 is multirow begin cell
    if find_token(document.body, '<cell multirow="3" mroffset=', 0) == -1:
        return

    begin_table = 0
    while True:
        # find begin/end of table
        begin_table = find_token(document.body, '<lyxtabular version=', begin_table)
        if begin_table == -1:
            break
        end_table = find_token(document.body, '</lyxtabular>', begin_table)
        if end_table == -1:
            document.warning("Malformed LyX document: Could not find end of table.")
            break
        # store the number of rows
        begin = document.body[begin_table].find('rows="')
        end = document.body[begin_table].find('" ', begin)
        rows = document.body[begin_table][begin + 6:end]
        # store the number of columns
        begin = document.body[begin_table].find('columns="')
        end = document.body[begin_table].find('">', begin)
        columns = document.body[begin_table][begin + 9:end]
        # find column number of the multirows with offset
        begin_row = begin_table
        for row in range(int(rows)):
            begin_row = find_token(document.body, '<row>', begin_row)
            begin_cell = begin_row
            for column in range(int(columns)):
                begin_cell = find_token(document.body, '<cell ', begin_cell)
                if document.body[begin_cell].find('multirow="3" mroffset=') != -1:
                    # we found a multirow in this column; store the column
                    # width, taken from the line begin_table + 2 + column
                    begin = document.body[begin_table + 2 + column].find('width="')
                    end = document.body[begin_table + 2 + column].find('">', begin)
                    col_width = document.body[begin_table + 2 + column][begin + 7:end]
                    # "0pt" means that no width is specified
                    if col_width == "0pt":
                        col_width = "*"
                    # determine the number of cells that are part of the
                    # multirow and turn the part cells into ordinary cells
                    span = _multirow_offset_span(document, begin_table, row, column)
                    # remove the multirow tag, set the valignment to top,
                    # remove the bottom line and offset
                    cell = document.body[begin_cell]
                    cell = cell.replace(' multirow="3" ', ' ')
                    cell = cell.replace('valignment="middle"', 'valignment="top"')
                    # only remove the bottom line if it is not a single cell as multirow
                    if span > 1:
                        cell = cell.replace(' bottomline="true" ', ' ')
                    cell = cell.replace(' mroffset=', '')
                    # store the offset and remove it; with the attribute
                    # name gone its value is the first quoted string
                    begin = cell.find('"')
                    end = cell.find('" ', begin)
                    offset = cell[begin + 1:end]
                    cell = cell.replace(cell[begin:end + 1], '')
                    document.body[begin_cell] = cell
                    # write ERT to create the multirow cell
                    _wrap_cell_in_multirow_ert(
                        document, begin_cell,
                        "\\multirow{" + str(span) + "}{" + col_width + "}[" + offset + "]{")
                # set index to end of current cell (that is now much bigger due to the ERT addition)
                begin_cell = find_token(document.body, '</cell>', begin_cell) + 1
            begin_row = find_token(document.body, '</row>', begin_row) + 1

        # go to the next table
        begin_table = end_table + 1

    # we only get here if a multirow cell with offset was found
    add_to_preamble(document, ["\\usepackage{multirow}"])
2292
2293
2294 ##
2295 # Conversion hub
2296 #
2297
supported_versions = ["2.0.0", "2.0"]

# Conversion routines by the format number they are listed under.  Formats
# of the range 346..407 that do not appear here have no routine.
_convert_steps = {
    352: [convert_splitindex],
    359: [convert_nomencl_width],
    369: [convert_author_id],
    373: [merge_gbrief],
    379: [convert_math_output],
    389: [convert_html_quotes],
    393: [convert_optarg],
    394: [convert_use_makebox],
    397: [remove_Nameref],
    399: [convert_mathdots],
    400: [convert_rule],
    402: [convert_bibtex_clearpage],
    403: [convert_flexnames],
    404: [convert_prettyref],
    406: [convert_passthru],
}

# One [format, routines] entry for every format from 346 up to 407.
convert = list([fmt, _convert_steps.get(fmt, [])] for fmt in range(346, 408))
2362
# Reversion routines, from the highest format number down to the lowest.
# Each entry is a format number followed by the routines listed for it; an
# entry without routines stands for a format that has none.
_revert_chain = (
    (406, revert_multirowOffset),
    (405, revert_passthru),
    (404,),
    (403, revert_refstyle),
    (402, revert_flexnames),
    (401,),
    (400, revert_diagram),
    (399, revert_rule),
    (398, revert_mathdots),
    (397, revert_mathrsfs),
    (396,),
    (395, revert_nameref),
    (394, revert_DIN_C_pagesizes),
    (393, revert_makebox),
    (392, revert_argument),
    (391,),
    (390, revert_align_decimal, revert_IEEEtran),
    (389, revert_output_sync),
    (388, revert_html_quotes),
    (387, revert_pagesizes),
    (386, revert_math_scale),
    (385, revert_lyx_version),
    (384, revert_shadedboxcolor),
    (383, revert_fontcolor),
    (382, revert_turkmen),
    (381, revert_notefontcolor),
    (380, revert_equalspacing_xymatrix),
    (379, revert_inset_preview),
    (378, revert_math_output),
    (377,),
    (376, revert_multirow),
    (375, revert_includeall),
    (374, revert_includeonly),
    (373, revert_html_options),
    (372, revert_gbrief),
    (371, revert_fontenc),
    (370, revert_mhchem),
    (369, revert_suppress_date),
    (368, revert_author_id),
    (367, revert_hspace_glue_lengths),
    (366, revert_percent_vspace_lengths, revert_percent_hspace_lengths),
    (365, revert_percent_skip_lengths),
    (364, revert_paragraph_indentation),
    (363, revert_branch_filename),
    (362, revert_longtable_align),
    (361, revert_applemac),
    (360,),
    (359, revert_nomencl_cwidth),
    (358, revert_nomencl_width),
    (357, revert_custom_processors),
    (356, revert_ulinelatex),
    (355,),
    (354, revert_strikeout),
    (353, revert_printindexall),
    (352, revert_subindex),
    (351, revert_splitindex),
    (350, revert_backgroundcolor),
    (349, revert_outputformat),
    (348, revert_xetex),
    (347, revert_phantom, revert_hphantom, revert_vphantom),
    (346, revert_tabularvalign),
    (345, revert_swiss),
)

# Expanded to [format, [routines...]] entries, in the order given above.
revert = list([step[0], list(step[1:])] for step in _revert_chain)


# The module does nothing when it is run as a script.
if __name__ == "__main__":
    pass