lib/lyx2lyx/lyx_1_4.py

   1 # This file is part of lyx2lyx
   2 # -*- coding: utf-8 -*-
   3 # Copyright (C) 2002 Dekel Tsur <dekel@lyx.org>
   4 # Copyright (C) 2002-2004 José Matos <jamatos@lyx.org>
   5 # Copyright (C) 2004-2005 Georg Baum <Georg.Baum@post.rwth-aachen.de>
   6 #
   7 # This program is free software; you can redistribute it and/or
   8 # modify it under the terms of the GNU General Public License
   9 # as published by the Free Software Foundation; either version 2
  10 # of the License, or (at your option) any later version.
  11 #
  12 # This program is distributed in the hope that it will be useful,
  13 # but WITHOUT ANY WARRANTY; without even the implied warranty of
  14 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  15 # GNU General Public License for more details.
  16 #
  17 # You should have received a copy of the GNU General Public License
  18 # along with this program; if not, write to the Free Software
  19 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
  20
  21 """ Convert files to the file format generated by lyx 1.4"""
  22
  23 import re
  24 from os import access, F_OK
  25 import os.path
  26 from parser_tools import check_token, find_token, \
  27                          get_value, del_token, is_nonempty_line, \
  28                          find_tokens, find_end_of, find_beginning_of, find_token_exact, find_tokens_exact, \
  29                          find_re, find_tokens_backwards
  30 from sys import stdin
  31
  32 from lyx_0_12 import update_latexaccents
  33
  34 ####################################################################
  35 # Private helper functions
  36
  37 def get_layout(line, default_layout):
  38     " Get layout, if empty return the default layout."
  39     tokens = line.split()
  40     if len(tokens) > 1:
  41         return tokens[1]
  42     return default_layout
  43
  44
  45 def get_paragraph(lines, i, format):
  46     "Finds the paragraph that contains line i."
  47
  48     if format < 225:
  49         begin_layout = "\\layout"
  50     else:
  51         begin_layout = "\\begin_layout"
  52     while i != -1:
  53         i = find_tokens_backwards(lines, ["\\end_inset", begin_layout], i)
  54         if i == -1: return -1
  55         if check_token(lines[i], begin_layout):
  56             return i
  57         i = find_beginning_of_inset(lines, i)
  58     return -1
  59
  60
  61 def find_beginning_of_inset(lines, i):
  62     " Find beginning of inset, where lines[i] is included."
  63     return find_beginning_of(lines, i, "\\begin_inset", "\\end_inset")
  64
  65
  66 def get_next_paragraph(lines, i, format):
  67     "Finds the paragraph after the paragraph that contains line i."
  68
  69     if format < 225:
  70         tokens = ["\\begin_inset", "\\layout", "\\end_float", "\\the_end"]
  71     elif format < 236:
  72         tokens = ["\\begin_inset", "\\begin_layout", "\\end_float", "\\end_document"]
  73     else:
  74         tokens = ["\\begin_inset", "\\begin_layout", "\\end_float", "\\end_body", "\\end_document"]
  75     while i != -1:
  76         i = find_tokens(lines, tokens, i)
  77         if not check_token(lines[i], "\\begin_inset"):
  78             return i
  79         i = find_end_of_inset(lines, i)
  80     return -1
  81
  82
  83 def find_end_of_inset(lines, i):
  84     "Finds the matching \end_inset"
  85     return find_end_of(lines, i, "\\begin_inset", "\\end_inset")
  86
  87 # End of helper functions
  88 ####################################################################
  89
  90 def remove_color_default(document):
  91     " Remove \color default"
  92     i = 0
  93     while 1:
  94         i = find_token(document.body, "\\color default", i)
  95         if i == -1:
  96             return
  97         document.body[i] = document.body[i].replace("\\color default",
  98                                                     "\\color inherit")
  99
 100
 101 def add_end_header(document):
 102     " Add \end_header"
 103     document.header.append("\\end_header");
 104
 105
 106 def rm_end_header(document):
 107     " Remove \end_header"
 108     i = find_token(document.header, "\\end_header", 0)
 109     if i == -1:
 110         return
 111     del document.header[i]
 112
 113
 114 def convert_amsmath(document):
 115     " Convert \\use_amsmath"
 116     i = find_token(document.header, "\\use_amsmath", 0)
 117     if i == -1:
 118         document.warning("Malformed LyX document: Missing '\\use_amsmath'.")
 119         return
 120     tokens = document.header[i].split()
 121     if len(tokens) != 2:
 122         document.warning("Malformed LyX document: Could not parse line '%s'." % document.header[i])
 123         use_amsmath = '0'
 124     else:
 125         use_amsmath = tokens[1]
 126     # old: 0 == off, 1 == on
 127     # new: 0 == off, 1 == auto, 2 == on
 128     # translate off -> auto, since old format 'off' means auto in reality
 129     if use_amsmath == '0':
 130         document.header[i] = "\\use_amsmath 1"
 131     else:
 132         document.header[i] = "\\use_amsmath 2"
 133
 134
 135 def revert_amsmath(document):
 136     " Revert \\use_amsmath"
 137     i = find_token(document.header, "\\use_amsmath", 0)
 138     if i == -1:
 139         document.warning("Malformed LyX document: Missing '\\use_amsmath'.")
 140         return
 141     tokens = document.header[i].split()
 142     if len(tokens) != 2:
 143         document.warning("Malformed LyX document: Could not parse line '%s'." % document.header[i])
 144         use_amsmath = '0'
 145     else:
 146         use_amsmath = tokens[1]
 147     # old: 0 == off, 1 == on
 148     # new: 0 == off, 1 == auto, 2 == on
 149     # translate auto -> off, since old format 'off' means auto in reality
 150     if use_amsmath == '2':
 151         document.header[i] = "\\use_amsmath 1"
 152     else:
 153         document.header[i] = "\\use_amsmath 0"
 154
 155
 156 def convert_spaces(document):
 157     " \SpecialChar ~ -> \InsetSpace ~"
 158     for i in range(len(document.body)):
 159         document.body[i] = document.body[i].replace("\\SpecialChar ~",
 160                                                     "\\InsetSpace ~")
 161
 162
 163 def revert_spaces(document):
 164     " \InsetSpace ~ -> \SpecialChar ~"
 165     regexp = re.compile(r'(.*)(\\InsetSpace\s+)(\S+)')
 166     i = 0
 167     while 1:
 168         i = find_re(document.body, regexp, i)
 169         if i == -1:
 170             break
 171         space = regexp.match(document.body[i]).group(3)
 172         prepend = regexp.match(document.body[i]).group(1)
 173         if space == '~':
 174             document.body[i] = regexp.sub(prepend + '\\SpecialChar ~', document.body[i])
 175             i = i + 1
 176         else:
 177             document.body[i] = regexp.sub(prepend, document.body[i])
 178             document.body[i+1:i+1] = ''
 179             if space == "\\space":
 180                 space = "\\ "
 181             i = insert_ert(document.body, i+1, 'Collapsed', space, document.format - 1, document.default_layout)
 182
 183
 184 def rename_spaces(document):
 185     """ \InsetSpace \, -> \InsetSpace \thinspace{}
 186         \InsetSpace \space -> \InsetSpace \space{}"""
 187     for i in range(len(document.body)):
 188         document.body[i] = document.body[i].replace("\\InsetSpace \\space",
 189                                                     "\\InsetSpace \\space{}")
 190         document.body[i] = document.body[i].replace("\\InsetSpace \,",
 191                                                     "\\InsetSpace \\thinspace{}")
 192
 193
 194 def revert_space_names(document):
 195     """ \InsetSpace \thinspace{} -> \InsetSpace \,
 196          \InsetSpace \space{} -> \InsetSpace \space"""
 197     for i in range(len(document.body)):
 198         document.body[i] = document.body[i].replace("\\InsetSpace \\space{}",
 199                                                     "\\InsetSpace \\space")
 200         document.body[i] = document.body[i].replace("\\InsetSpace \\thinspace{}",
 201                                                     "\\InsetSpace \\,")
 202
 203
 204 def lyx_support_escape(lab):
 205     " Equivalent to pre-unicode lyx::support::escape()"
 206     hexdigit = ['0', '1', '2', '3', '4', '5', '6', '7',
 207                 '8', '9', 'A', 'B', 'C', 'D', 'E', 'F']
 208     enc = ""
 209     for c in lab:
 210         o = ord(c)
 211         if o >= 128 or c == '=' or c == '%':
 212             enc = enc + '='
 213             enc = enc + hexdigit[o >> 4]
 214             enc = enc + hexdigit[o & 15]
 215         else:
 216             enc = enc + c
 217     return enc;
 218
 219
 220 def revert_eqref(document):
 221     "\\begin_inset LatexCommand \\eqref -> ERT"
 222     regexp = re.compile(r'^\\begin_inset\s+LatexCommand\s+\\eqref')
 223     i = 0
 224     while 1:
 225         i = find_re(document.body, regexp, i)
 226         if i == -1:
 227             break
 228         eqref = lyx_support_escape(regexp.sub("", document.body[i]))
 229         document.body[i:i+1] = ["\\begin_inset ERT", "status Collapsed", "",
 230                             '\\layout %s' % document.default_layout, "", "\\backslash ",
 231                             "eqref" + eqref]
 232         i = i + 7
 233
 234
 235 def convert_bibtex(document):
 236     " Convert BibTeX changes."
 237     for i in range(len(document.body)):
 238         document.body[i] = document.body[i].replace("\\begin_inset LatexCommand \\BibTeX",
 239                                                     "\\begin_inset LatexCommand \\bibtex")
 240
 241
 242 def revert_bibtex(document):
 243     " Revert BibTeX changes."
 244     for i in range(len(document.body)):
 245         document.body[i] = document.body[i].replace("\\begin_inset LatexCommand \\bibtex",
 246                                                     "\\begin_inset LatexCommand \\BibTeX")
 247
 248
 249 def remove_insetparent(document):
 250     " Remove \lyxparent"
 251     i = 0
 252     while 1:
 253         i = find_token(document.body, "\\begin_inset LatexCommand \\lyxparent", i)
 254         if i == -1:
 255             break
 256         del document.body[i:i+3]
 257
 258
 259 def convert_external(document):
 260     " Convert inset External."
 261     external_rexp = re.compile(r'\\begin_inset External ([^,]*),"([^"]*)",')
 262     external_header = "\\begin_inset External"
 263     i = 0
 264     while 1:
 265         i = find_token(document.body, external_header, i)
 266         if i == -1:
 267             break
 268         look = external_rexp.search(document.body[i])
 269         args = ['','']
 270         if look:
 271             args[0] = look.group(1)
 272             args[1] = look.group(2)
 273         #FIXME: if the previous search fails then warn
 274
 275         if args[0] == "RasterImage":
 276             # Convert a RasterImage External Inset to a Graphics Inset.
 277             top = "\\begin_inset Graphics"
 278             if args[1]:
 279                 filename = "\tfilename " + args[1]
 280             document.body[i:i+1] = [top, filename]
 281             i = i + 1
 282         else:
 283             # Convert the old External Inset format to the new.
 284             top = external_header
 285             template = "\ttemplate " + args[0]
 286             if args[1]:
 287                 filename = "\tfilename " + args[1]
 288                 document.body[i:i+1] = [top, template, filename]
 289                 i = i + 2
 290             else:
 291                 document.body[i:i+1] = [top, template]
 292                 i = i + 1
 293
 294
 295 def revert_external_1(document):
 296     " Revert inset External."
 297     external_header = "\\begin_inset External"
 298     i = 0
 299     while 1:
 300         i = find_token(document.body, external_header, i)
 301         if i == -1:
 302             break
 303
 304         template = document.body[i+1].split()
 305         template.reverse()
 306         del document.body[i+1]
 307
 308         filename = document.body[i+1].split()
 309         filename.reverse()
 310         del document.body[i+1]
 311
 312         params = document.body[i+1].split()
 313         params.reverse()
 314         if document.body[i+1]: del document.body[i+1]
 315
 316         document.body[i] = document.body[i] + " " + template[0]+ ', "' + filename[0] + '", " '+ " ".join(params[1:]) + '"'
 317         i = i + 1
 318
 319
 320 def revert_external_2(document):
 321     " Revert inset External. (part II)"
 322     draft_token = '\tdraft'
 323     i = 0
 324     while 1:
 325         i = find_token(document.body, '\\begin_inset External', i)
 326         if i == -1:
 327             break
 328         j = find_end_of_inset(document.body, i + 1)
 329         if j == -1:
 330             #this should not happen
 331             break
 332         k = find_token(document.body, draft_token, i+1, j-1)
 333         if (k != -1 and len(draft_token) == len(document.body[k])):
 334             del document.body[k]
 335         i = j + 1
 336
 337
def convert_comment(document):
    r"""Convert ``\layout Comment`` paragraphs into Comment insets.

    Each run of consecutive ``\layout Comment`` paragraphs is wrapped into one
    collapsed ``\begin_inset Comment`` placed inside a paragraph of the
    default layout.  The comment paragraphs themselves become default-layout
    paragraphs inside that inset.
    """
    i = 0
    comment = "\\layout Comment"
    while 1:
        i = find_token(document.body, comment, i)
        if i == -1:
            return

        # Replace the "\layout Comment" line by: a default-layout paragraph,
        # the opening of the Comment inset, and the first paragraph inside it.
        document.body[i:i+1] = ['\\layout %s' % document.default_layout,"","",
                        "\\begin_inset Comment",
                        "collapsed true","",
                        '\\layout %s' % document.default_layout]
        # Seven lines were written; continue right after them.
        i = i + 7

        # Walk over the following paragraphs until the run of comment
        # paragraphs ends, then close the inset.
        while 1:
                old_i = i
                i = find_token(document.body, "\\layout", i)
                if i == -1:
                    # No further paragraph: close the inset just before the
                    # last line of the body.
                    i = len(document.body) - 1
                    document.body[i:i] = ["\\end_inset","",""]
                    return

                # Look for a \begin_deeper or \begin_inset between the
                # previous position and the \layout line just found.  "i + 1"
                # serves as the "none before i" marker.
                j = find_token(document.body, '\\begin_deeper', old_i, i)
                if j == -1: j = i + 1
                k = find_token(document.body, '\\begin_inset', old_i, i)
                if k == -1: k = i + 1

                if j < i and j < k:
                    # A \begin_deeper comes first: delete it together with the
                    # \end_deeper that find_end_of reports for it.
                    i = j
                    del document.body[i]
                    i = find_end_of( document.body, i, "\\begin_deeper","\\end_deeper")
                    if i == -1:
                        # This case should not happen, but if it does, deal
                        # with it gracefully by adding the missing
                        # \end_deeper.
                        i = len(document.body) - 1
                        document.body[i:i] = ["\\end_deeper",""]
                        return
                    else:
                        del document.body[i]
                        continue

                if k < i:
                    # An inset starts before the next paragraph: skip it as a
                    # whole.
                    i = k
                    i = find_end_of( document.body, i, "\\begin_inset","\\end_inset")
                    if i == -1:
                        # This case should not happen, but if it does, deal
                        # with it gracefully by adding the missing
                        # \end_inset.
                        i = len(document.body) - 1
                        document.body[i:i] = ["\\end_inset","","","\\end_inset","",""]
                        return
                    else:
                        i = i + 1
                        continue

                if document.body[i].find(comment) == -1:
                    # The next paragraph is not a comment: close the inset in
                    # front of it and go back to the outer search.
                    document.body[i:i] = ["\\end_inset"]
                    i = i + 1
                    break
                # Another comment paragraph: keep it inside the inset as a
                # default-layout paragraph.
                document.body[i:i+1] = ['\\layout %s' % document.default_layout]
                i = i + 1
 401
 402
 403 def revert_comment(document):
 404     " Revert comments"
 405     i = 0
 406     while 1:
 407         i = find_tokens(document.body, ["\\begin_inset Comment", "\\begin_inset Greyedout"], i)
 408
 409         if i == -1:
 410             return
 411         document.body[i] = "\\begin_inset Note"
 412         i = i + 1
 413
 414
def add_end_layout(document):
    r"""Add the ``\end_layout`` lines that close ``\layout`` paragraphs.

    The body is scanned for structural tokens while a stack of the currently
    open ``\layout`` / ``\begin_inset`` / ``\begin_deeper`` tokens is kept.
    An ``\end_layout`` line is inserted wherever an open paragraph ends.
    A body without ``\the_end`` is reported through ``document.warning`` and
    gets one appended.
    """
    i = find_token(document.body, '\\layout', 0)

    if i == -1:
        return

    i = i + 1
    # Tokens of the structures that are currently open, innermost last.
    struct_stack = ["\\layout"]

    while 1:
        i = find_tokens(document.body, ["\\begin_inset", "\\end_inset", "\\layout",
                                "\\begin_deeper", "\\end_deeper", "\\the_end"], i)

        if i != -1:
            token = document.body[i].split()[0]
        else:
            # No structural token left: append the missing \the_end and let
            # the final case below close the open paragraph.
            document.warning("Truncated document.")
            i = len(document.body)
            document.body.insert(i, '\\the_end')
            token = ""

        if token == "\\begin_inset":
            struct_stack.append(token)
            i = i + 1
            continue

        if token == "\\end_inset":
            tail = struct_stack.pop()
            if tail == "\\layout":
                # A paragraph is still open inside the inset: close it in
                # front of the \end_inset line ("\end_layout" plus an empty
                # line), then skip the two inserted lines.
                document.body.insert(i,"")
                document.body.insert(i,"\\end_layout")
                i = i + 2
                #Check if it is the correct tag
                struct_stack.pop()
            i = i + 1
            continue

        if token == "\\layout":
            tail = struct_stack.pop()
            if tail == token:
                # The previous paragraph is still open: close it first.
                document.body.insert(i,"")
                document.body.insert(i,"\\end_layout")
                i = i + 3
            else:
                # The innermost open structure is not a paragraph; put it
                # back on the stack.
                struct_stack.append(tail)
                i = i + 1
            struct_stack.append(token)
            continue

        if token == "\\begin_deeper":
            document.body.insert(i,"")
            document.body.insert(i,"\\end_layout")
            i = i + 3
            # consecutive begin_deeper only insert one end_layout
            while document.body[i].startswith('\\begin_deeper'):
                i += 1
            struct_stack.append(token)
            continue

        if token == "\\end_deeper":
            if struct_stack[-1] == '\\layout':
                document.body.insert(i, '\\end_layout')
                i = i + 1
                struct_stack.pop()
            i = i + 1
            continue

        # Remaining case: \the_end was reached (token is "" when it had to
        # be appended above).  Close the last paragraph in front of it.
        document.body.insert(i, "")
        document.body.insert(i, "\\end_layout")
        return
 487
 488
 489 def rm_end_layout(document):
 490     " Remove \end_layout"
 491     i = 0
 492     while 1:
 493         i = find_token(document.body, '\\end_layout', i)
 494
 495         if i == -1:
 496             return
 497
 498         del document.body[i]
 499
 500
 501 def insert_tracking_changes(document):
 502     " Handle change tracking keywords."
 503     i = find_token(document.header, "\\tracking_changes", 0)
 504     if i == -1:
 505         document.header.append("\\tracking_changes 0")
 506
 507
 508 def rm_tracking_changes(document):
 509     " Remove change tracking keywords."
 510     i = find_token(document.header, "\\author", 0)
 511     if i != -1:
 512         del document.header[i]
 513
 514     i = find_token(document.header, "\\tracking_changes", 0)
 515     if i == -1:
 516         return
 517     del document.header[i]
 518
 519
 520 def rm_body_changes(document):
 521     " Remove body changes."
 522     i = 0
 523     while 1:
 524         i = find_token(document.body, "\\change_", i)
 525         if i == -1:
 526             return
 527
 528         del document.body[i]
 529
 530
 531 def layout2begin_layout(document):
 532     " \layout -> \begin_layout "
 533     i = 0
 534     while 1:
 535         i = find_token(document.body, '\\layout', i)
 536         if i == -1:
 537             return
 538
 539         document.body[i] = document.body[i].replace('\\layout', '\\begin_layout')
 540         i = i + 1
 541
 542
 543 def begin_layout2layout(document):
 544     " \begin_layout -> \layout "
 545     i = 0
 546     while 1:
 547         i = find_token(document.body, '\\begin_layout', i)
 548         if i == -1:
 549             return
 550
 551         document.body[i] = document.body[i].replace('\\begin_layout', '\\layout')
 552         i = i + 1
 553
 554
 555 def convert_valignment_middle(body, start, end):
 556     'valignment="center" -> valignment="middle"'
 557     for i in range(start, end):
 558         if re.search('^<(column|cell) .*valignment="center".*>$', body[i]):
 559             body[i] = body[i].replace('valignment="center"', 'valignment="middle"')
 560
 561
 562 def convert_table_valignment_middle(document):
 563     " Convert table  valignment, center -> middle"
 564     regexp = re.compile(r'^\\begin_inset\s+Tabular')
 565     i = 0
 566     while 1:
 567         i = find_re(document.body, regexp, i)
 568         if i == -1:
 569             return
 570         j = find_end_of_inset(document.body, i + 1)
 571         if j == -1:
 572             #this should not happen
 573             convert_valignment_middle(document.body, i + 1, len(document.body))
 574             return
 575         convert_valignment_middle(document.body, i + 1, j)
 576         i = j + 1
 577
 578
 579 def revert_table_valignment_middle(body, start, end):
 580     " valignment, middle -> center"
 581     for i in range(start, end):
 582         if re.search('^<(column|cell) .*valignment="middle".*>$', body[i]):
 583             body[i] = body[i].replace('valignment="middle"', 'valignment="center"')
 584
 585
 586 def revert_valignment_middle(document):
 587     " Convert table  valignment, middle -> center"
 588     regexp = re.compile(r'^\\begin_inset\s+Tabular')
 589     i = 0
 590     while 1:
 591         i = find_re(document.body, regexp, i)
 592         if i == -1:
 593             return
 594         j = find_end_of_inset(document.body, i + 1)
 595         if j == -1:
 596             #this should not happen
 597             revert_table_valignment_middle(document.body, i + 1, len(document.body))
 598             return
 599         revert_table_valignment_middle(document.body, i + 1, j)
 600         i = j + 1
 601
 602
 603 def convert_end_document(document):
 604     "\\the_end -> \\end_document"
 605     i = find_token(document.body, "\\the_end", 0)
 606     if i == -1:
 607         document.body.append("\\end_document")
 608         return
 609     document.body[i] = "\\end_document"
 610
 611
 612 def revert_end_document(document):
 613     "\\end_document -> \\the_end"
 614     i = find_token(document.body, "\\end_document", 0)
 615     if i == -1:
 616         document.body.append("\\the_end")
 617         return
 618     document.body[i] = "\\the_end"
 619
 620
def convert_breaks(document):
    r"""
Convert line and page breaks

The paragraph parameters \line_top, \line_bottom, \pagebreak_top,
\pagebreak_bottom, \added_space_top and \added_space_bottom are removed from
the parameter line and replaced by \lyxline, \newpage and VSpace insets that
are placed in the paragraph itself or, for nonstandard paragraphs, in extra
paragraphs of the default layout above and below it.

 Old:
\layout Standard
\line_top \line_bottom \pagebreak_top \pagebreak_bottom \added_space_top xxx \added_space_bottom yyy
0

 New:
\begin_layout Standard

\newpage

\lyxline
\begin_inset ERT
\begin_layout Standard
\backslash
vspace{-1\backslash
parskip}
\end_layout
\end_inset

\begin_inset VSpace xxx
\end_inset

0

\begin_inset VSpace yyy
\end_inset
\lyxline

\newpage

\end_layout
    """
    # Names (without the leading backslash) of the paragraph parameters that
    # are merged into one line below.
    par_params = ('added_space_bottom', 'added_space_top', 'align',
                 'labelwidthstring', 'line_bottom', 'line_top', 'noindent',
                 'pagebreak_bottom', 'pagebreak_top', 'paragraph_spacing',
                 'start_of_appendix')
    # Font attributes and, at the same index, the value each one is reset to
    # before material is added at the end of a standard paragraph.
    font_attributes = ['\\family', '\\series', '\\shape', '\\emph',
                       '\\numeric', '\\bar', '\\noun', '\\color', '\\lang']
    attribute_values = ['default', 'default', 'default', 'default',
                        'default', 'default', 'default', 'none', document.language]
    i = 0
    while 1:
        i = find_token(document.body, "\\begin_layout", i)
        if i == -1:
            return
        layout = get_layout(document.body[i], document.default_layout)
        # i now refers to the line right after \begin_layout.
        i = i + 1

        # Merge all paragraph parameters into a single line
        # We cannot check for '\\' only because paragraphs may start e.g.
        # with '\\backslash'
        while document.body[i + 1][:1] == '\\' and document.body[i + 1][1:].split()[0] in par_params:
            document.body[i] = document.body[i + 1] + ' ' + document.body[i]
            del document.body[i+1]

        # Position of each break-related parameter in the merged line
        # (-1 when absent).
        line_top   = document.body[i].find("\\line_top")
        line_bot   = document.body[i].find("\\line_bottom")
        pb_top     = document.body[i].find("\\pagebreak_top")
        pb_bot     = document.body[i].find("\\pagebreak_bottom")
        vspace_top = document.body[i].find("\\added_space_top")
        vspace_bot = document.body[i].find("\\added_space_bottom")

        # Nothing to convert in this paragraph.
        if line_top == -1 and line_bot == -1 and pb_bot == -1 and pb_top == -1 and vspace_top == -1 and vspace_bot == -1:
            continue

        # Do we have a nonstandard paragraph? We need to create new paragraphs
        # if yes to avoid putting lyxline etc. inside of special environments.
        # This is wrong for itemize and enumerate environments, but it is
        # impossible to convert these correctly.
        # We want to avoid new paragraphs if possible because we want to
        # inherit font sizes.
        nonstandard = 0
        if (not document.is_default_layout(layout) or
            document.body[i].find("\\align") != -1 or
            document.body[i].find("\\labelwidthstring") != -1 or
            document.body[i].find("\\noindent") != -1):
            nonstandard = 1

        # get the font size of the beginning of this paragraph, since we need
        # it for the lyxline inset
        j = i + 1
        while not is_nonempty_line(document.body[j]):
            j = j + 1
        size_top = ""
        if document.body[j].find("\\size") != -1:
            size_top = document.body[j].split()[1]

        # Strip the value-less parameters from the parameter line.
        for tag in "\\line_top", "\\line_bottom", "\\pagebreak_top", "\\pagebreak_bottom":
            document.body[i] = document.body[i].replace(tag, "")

        if vspace_top != -1:
            # the position may have changed because of the removal of other
            # paragraph properties above
            vspace_top = document.body[i].find("\\added_space_top")
            tmp_list = document.body[i][vspace_top:].split()
            # The word after the keyword is the amount of space; the keyword
            # and its value are cut out of the line.
            vspace_top_value = tmp_list[1]
            document.body[i] = document.body[i][:vspace_top] + " ".join(tmp_list[2:])

        if vspace_bot != -1:
            # the position may have changed because of the removal of other
            # paragraph properties above
            vspace_bot = document.body[i].find("\\added_space_bottom")
            tmp_list = document.body[i][vspace_bot:].split()
            vspace_bot_value = tmp_list[1]
            document.body[i] = document.body[i][:vspace_bot] + " ".join(tmp_list[2:])

        document.body[i] = document.body[i].strip()
        i = i + 1

        # Create an empty paragraph or paragraph fragment for line and
        # page break that belong above the paragraph
        if pb_top !=-1 or line_top != -1 or vspace_top != -1:

            paragraph_above = list()
            if nonstandard:
                # We need to create an extra paragraph for nonstandard environments
                paragraph_above = ['\\begin_layout %s' % document.default_layout, '']

            if pb_top != -1:
                paragraph_above.extend(['\\newpage ',''])

            if vspace_top != -1:
                paragraph_above.extend(['\\begin_inset VSpace ' + vspace_top_value,'\\end_inset','',''])

            if line_top != -1:
                if size_top != '':
                    paragraph_above.extend(['\\size ' + size_top + ' '])
                # We need an additional vertical space of -\parskip.
                # We can't use the vspace inset because it does not know \parskip.
                paragraph_above.extend(['\\lyxline ', '', ''])
                insert_ert(paragraph_above, len(paragraph_above) - 1, 'Collapsed',
                           '\\vspace{-1\\parskip}\n', document.format + 1, document.default_layout)
                paragraph_above.extend([''])

            if nonstandard:
                paragraph_above.extend(['\\end_layout ',''])
                # insert new paragraph above the current paragraph
                # (i - 2 is the \begin_layout line of the current paragraph)
                document.body[i-2:i-2] = paragraph_above
            else:
                # insert new lines at the beginning of the current paragraph
                document.body[i:i] = paragraph_above

            i = i + len(paragraph_above)

        # Ensure that nested style are converted later.
        k = find_end_of(document.body, i, "\\begin_layout", "\\end_layout")

        if k == -1:
            return

        if pb_bot !=-1 or line_bot != -1 or vspace_bot != -1:

            # get the font size of the end of this paragraph
            size_bot = size_top
            j = i + 1
            # NOTE(review): if find_end_of_inset returns -1 for an
            # unterminated inset, j restarts below k -- confirm this cannot
            # loop forever.
            while j < k:
                if document.body[j].find("\\size") != -1:
                    size_bot = document.body[j].split()[1]
                    j = j + 1
                elif document.body[j].find("\\begin_inset") != -1:
                    # skip insets
                    j = find_end_of_inset(document.body, j)
                else:
                    j = j + 1

            paragraph_below = list()
            if nonstandard:
                # We need to create an extra paragraph for nonstandard environments
                paragraph_below = ['', '\\begin_layout %s' % document.default_layout, '']
            else:
                # Reset every font attribute that is set somewhere in the
                # paragraph before the new material is added.
                for a in range(len(font_attributes)):
                    if find_token(document.body, font_attributes[a], i, k) != -1:
                        paragraph_below.extend([font_attributes[a] + ' ' + attribute_values[a]])

            if line_bot != -1:
                if nonstandard and size_bot != '':
                    paragraph_below.extend(['\\size ' + size_bot + ' '])
                paragraph_below.extend(['\\lyxline ',''])
                if size_bot != '':
                    paragraph_below.extend(['\\size default '])

            if vspace_bot != -1:
                paragraph_below.extend(['\\begin_inset VSpace ' + vspace_bot_value,'\\end_inset','',''])

            if pb_bot != -1:
                paragraph_below.extend(['\\newpage ',''])

            if nonstandard:
                paragraph_below.extend(['\\end_layout '])
                # insert new paragraph below the current paragraph
                # (k is the \end_layout line of the current paragraph)
                document.body[k+1:k+1] = paragraph_below
            else:
                # insert new lines at the end of the current paragraph
                document.body[k:k] = paragraph_below
 818
 819
 820 def convert_note(document):
 821     " Convert Notes. "
 822     i = 0
 823     while 1:
 824         i = find_tokens(document.body, ["\\begin_inset Note",
 825                                 "\\begin_inset Comment",
 826                                 "\\begin_inset Greyedout"], i)
 827         if i == -1:
 828             break
 829
 830         document.body[i] = document.body[i][0:13] + 'Note ' + document.body[i][13:]
 831         i = i + 1
 832
 833
 834 def revert_note(document):
 835     " Revert Notes. "
 836     note_header = "\\begin_inset Note "
 837     i = 0
 838     while 1:
 839         i = find_token(document.body, note_header, i)
 840         if i == -1:
 841             break
 842
 843         document.body[i] = "\\begin_inset " + document.body[i][len(note_header):]
 844         i = i + 1
 845
 846
 847 def convert_box(document):
 848     " Convert Boxes. "
 849     i = 0
 850     while 1:
 851         i = find_tokens(document.body, ["\\begin_inset Boxed",
 852                                 "\\begin_inset Doublebox",
 853                                 "\\begin_inset Frameless",
 854                                 "\\begin_inset ovalbox",
 855                                 "\\begin_inset Ovalbox",
 856                                 "\\begin_inset Shadowbox"], i)
 857         if i == -1:
 858             break
 859
 860         document.body[i] = document.body[i][0:13] + 'Box ' + document.body[i][13:]
 861         i = i + 1
 862
 863
 864 def revert_box(document):
 865     " Revert Boxes."
 866     box_header = "\\begin_inset Box "
 867     i = 0
 868     while 1:
 869         i = find_token(document.body, box_header, i)
 870         if i == -1:
 871             break
 872
 873         document.body[i] = "\\begin_inset " + document.body[i][len(box_header):]
 874         i = i + 1
 875
 876
 877 def convert_collapsable(document):
 878     " Convert collapsed insets. "
 879     i = 0
 880     while 1:
 881         i = find_tokens_exact(document.body, ["\\begin_inset Box",
 882                                 "\\begin_inset Branch",
 883                                 "\\begin_inset CharStyle",
 884                                 "\\begin_inset Float",
 885                                 "\\begin_inset Foot",
 886                                 "\\begin_inset Marginal",
 887                                 "\\begin_inset Note",
 888                                 "\\begin_inset OptArg",
 889                                 "\\begin_inset Wrap"], i)
 890         if i == -1:
 891             break
 892
 893         # Seach for a line starting 'collapsed'
 894         # If, however, we find a line starting '\begin_layout'
 895         # (_always_ present) then break with a warning message
 896         i = i + 1
 897         while 1:
 898             if (document.body[i] == "collapsed false"):
 899                 document.body[i] = "status open"
 900                 break
 901             elif (document.body[i] == "collapsed true"):
 902                 document.body[i] = "status collapsed"
 903                 break
 904             elif (document.body[i][:13] == "\\begin_layout"):
 905                 document.warning("Malformed LyX document: Missing 'collapsed'.")
 906                 break
 907             i = i + 1
 908
 909         i = i + 1
 910
 911
 912 def revert_collapsable(document):
 913     " Revert collapsed insets. "
 914     i = 0
 915     while 1:
 916         i = find_tokens_exact(document.body, ["\\begin_inset Box",
 917                                 "\\begin_inset Branch",
 918                                 "\\begin_inset CharStyle",
 919                                 "\\begin_inset Float",
 920                                 "\\begin_inset Foot",
 921                                 "\\begin_inset Marginal",
 922                                 "\\begin_inset Note",
 923                                 "\\begin_inset OptArg",
 924                                 "\\begin_inset Wrap"], i)
 925         if i == -1:
 926             break
 927
 928         # Seach for a line starting 'status'
 929         # If, however, we find a line starting '\begin_layout'
 930         # (_always_ present) then break with a warning message
 931         i = i + 1
 932         while 1:
 933             if (document.body[i] == "status open"):
 934                 document.body[i] = "collapsed false"
 935                 break
 936             elif (document.body[i] == "status collapsed" or
 937                   document.body[i] == "status inlined"):
 938                 document.body[i] = "collapsed true"
 939                 break
 940             elif (document.body[i][:13] == "\\begin_layout"):
 941                 document.warning("Malformed LyX document: Missing 'status'.")
 942                 break
 943             i = i + 1
 944
 945         i = i + 1
 946
 947
 948 def convert_ert(document):
 949     " Convert ERT. "
 950     i = 0
 951     while 1:
 952         i = find_token(document.body, "\\begin_inset ERT", i)
 953         if i == -1:
 954             break
 955
 956         # Seach for a line starting 'status'
 957         # If, however, we find a line starting '\begin_layout'
 958         # (_always_ present) then break with a warning message
 959         i = i + 1
 960         while 1:
 961             if (document.body[i] == "status Open"):
 962                 document.body[i] = "status open"
 963                 break
 964             elif (document.body[i] == "status Collapsed"):
 965                 document.body[i] = "status collapsed"
 966                 break
 967             elif (document.body[i] == "status Inlined"):
 968                 document.body[i] = "status inlined"
 969                 break
 970             elif (document.body[i][:13] == "\\begin_layout"):
 971                 document.warning("Malformed LyX document: Missing 'status'.")
 972                 break
 973             i = i + 1
 974
 975         i = i + 1
 976
 977
 978 def revert_ert(document):
 979     " Revert ERT. "
 980     i = 0
 981     while 1:
 982         i = find_token(document.body, "\\begin_inset ERT", i)
 983         if i == -1:
 984             break
 985
 986         # Seach for a line starting 'status'
 987         # If, however, we find a line starting '\begin_layout'
 988         # (_always_ present) then break with a warning message
 989         i = i + 1
 990         while 1:
 991             if (document.body[i] == "status open"):
 992                 document.body[i] = "status Open"
 993                 break
 994             elif (document.body[i] == "status collapsed"):
 995                 document.body[i] = "status Collapsed"
 996                 break
 997             elif (document.body[i] == "status inlined"):
 998                 document.body[i] = "status Inlined"
 999                 break
1000             elif (document.body[i][:13] == "\\begin_layout"):
1001                 document.warning("Malformed LyX document : Missing 'status'.")
1002                 break
1003             i = i + 1
1004
1005         i = i + 1
1006
1007
def convert_minipage(document):
    """ Convert minipages to the box inset.
    We try to use the same order of arguments as lyx does.

    Every '\\begin_inset Minipage' header becomes '\\begin_inset Box Frameless'
    and the parameter lines that follow it are rewritten in place: the
    optional old lines (position, inner_position, height, width, collapsed)
    are consumed in that order and replaced by the full parameter list of
    the box inset, using defaults for lines that are missing.
    """
    # Old numeric codes are indices into these lists
    pos = ["t","c","b"]
    inner_pos = ["c","t","b","s"]

    i = 0
    while 1:
        i = find_token(document.body, "\\begin_inset Minipage", i)
        if i == -1:
            return

        document.body[i] = "\\begin_inset Box Frameless"
        i = i + 1

        # convert old to new position using the pos list
        if document.body[i][:8] == "position":
            # the single digit right after 'position ' is the old code
            document.body[i] = 'position "%s"' % pos[int(document.body[i][9])]
        else:
            document.body.insert(i, 'position "%s"' % pos[0])
        i = i + 1

        document.body.insert(i, 'hor_pos "c"')
        i = i + 1
        document.body.insert(i, 'has_inner_box 1')
        i = i + 1

        # convert the inner_position
        if document.body[i][:14] == "inner_position":
            innerpos = inner_pos[int(document.body[i][15])]
            del document.body[i]
        else:
            innerpos = inner_pos[0]

        # We need this since the new file format has a height and width
        # in a different order.
        if document.body[i][:6] == "height":
            height = document.body[i][6:]
            # test for default value of 221 and convert it accordingly
            if height == ' "0pt"' or height == ' "0"':
                height = ' "1pt"'
            del document.body[i]
        else:
            height = ' "1pt"'

        if document.body[i][:5] == "width":
            width = document.body[i][5:]
            del document.body[i]
        else:
            width = ' "0"'

        if document.body[i][:9] == "collapsed":
            # The value is separated from the keyword by a blank, so it
            # has to be stripped before it can be compared.
            if document.body[i][9:].strip() == "true":
                status = "collapsed"
            else:
                status = "open"
            del document.body[i]
        else:
            status = "collapsed"

        # Handle special default case:
        if height == ' "1pt"' and innerpos == 'c':
            innerpos = 't'

        # height and width still carry their leading blank, so they are
        # appended to the keyword without a separator
        document.body.insert(i, 'inner_pos "' + innerpos + '"')
        i = i + 1
        document.body.insert(i, 'use_parbox 0')
        i = i + 1
        document.body.insert(i, 'width' + width)
        i = i + 1
        document.body.insert(i, 'special "none"')
        i = i + 1
        document.body.insert(i, 'height' + height)
        i = i + 1
        document.body.insert(i, 'height_special "totalheight"')
        i = i + 1
        document.body.insert(i, 'status ' + status)
        i = i + 1
1087
1088
def convert_ertbackslash(body, i, ert, format, default_layout):
    r""" Append the text ert to body[i] as valid ERT code.
    A backslash is written as '\backslash ' and followed by a fresh line.
    A '\n' starts a new line: via '\newline ' for format <= 240, via a new
    default_layout paragraph otherwise.
    Return the (maybe incremented) line index i"""

    for char in ert:
        if char == '\n':
            if format > 240:
                inserted = ['\\end_layout', '', '\\begin_layout %s' % default_layout, '']
            else:
                inserted = ['\\newline ', '']
            # body[i] stays untouched, the text continues on the last
            # (empty) inserted line
            body[i + 1:i + 1] = inserted
            i += len(inserted)
        elif char == '\\':
            body[i] += '\\backslash '
            i += 1
            body.insert(i, '')
        else:
            body[i] += char
    return i
1109
1110
def ert2latex(lines, format):
    r""" Return the LaTeX code contained in the ERT lines.
    A trailing '\backslash' token becomes a backslash. A paragraph start
    becomes '\n\n' (format <= 240) or '\n', and for format <= 240 a trailing
    '\newline' token becomes '\n'. For format > 224 '\end_layout' lines are
    dropped.
    The surrounding \begin_layout ... \end_layout pair must not be included"""

    backslash_re = re.compile(r'\\backslash\s*$')
    newline_re = re.compile(r'\\newline\s*$')
    end_layout_re = re.compile(r'\\end_layout\s*$')
    if format > 224:
        begin_layout_re = re.compile(r'\\begin_layout\s*\S+$')
    else:
        begin_layout_re = re.compile(r'\\layout\s*\S+$')

    pieces = []
    for raw in lines:
        text = backslash_re.sub('\\\\', raw)
        starts_paragraph = begin_layout_re.match(text)
        if starts_paragraph and format <= 240:
            text = '\n\n'
        elif starts_paragraph:
            text = '\n'
        elif format <= 240:
            text = newline_re.sub('\n', text)
        if format > 224 and end_layout_re.match(text):
            text = ''
        pieces.append(text)
    return ''.join(pieces)
1137
1138
def get_par_params(lines, i):
    """ get all paragraph parameters. They can be all on one line or on several lines.
    lines[i] must be the first parameter line.
    Return the stripped parameter lines joined by single blanks, or an empty
    string if lines[i] is not a parameter line. Collecting stops at the
    first line that does not start with a known parameter or at the end of
    lines."""
    par_params = ('added_space_bottom', 'added_space_top', 'align',
                 'labelwidthstring', 'line_bottom', 'line_top', 'noindent',
                 'pagebreak_bottom', 'pagebreak_top', 'paragraph_spacing',
                 'start_of_appendix')
    # We cannot check for '\\' only because paragraphs may start e.g.
    # with '\\backslash'
    found = []
    while i < len(lines):
        line = lines[i]
        if line[:1] != '\\':
            break
        words = line[1:].split()
        # A lone backslash has no keyword at all
        if not words or words[0] not in par_params:
            break
        found.append(line.strip())
        i = i + 1
    return ' '.join(found)
1153
1154
def lyxsize2latexsize(lyxsize):
    " Return the LaTeX font size command for a LyX font size, '' if unknown. "
    latex_names = {
        "tiny": "tiny",
        "scriptsize": "scriptsize",
        "footnotesize": "footnotesize",
        "small": "small",
        "normal": "normalsize",
        "large": "large",
        "larger": "Large",
        "largest": "LARGE",
        "huge": "huge",
        "giant": "Huge",
    }
    latex_name = latex_names.get(lyxsize)
    if latex_name is None:
        return ''
    return '\\' + latex_name
1164
1165
def revert_breaks(document):
    """ Change vspace insets, page breaks and lyxlines to paragraph options
    (if possible) or ERT.

    The body is scanned for VSpace insets, lyxline and newpage tokens. For
    each hit the directly following tokens of these kinds are collected and
    then handled in one of three ways:
    - If they fill a paragraph of their own that has no parameters, they are
      merged as bottom parameters into the previous paragraph or as top
      parameters into the next one and the paragraph is removed.
    - If they are at the beginning or at the end of a paragraph, they become
      top or bottom parameters of that paragraph.
    - Otherwise (or if the target paragraph already has the parameter) only
      the first token is converted to ERT; the remaining ones are handled by
      the following loop runs."""

    # Get default spaceamount
    i = find_token(document.header, '\\defskip', 0)
    if i == -1:
        defskipamount = 'medskip'
    else:
        defskipamount = document.header[i].split()[1]

    # First word of a token line -> internal inset name
    keys = {"\\begin_inset" : "vspace", "\\lyxline" : "lyxline",
            "\\newpage" : "newpage"}
    # Internal inset name -> paragraph parameter
    keywords_top = {"vspace" : "\\added_space_top", "lyxline" : "\\line_top",
                    "newpage" : "\\pagebreak_top"}
    keywords_bot = {"vspace" : "\\added_space_bottom", "lyxline" : "\\line_bottom",
                    "newpage" : "\\pagebreak_bottom"}
    tokens = ["\\begin_inset VSpace", "\\lyxline", "\\newpage"]

    # Convert the insets
    i = 0
    while 1:
        i = find_tokens(document.body, tokens, i)
        if i == -1:
            return

        # Are we at the beginning of a paragraph?
        paragraph_start = 1
        this_par = get_paragraph(document.body, i, document.format - 1)
        start = this_par + 1
        params = get_par_params(document.body, start)
        size = "normal"
        # Paragraph parameters may be on one or more lines.
        # Find the start of the real paragraph text.
        # (params is a string, so 'in' is a substring test here)
        while document.body[start][:1] == '\\' and document.body[start].split()[0] in params:
            start = start + 1
        for k in range(start, i):
            if document.body[k].find("\\size") != -1:
                # store font size
                size = document.body[k].split()[1]
            elif is_nonempty_line(document.body[k]):
                paragraph_start = 0
                break
        # Find the end of the real paragraph text.
        next_par = get_next_paragraph(document.body, i, document.format - 1)
        if next_par == -1:
            document.warning("Malformed LyX document: Missing next paragraph.")
            i = i + 1
            continue

        # first line of our insets
        inset_start = i
        # last line of our insets
        inset_end = inset_start
        # Are we at the end of a paragraph?
        paragraph_end = 1
        # start and end line numbers to delete if we convert this inset
        del_lines = list()
        # is this inset a lyxline above a paragraph?
        top = list()
        # raw inset information
        lines = list()
        # name of this inset
        insets = list()
        # font size of this inset
        sizes = list()

        # Detect subsequent lyxline, vspace and pagebreak insets created by convert_breaks()
        n = 0
        k = inset_start
        while k < next_par:
            if find_tokens(document.body, tokens, k) == k:
                # inset to convert
                lines.append(document.body[k].split())
                insets.append(keys[lines[n][0]])
                del_lines.append([k, k])
                top.append(0)
                sizes.append(size)
                n = n + 1
                inset_end = k
            elif document.body[k].find("\\size") != -1:
                # store font size
                size = document.body[k].split()[1]
            elif find_token(document.body, "\\begin_inset ERT", k) == k:
                ert_begin = find_token(document.body, "\\layout", k) + 1
                if ert_begin == 0:
                    document.warning("Malformed LyX document: Missing '\\layout'.")
                    # Step over the broken inset header; without this the
                    # same line would be examined forever.
                    k = k + 1
                    continue
                ert_end = find_end_of_inset(document.body, k)
                if ert_end == -1:
                    document.warning("Malformed LyX document: Missing '\\end_inset'.")
                    # See above: advance before continuing.
                    k = k + 1
                    continue
                ert = ert2latex(document.body[ert_begin:ert_end], document.format - 1)
                if (n > 0 and insets[n - 1] == "lyxline" and
                    ert == '\\vspace{-1\\parskip}\n'):
                    # vspace ERT created by convert_breaks() for top lyxline
                    top[n - 1] = 1
                    del_lines[n - 1][1] = ert_end
                    inset_end = ert_end
                    k = ert_end
                else:
                    paragraph_end = 0
                    break
            elif (n > 0 and insets[n - 1] == "vspace" and
                  find_token(document.body, "\\end_inset", k) == k):
                # ignore end of vspace inset
                del_lines[n - 1][1] = k
                inset_end = k
            elif is_nonempty_line(document.body[k]):
                paragraph_end = 0
                break
            k = k + 1

        # Determine space amount for vspace insets
        spaceamount = list()
        arguments = list()
        for k in range(n):
            if insets[k] == "vspace":
                # lines[k] is ['\begin_inset', 'VSpace', <amount>]
                spaceamount.append(lines[k][2])
                arguments.append(' ' + spaceamount[k] + ' ')
            else:
                spaceamount.append('')
                arguments.append(' ')

        # Can we convert to top paragraph parameters?
        before = 0
        if ((n == 3 and insets[0] == "newpage" and insets[1] == "vspace" and
             insets[2] == "lyxline" and top[2]) or
            (n == 2 and
             ((insets[0] == "newpage" and insets[1] == "vspace") or
              (insets[0] == "newpage" and insets[1] == "lyxline" and top[1]) or
              (insets[0] == "vspace"  and insets[1] == "lyxline" and top[1]))) or
            (n == 1 and insets[0] == "lyxline" and top[0])):
            # These insets have been created before a paragraph by
            # convert_breaks()
            before = 1

        # Can we convert to bottom paragraph parameters?
        after = 0
        if ((n == 3 and insets[0] == "lyxline" and not top[0] and
             insets[1] == "vspace" and insets[2] == "newpage") or
            (n == 2 and
             ((insets[0] == "lyxline" and not top[0] and insets[1] == "vspace") or
              (insets[0] == "lyxline" and not top[0] and insets[1] == "newpage") or
              (insets[0] == "vspace"  and insets[1] == "newpage"))) or
            (n == 1 and insets[0] == "lyxline" and not top[0])):
            # These insets have been created after a paragraph by
            # convert_breaks()
            after = 1

        if paragraph_start and paragraph_end:
            # We are in a paragraph of our own.
            # We must not delete this paragraph if it has parameters
            if params == '':
                # First try to merge with the previous paragraph.
                # We try the previous paragraph first because we would
                # otherwise need ERT for two subsequent vspaces.
                prev_par = get_paragraph(document.body, this_par - 1, document.format - 1) + 1
                if prev_par > 0 and not before:
                    prev_params = get_par_params(document.body, prev_par + 1)
                    ert = 0
                    # determine font size
                    prev_size = "normal"
                    k = prev_par + 1
                    while document.body[k][:1] == '\\' and document.body[k].split()[0] in prev_params:
                        k = k + 1
                    while k < this_par:
                        if document.body[k].find("\\size") != -1:
                            prev_size = document.body[k].split()[1]
                            break
                        elif document.body[k].find("\\begin_inset") != -1:
                            # skip insets
                            k = find_end_of_inset(document.body, k)
                        elif is_nonempty_line(document.body[k]):
                            break
                        k = k + 1
                    # We need ERT if the previous paragraph already has one
                    # of the parameters or if a lyxline has another size
                    for k in range(n):
                        if (keywords_bot[insets[k]] in prev_params or
                            (insets[k] == "lyxline" and sizes[k] != prev_size)):
                            ert = 1
                            break
                    if not ert:
                        for k in range(n):
                            document.body.insert(prev_par + 1,
                                             keywords_bot[insets[k]] + arguments[k])
                        # The n inserted lines shifted our paragraph down
                        del document.body[this_par+n:next_par-1+n]
                        i = this_par + n
                        continue
                # Then try next paragraph
                if next_par > 0 and not after:
                    next_params = get_par_params(document.body, next_par + 1)
                    ert = 0
                    # NOTE(review): k is stale here (left over from an
                    # earlier loop), and the size scan below can never run
                    # because next_par + 1 > this_par, so next_size is
                    # always "normal". Looks like this was meant to scan the
                    # next paragraph - confirm the intended bounds before
                    # changing it.
                    while document.body[k][:1] == '\\' and document.body[k].split()[0] in next_params:
                        k = k + 1
                    # determine font size
                    next_size = "normal"
                    k = next_par + 1
                    while k < this_par:
                        if document.body[k].find("\\size") != -1:
                            next_size = document.body[k].split()[1]
                            break
                        elif is_nonempty_line(document.body[k]):
                            break
                        k = k + 1
                    for k in range(n):
                        if (keywords_top[insets[k]] in next_params or
                            (insets[k] == "lyxline" and sizes[k] != next_size)):
                            ert = 1
                            break
                    if not ert:
                        for k in range(n):
                            document.body.insert(next_par + 1,
                                             keywords_top[insets[k]] + arguments[k])
                        del document.body[this_par:next_par-1]
                        i = this_par
                        continue
        elif paragraph_start or paragraph_end:
            # Convert to paragraph formatting if we are at the beginning or end
            # of a paragraph and the resulting paragraph would not be empty
            # The order is important: del and insert invalidate some indices
            if paragraph_start:
                keywords = keywords_top
            else:
                keywords = keywords_bot
            ert = 0
            for k in range(n):
                if keywords[insets[k]] in params:
                    ert = 1
                    break
            if not ert:
                for k in range(n):
                    document.body.insert(this_par + 1,
                                     keywords[insets[k]] + arguments[k])
                    # The inserted line shifts this and all later insets down
                    for j in range(k, n):
                        del_lines[j][0] = del_lines[j][0] + 1
                        del_lines[j][1] = del_lines[j][1] + 1
                    del document.body[del_lines[k][0]:del_lines[k][1]+1]
                    # The deleted lines shift all later insets up
                    deleted = del_lines[k][1] - del_lines[k][0] + 1
                    for j in range(k + 1, n):
                        del_lines[j][0] = del_lines[j][0] - deleted
                        del_lines[j][1] = del_lines[j][1] - deleted
                i = this_par
                continue

        # Convert the first inset to ERT.
        # The others are converted in the next loop runs (if they exist)
        if insets[0] == "vspace":
            # Only the header line is replaced, the existing '\end_inset'
            # line of the vspace inset is left in place.
            document.body[i:i+1] = ['\\begin_inset ERT', 'status Collapsed', '',
                                '\\layout %s' % document.default_layout, '', '\\backslash ']
            i = i + 6
            # A trailing '*' is cut off and remembered in keep
            if spaceamount[0][-1] == '*':
                spaceamount[0] = spaceamount[0][:-1]
                keep = 1
            else:
                keep = 0

            # Replace defskip by the actual value
            if spaceamount[0] == 'defskip':
                spaceamount[0] = defskipamount

            # LaTeX does not know \\smallskip* etc
            if keep:
                if spaceamount[0] == 'smallskip':
                    spaceamount[0] = '\\smallskipamount'
                elif spaceamount[0] == 'medskip':
                    spaceamount[0] = '\\medskipamount'
                elif spaceamount[0] == 'bigskip':
                    spaceamount[0] = '\\bigskipamount'
                elif spaceamount[0] == 'vfill':
                    spaceamount[0] = '\\fill'

            # Finally output the LaTeX code
            if (spaceamount[0] == 'smallskip' or spaceamount[0] == 'medskip' or
                spaceamount[0] == 'bigskip'   or spaceamount[0] == 'vfill'):
                document.body.insert(i, spaceamount[0] + '{}')
            else:
                if keep:
                    document.body.insert(i, 'vspace*{')
                else:
                    document.body.insert(i, 'vspace{')
                i = convert_ertbackslash(document.body, i, spaceamount[0], document.format - 1, document.default_layout)
                document.body[i] = document.body[i] + '}'
            i = i + 1
        elif insets[0] == "lyxline":
            document.body[i] = ''
            latexsize = lyxsize2latexsize(size)
            if latexsize == '':
                document.warning("Could not convert LyX fontsize '%s' to LaTeX font size." % size)
                latexsize = '\\normalsize'
            i = insert_ert(document.body, i, 'Collapsed',
                           '\\lyxline{%s}' % latexsize,
                           document.format - 1, document.default_layout)
            # We use \providecommand so that we don't get an error if native
            # lyxlines are used (LyX writes first its own preamble and then
            # the user specified one)
            add_to_preamble(document,
                            ['% Commands inserted by lyx2lyx for lyxlines',
                             '\\providecommand{\\lyxline}[1]{',
                             '  {#1 \\vspace{1ex} \\hrule width \\columnwidth \\vspace{1ex}}',
                             '}'])
        elif insets[0] == "newpage":
            document.body[i] = ''
            i = insert_ert(document.body, i, 'Collapsed', '\\newpage{}',
                           document.format - 1, document.default_layout)
1470
1471
def convert_len(len, special):
    """ Convert a LyX length into a LaTeX length.
    If special is not 'none', the length becomes its numerical value followed
    by a backslash and special. A length containing one of the relative LyX
    units becomes one hundredth of its value followed by the LaTeX length."""
    latex_units = {"text%":"\\textwidth", "col%":"\\columnwidth",
                   "page%":"\\pagewidth", "line%":"\\linewidth",
                   "theight%":"\\textheight", "pheight%":"\\pageheight"}

    result = len
    if special != 'none':
        # special length: <value>\<special>
        result = '%f\\' % len2value(result) + special

    # Only the first matching LyX unit is replaced
    for lyx_unit, latex_unit in latex_units.items():
        if result.find(lyx_unit) != -1:
            result = '%f' % (len2value(result) / 100) + latex_unit
            break

    return result
1489
1490
def convert_ertlen(body, i, len, special, format, default_layout):
    """ Append a LyX length to body[i] as valid ERT code.
    The length is first converted with convert_len() and the result is then
    written with convert_ertbackslash().
    Return the (maybe incremented) line index i"""
    latex_len = convert_len(len, special)
    return convert_ertbackslash(body, i, latex_len, format, default_layout)
1496
1497
def len2value(len):
    " Return the first number found in len as float, 1.0 if there is none. "
    number = re.search('([+-]?[0-9.]+)', len)
    if number is None:
        # No number means 1.0
        return 1.0
    return float(number.group(1))
1505
1506
def insert_ert(body, i, status, text, format, default_layout):
    """ Insert an ERT inset containing text before body[i].
    The paragraph inside the inset is opened with a layout line for
    format <= 224 and with a begin_layout / end_layout pair otherwise.
    Return the index of the line after the inserted ERT"""

    if format <= 224:
        layout_line = '\\layout %s' % default_layout
    else:
        layout_line = '\\begin_layout %s' % default_layout

    # Inset header, paragraph start and the empty line that receives the text
    body[i:i] = ['\\begin_inset ERT', 'status ' + status, '', layout_line, '']
    text_line = i + 4
    i = convert_ertbackslash(body, text_line, text, format, default_layout) + 1

    if format > 224:
        closing = ['\\end_layout', '', '\\end_inset', '']
    else:
        closing = ['', '\\end_inset', '']
    body[i:i] = closing
    return i + len(closing)
1525
1526
def add_to_preamble(document, text):
    """ Append the lines in text to the preamble unless they are already there.
    Only text[0] is searched for in the preamble!"""

    already_there = find_token(document.preamble, text[0], 0) != -1
    if not already_there:
        document.preamble.extend(text)
1535
1536
def convert_frameless_box(document):
    """Replace every 'Frameless' box inset in the body by older constructs.

    For each inset the box parameters are read (and removed from the body).
    If the box uses only features that a Minipage inset can express, it is
    rewritten as a plain Minipage inset.  Otherwise the box itself is
    emitted as ERT around a Minipage inset whose 'minipage' environment is
    temporarily redefined to do nothing; the helper LaTeX definitions for
    that are added to the preamble.

    Insets without a matching end are reported with a warning and skipped.
    """
    pos = ['t', 'c', 'b']
    inner_pos = ['c', 't', 'b', 's']
    i = 0
    while 1:
        i = find_token(document.body, '\\begin_inset Frameless', i)
        if i == -1:
            return
        j = find_end_of_inset(document.body, i)
        if j == -1:
            document.warning("Malformed LyX document: Missing '\\end_inset'.")
            i = i + 1
            continue
        # Drop the '\begin_inset Frameless' line; the end index moves up by one.
        del document.body[i]
        j = j - 1

        # Gather parameters
        params = {'position':0, 'hor_pos':'c', 'has_inner_box':'1',
                  'inner_pos':1, 'use_parbox':'0', 'width':'100col%',
                  'special':'none', 'height':'1in',
                  'height_special':'totalheight', 'collapsed':'false'}
        for key in params.keys():
            value = get_value(document.body, key, i, j).replace('"', '')
            if value != "":
                if key == 'position':
                    # convert new to old position: 'position "t"' -> 0
                    value = find_token(pos, value, 0)
                    if value != -1:
                        params[key] = value
                elif key == 'inner_pos':
                    # convert inner position
                    value = find_token(inner_pos, value, 0)
                    if value != -1:
                        params[key] = value
                else:
                    params[key] = value
                # The parameter line is consumed; del_token returns the
                # updated end index.
                j = del_token(document.body, key, i, j)
        i = i + 1

        # Convert to minipage or ERT?
        # Note that the inner_position and height parameters of a minipage
        # inset are ignored and not accessible for the user, although they
        # are present in the file format and correctly read in and written.
        # Therefore we convert to ERT if they do not have their LaTeX
        # defaults. These are:
        # - the value of "position" for "inner_pos"
        # - "\totalheight"          for "height"
        if (params['use_parbox'] != '0' or
            params['has_inner_box'] != '1' or
            params['special'] != 'none' or
            params['height_special'] != 'totalheight' or
            len2value(params['height']) != 1.0):

            # Here we know that this box is not supported in file format 224.
            # Therefore we need to convert it to ERT. We can't simply convert
            # the beginning and end of the box to ERT, because the
            # box inset may contain layouts that are different from the
            # surrounding layout. After the conversion the contents of the
            # box inset is on the same level as the surrounding text, and
            # paragraph layouts and align parameters can get mixed up.

            # A possible solution for this problem:
            # Convert the box to a minipage and redefine the minipage
            # environment in ERT so that the original box is simulated.
            # For minipages we could do this in a way that the width and
            # position can still be set from LyX, but this did not work well.
            # This is not possible for parboxes either, so we convert the
            # original box to ERT, put the minipage inset inside the box
            # and redefine the minipage environment to be empty.

            # Commands that are independent of a particular box can go to
            # the preamble.
            # We need to define lyxtolyxrealminipage with 3 optional
            # arguments although LyX 1.3 uses only the first one.
            # Otherwise we will get LaTeX errors if this document is
            # converted to format 225 or above again (LyX 1.4 uses all
            # optional arguments).
            add_to_preamble(document,
                ['% Commands inserted by lyx2lyx for frameless boxes',
                 '% Save the original minipage environment',
                 '\\let\\lyxtolyxrealminipage\\minipage',
                 '\\let\\endlyxtolyxrealminipage\\endminipage',
                 '% Define an empty lyxtolyximinipage environment',
                 '% with 3 optional arguments',
                 '\\newenvironment{lyxtolyxiiiminipage}[4]{}{}',
                 '\\newenvironment{lyxtolyxiiminipage}[2][\\lyxtolyxargi]%',
                 '  {\\begin{lyxtolyxiiiminipage}{\\lyxtolyxargi}{\\lyxtolyxargii}{#1}{#2}}%',
                 '  {\\end{lyxtolyxiiiminipage}}',
                 '\\newenvironment{lyxtolyximinipage}[1][\\totalheight]%',
                 '  {\\def\\lyxtolyxargii{{#1}}\\begin{lyxtolyxiiminipage}}%',
                 '  {\\end{lyxtolyxiiminipage}}',
                 '\\newenvironment{lyxtolyxminipage}[1][c]%',
                 '  {\\def\\lyxtolyxargi{{#1}}\\begin{lyxtolyximinipage}}',
                 '  {\\end{lyxtolyximinipage}}'])

            if params['use_parbox'] != '0':
                ert = '\\parbox'
            else:
                ert = '\\begin{lyxtolyxrealminipage}'

            # convert optional arguments only if not latex default
            if (pos[params['position']] != 'c' or
                inner_pos[params['inner_pos']] != pos[params['position']] or
                params['height_special'] != 'totalheight' or
                len2value(params['height']) != 1.0):
                ert = ert + '[' + pos[params['position']] + ']'
            if (inner_pos[params['inner_pos']] != pos[params['position']] or
                params['height_special'] != 'totalheight' or
                len2value(params['height']) != 1.0):
                ert = ert + '[' + convert_len(params['height'],
                                              params['height_special']) + ']'
            if inner_pos[params['inner_pos']] != pos[params['position']]:
                ert = ert + '[' + inner_pos[params['inner_pos']] + ']'

            ert = ert + '{' + convert_len(params['width'],
                                          params['special']) + '}'

            if params['use_parbox'] != '0':
                ert = ert + '{'
            # Make the minipage written for the inset below a no-op.
            ert = ert + '\\let\\minipage\\lyxtolyxminipage%\n'
            ert = ert + '\\let\\endminipage\\endlyxtolyxminipage%\n'

            old_i = i
            i = insert_ert(document.body, i, 'Collapsed', ert, document.format - 1, document.default_layout)
            j = j + i - old_i - 1

            document.body[i:i] = ['\\begin_inset Minipage',
                              'position %d' % params['position'],
                              'inner_position 1',
                              'height "1in"',
                              'width "' + params['width'] + '"',
                              'collapsed ' + params['collapsed']]
            i = i + 6
            j = j + 6

            # Restore the original minipage environment since we may have
            # minipages inside this box.
            # Start a new paragraph because the following may be nonstandard
            document.body[i:i] = ['\\layout %s' % document.default_layout, '', '']
            i = i + 2
            j = j + 3
            ert = '\\let\\minipage\\lyxtolyxrealminipage%\n'
            # The preamble saves the original end macro under the name
            # \endlyxtolyxrealminipage, so that is the name to restore from.
            ert = ert + '\\let\\endminipage\\endlyxtolyxrealminipage%'
            old_i = i
            i = insert_ert(document.body, i, 'Collapsed', ert, document.format - 1, document.default_layout)
            j = j + i - old_i - 1

            # Redefine the minipage end before the inset end.
            # Start a new paragraph because the previous may be nonstandard
            document.body[j:j] = ['\\layout %s' % document.default_layout, '', '']
            j = j + 2
            ert = '\\let\\endminipage\\endlyxtolyxminipage'
            j = insert_ert(document.body, j, 'Collapsed', ert, document.format - 1, document.default_layout)
            j = j + 1
            document.body.insert(j, '')
            j = j + 1

            # LyX writes '%\n' after each box. Therefore we need to end our
            # ERT with '%\n', too, since this may swallow a following space.
            if params['use_parbox'] != '0':
                ert = '}%\n'
            else:
                ert = '\\end{lyxtolyxrealminipage}%\n'
            j = insert_ert(document.body, j, 'Collapsed', ert, document.format - 1, document.default_layout)

            # We don't need to restore the original minipage after the inset
            # end because the scope of the redefinition is the original box.

        else:

            # Convert to minipage
            document.body[i:i] = ['\\begin_inset Minipage',
                              'position %d' % params['position'],
                              'inner_position %d' % params['inner_pos'],
                              'height "' + params['height'] + '"',
                              'width "' + params['width'] + '"',
                              'collapsed ' + params['collapsed']]
            i = i + 6
1716
1717
def remove_branches(document):
    """Remove branch definitions from the header and Branch insets from
    the body.

    Header: every block from a '\\branch' line up to and including the
    next '\\end_branch' line is deleted (a warning names the branch).
    Body: for every Branch inset the begin and end lines are deleted, as
    are the following 'collapsed' line(s) and the first '\\layout' line,
    so that the inset contents merge into the surrounding text."""
    header = document.header
    start = 0
    while True:
        start = find_token(header, "\\branch", start)
        if start == -1:
            break
        document.warning("Removing branch %s." % header[start].split()[1])
        stop = find_token(header, "\\end_branch", start)
        if stop == -1:
            document.warning("Malformed LyX document: Missing '\\end_branch'.")
            break
        del header[start:stop+1]

    body = document.body
    cur = 0
    while True:
        cur = find_token(body, "\\begin_inset Branch", cur)
        if cur == -1:
            return
        inset_end = find_end_of_inset(body, cur)
        if inset_end == -1:
            document.warning("Malformed LyX document: Missing '\\end_inset'.")
            cur += 1
            continue
        # Remove the inset begin line, then the end line (which has moved
        # up by one because of the first deletion).
        del body[cur]
        del body[inset_end - 1]
        # Walk forward until the first '\layout' line, deleting any
        # 'collapsed' line on the way.  The '\layout' line is expected to
        # be always present.
        seen_collapsed = False
        while True:
            line = body[cur]
            if line.startswith("collapsed"):
                del body[cur]
                seen_collapsed = True
                continue
            if line.startswith("\\layout"):
                if not seen_collapsed:
                    document.warning("Malformed LyX document: Missing 'collapsed'.")
                # Delete this new paragraph, since it would not appear in
                # .tex output. This avoids also empty paragraphs.
                del body[cur]
                break
            cur += 1
1761
1762
def convert_jurabib(document):
    r"""Add '\use_jurabib 0' to the header, directly after the
    '\use_numerical_citations' line.  Warns and does nothing if that
    line is missing."""
    anchor = find_token(document.header, '\\use_numerical_citations', 0)
    if anchor != -1:
        document.header.insert(anchor + 1, '\\use_jurabib 0')
        return
    document.warning("Malformed lyx document: Missing '\\use_numerical_citations'.")
1770
1771
def revert_jurabib(document):
    r"""Remove the '\use_jurabib' header line if its value is 0.

    A non-zero value cannot be reverted; in that case a warning is issued
    and the line is left in place.  A missing line is reported as well."""
    header = document.header
    where = find_token(header, '\\use_jurabib', 0)
    if where == -1:
        document.warning("Malformed lyx document: Missing '\\use_jurabib'.")
        return
    if get_value(header, '\\use_jurabib', 0) == "0":
        del header[where]
        return
    document.warning("Conversion of '\\use_jurabib = 1' not yet implemented.")
    # '\\use_jurabib' is deliberately kept so that people will get
    # warnings by lyx
1783
1784
def convert_bibtopic(document):
    r"""Add '\use_bibtopic 0' to the header, directly after the
    '\use_jurabib' line.  Warns and does nothing if that line is
    missing."""
    anchor = find_token(document.header, '\\use_jurabib', 0)
    if anchor != -1:
        document.header.insert(anchor + 1, '\\use_bibtopic 0')
        return
    document.warning("Malformed lyx document: Missing '\\use_jurabib'.")
1792
1793
def revert_bibtopic(document):
    r"""Remove the '\use_bibtopic' header line if its value is 0.

    A non-zero value cannot be reverted; in that case a warning is issued
    and the line is left in place (same policy as revert_jurabib).  A
    missing line is reported with a warning."""
    i = find_token(document.header, '\\use_bibtopic', 0)
    if i == -1:
        document.warning("Malformed lyx document: Missing '\\use_bibtopic'.")
        return
    if get_value(document.header, '\\use_bibtopic', 0) != "0":
        document.warning("Conversion of '\\use_bibtopic = 1' not yet implemented.")
        # Don't remove '\\use_bibtopic' so that people will get warnings by lyx
        return
    del document.header[i]
1804
1805
def convert_float(document):
    """Add a 'sideways false' line to every Float inset.

    The line is inserted right after the inset's 'wide' line.  If a
    '\\begin_layout' line is reached before any 'wide' line, a warning is
    issued and the inset is left unchanged."""
    body = document.body
    cur = 0
    while True:
        cur = find_token_exact(body, '\\begin_inset Float', cur)
        if cur == -1:
            return
        # Scan the lines after the inset start for 'wide'; '\begin_layout'
        # (expected to be always present) terminates the scan.
        cur += 1
        while True:
            line = body[cur]
            if line.startswith("wide"):
                body.insert(cur + 1, 'sideways false')
                break
            if line.startswith("\\begin_layout"):
                document.warning("Malformed lyx document: Missing 'wide'.")
                break
            cur += 1
        cur += 1
1826
1827
def revert_float(document):
    """Remove the 'sideways' parameter from every Float inset.

    The parameter is only removed when its value is 'false'; for any other
    value a warning is issued and the line is kept.  Insets without a
    matching end are reported and skipped."""
    body = document.body
    cur = 0
    while True:
        cur = find_token_exact(body, '\\begin_inset Float', cur)
        if cur == -1:
            return
        inset_end = find_end_of_inset(body, cur)
        if inset_end == -1:
            document.warning("Malformed lyx document: Missing '\\end_inset'.")
        elif get_value(body, 'sideways', cur, inset_end) != "false":
            # 'sideways' is deliberately kept so that people will get
            # warnings by lyx
            document.warning("Conversion of 'sideways true' not yet implemented.")
        else:
            del_token(body, 'sideways', cur, inset_end)
        cur += 1
1847
1848
def convert_graphics(document):
    """Add an extension to the file names of graphics insets if necessary.

    For every Graphics inset the value of its 'filename' parameter is
    resolved relative to document.dir.  If no file of that name exists but
    one with an added '.ps' or '.eps' suffix does, the suffix is appended
    to the name stored in the body.  When the document is read from
    standard input and the name is relative, the directory is unknown, so
    only a warning is issued.
    """
    i = 0
    while 1:
        i = find_token(document.body, "\\begin_inset Graphics", i)
        if i == -1:
            return

        # The parameter holding the graphics file is called 'filename'.
        j = find_token_exact(document.body, "filename", i)
        if j == -1:
            return
        i = i + 1
        filename = document.body[j].split()[1]
        absname = os.path.normpath(os.path.join(document.dir, filename))
        if document.input == stdin and not os.path.isabs(filename):
            # We don't know the directory and cannot check the document.
            # We could use a heuristic and take the current directory,
            # and we could try to find out if documentname has an extension,
            # but that would be just guesses and could be wrong.
            document.warning("""Warning: Cannot determine whether document
         %s
         needs an extension when reading from standard input.
         You may need to correct the document manually or run
         lyx2lyx again with the .lyx document as commandline argument.""" % filename)
            continue
        # This needs to be the same algorithm as in pre 233 insetgraphics
        if access(absname, F_OK):
            continue
        if access(absname + ".ps", F_OK):
            document.body[j] = document.body[j].replace(filename, filename + ".ps")
            continue
        if access(absname + ".eps", F_OK):
            document.body[j] = document.body[j].replace(filename, filename + ".eps")
1883
1884
def convert_names(document):
    """ Convert in the docbook backend from firstname and surname style
    to charstyles.

    Only documents whose backend is "docbook" are touched.  For each
    'Author' layout that is empty and followed by a nested
    (begin_deeper ... end_deeper) block, the text of the 'FirstName' and
    'Surname' layouts inside that block is collected, the nested block is
    deleted, and two CharStyle insets ('Firstname' and 'Surname') carrying
    the collected text are inserted instead.
    """
    if document.backend != "docbook":
        return

    i = 0

    while 1:
        i = find_token(document.body, "\\begin_layout Author", i)
        if i == -1:
            return

        # Skip empty lines after the layout start.
        i = i + 1
        while document.body[i] == "":
            i = i + 1

        # Only an Author layout that ends immediately and is followed (two
        # lines later) by '\begin_deeper' is converted.
        if document.body[i][:11] != "\\end_layout" or document.body[i+2][:13] != "\\begin_deeper":
            i = i + 1
            continue

        # k: the '\end_layout' line of the Author layout
        k = i
        i = find_end_of( document.body, i+3, "\\begin_deeper","\\end_deeper")
        if i == -1:
            # something is really wrong, abort
            document.warning("Missing \\end_deeper, after style Author.")
            document.warning("Aborted attempt to parse FirstName and Surname.")
            return
        firstname, surname = "", ""

        name = document.body[k:i]

        # Concatenate all lines of the FirstName layout.
        j = find_token(name, "\\begin_layout FirstName", 0)
        if j != -1:
            j = j + 1
            while(name[j] != "\\end_layout"):
                firstname = firstname + name[j]
                j = j + 1

        # Concatenate all lines of the Surname layout.
        j = find_token(name, "\\begin_layout Surname", 0)
        if j != -1:
            j = j + 1
            while(name[j] != "\\end_layout"):
                surname = surname + name[j]
                j = j + 1

        # delete name
        del document.body[k+2:i+1]

        # Insert the two char style insets before the line preceding the
        # Author layout's '\end_layout'.
        document.body[k-1:k-1] = ["", "",
                          "\\begin_inset CharStyle Firstname",
                          "status inlined",
                          "",
                          '\\begin_layout %s' % document.default_layout,
                          "",
                          "%s" % firstname,
                          "\\end_layout",
                          "",
                          "\\end_inset",
                          "",
                          "",
                          "\\begin_inset CharStyle Surname",
                          "status inlined",
                          "",
                          '\\begin_layout %s' % document.default_layout,
                          "",
                          "%s" % surname,
                          "\\end_layout",
                          "",
                          "\\end_inset",
                          ""]
1957
1958
def revert_names(document):
    """ Revert in the docbook backend from firstname and surname char style
    to styles.

    Documents with any other backend are left alone.
    NOTE(review): nothing is done for docbook documents either; the
    function body ends after the backend check.
    """
    is_docbook = document.backend == "docbook"
    if not is_docbook:
        return None
    return None
1965
1966
def convert_cite_engine(document):
    r"""Merge three consecutive header flags into one '\cite_engine' line.

         \use_natbib 1                       \cite_engine <style>
         \use_numerical_citations 0     ->   where <style> is one of
         \use_jurabib 0                      "basic", "natbib_authoryear",
                                             "natbib_numerical", "jurabib"

    The three lines must follow each other directly in this order;
    otherwise a warning is issued and the header is left unchanged."""

    header = document.header

    natbib_at = find_token(header, "\\use_natbib", 0)
    if natbib_at == -1:
        document.warning("Malformed lyx document: Missing '\\use_natbib'.")
        return

    # A result of -1 can never equal natbib_at + 1, so one comparison
    # covers both "missing" and "not directly following".
    numerical_at = find_token(header, "\\use_numerical_citations", 0)
    if numerical_at != natbib_at + 1:
        document.warning("Malformed lyx document: Missing '\\use_numerical_citations'.")
        return

    jurabib_at = find_token(header, "\\use_jurabib", 0)
    if jurabib_at != numerical_at + 1:
        document.warning("Malformed lyx document: Missing '\\use_jurabib'.")
        return

    flags = [int(header[where].split()[1])
             for where in (natbib_at, numerical_at, jurabib_at)]
    use_natbib, use_numerical_citations, use_jurabib = flags

    if use_natbib and use_numerical_citations:
        cite_engine = "natbib_numerical"
    elif use_natbib:
        cite_engine = "natbib_authoryear"
    elif use_jurabib:
        cite_engine = "jurabib"
    else:
        cite_engine = "basic"

    # Replace the three flag lines by the single new one.
    header[natbib_at:jurabib_at+1] = ["\\cite_engine " + cite_engine]
2002
2003
def revert_cite_engine(document):
    r"""Replace the '\cite_engine' header line by the three flag lines
    '\use_natbib', '\use_numerical_citations' and '\use_jurabib'.

    An engine name other than "natbib_numerical", "natbib_authoryear" or
    "jurabib" yields all flags 0.  Warns if '\cite_engine' is missing."""
    header = document.header
    where = find_token(header, "\\cite_engine", 0)
    if where == -1:
        document.warning("Malformed lyx document: Missing '\\cite_engine'.")
        return

    engine = header[where].split()[1]

    # engine -> (use_natbib, use_numerical_citations, use_jurabib)
    flags_by_engine = {
        "natbib_numerical": ('1', '1', '0'),
        "natbib_authoryear": ('1', '0', '0'),
        "jurabib": ('0', '0', '1'),
    }
    use_natbib, use_numerical, use_jurabib = \
        flags_by_engine.get(engine, ('0', '0', '0'))

    header[where:where+1] = ["\\use_natbib " + use_natbib,
                             "\\use_numerical_citations " + use_numerical,
                             "\\use_jurabib " + use_jurabib]
2028
2029
def convert_paperpackage(document):
    r"""Rename the value of the '\paperpackage' header line.

    default -> none, a4 -> none, a4wide -> a4, widemarginsa4 -> a4wide.
    A line without a value gets ' widemarginsa4' appended.  Nothing is
    done if the header has no '\paperpackage' line."""
    where = find_token(document.header, "\\paperpackage", 0)
    if where == -1:
        return

    new_names = {'default':'none','a4':'none', 'a4wide':'a4', 'widemarginsa4':'a4wide'}
    line = document.header[where]
    fields = line.split()
    if len(fields) > 1:
        old_name = fields[1]
        document.header[where] = line.replace(old_name, new_names[old_name])
    else:
        document.header[where] = line + ' widemarginsa4'
2042
2043
def revert_paperpackage(document):
    r"""Rename the value of the '\paperpackage' header line back.

    none -> a4, a4 -> a4wide, a4wide -> widemarginsa4,
    widemarginsa4 -> (empty), default -> default.  A line without a value
    is treated as 'default'.  Nothing is done if the header has no
    '\paperpackage' line."""
    where = find_token(document.header, "\\paperpackage", 0)
    if where == -1:
        return

    old_names = {'none':'a4', 'a4':'a4wide', 'a4wide':'widemarginsa4',
                 'widemarginsa4':'', 'default': 'default'}
    line = document.header[where]
    fields = line.split()
    current = 'default'
    if len(fields) > 1:
        current = fields[1]
    document.header[where] = line.replace(current, old_names[current])
2057
2058
def convert_bullets(document):
    r"""Collapse each multi-line bullet definition in the header into a
    single line.

    A '\bulletLaTeX' entry is joined with its one value line and the
    two lines after the entry are removed; any other '\bullet' entry is
    joined with its three value lines and the four lines after the entry
    are removed.  Value lines are stripped and separated by one space."""
    header = document.header
    cur = 0
    while True:
        cur = find_token(header, "\\bullet", cur)
        if cur == -1:
            return
        if header[cur].startswith('\\bulletLaTeX'):
            value_lines = 1
        else:
            value_lines = 3
        pieces = [header[cur]]
        for offset in range(1, value_lines + 1):
            pieces.append(header[cur + offset].strip())
        # The entry line, its value lines and the line after them are
        # replaced by the joined line.
        header[cur:cur + value_lines + 2] = [' '.join(pieces)]
        cur += 1
2075
2076
def revert_bullets(document):
    r"""Expand each single-line bullet definition in the header into the
    multi-line form terminated by '\end_bullet'.

    A '\bulletLaTeX' line is split in front of its first double quote;
    any other '\bullet' line must consist of exactly five
    whitespace-separated fields.  On a malformed line a warning is issued
    and the conversion stops."""
    header = document.header
    cur = 0
    while True:
        cur = find_token(header, "\\bullet", cur)
        if cur == -1:
            return
        line = header[cur]
        if line.startswith('\\bulletLaTeX'):
            quote_at = line.find('"')
            if quote_at == -1:
                document.warning("Malformed header.")
                return
            # Everything before the separator preceding the quote stays on
            # the first line; the quoted text moves to a tab-indented line.
            header[cur:cur+1] = [line[:quote_at-1],
                                 '\t' + line[quote_at:],
                                 '\\end_bullet']
            cur += 3
        else:
            fields = line.split()
            if len(fields) != 5:
                document.warning("Malformed header.")
                return
            expanded = [fields[0] + ' ' + fields[1]]
            for value in fields[2:]:
                expanded.append('\t' + value)
            expanded.append('\\end_bullet')
            header[cur:cur+1] = expanded
            cur += 5
2104
2105
def add_begin_header(document):
    r"""Insert '\begin_document' and '\begin_header' (in this order)
    right after the '\lyxformat' line of the header."""
    after_format = find_token(document.header, '\\lyxformat', 0) + 1
    document.header[after_format:after_format] = ['\\begin_document',
                                                  '\\begin_header']
2111
2112
def remove_begin_header(document):
    r"""Delete the first '\begin_document' and the first '\begin_header'
    line from the header, if present."""
    for token in ("\\begin_document", "\\begin_header"):
        where = find_token(document.header, token, 0)
        if where != -1:
            del document.header[where]
2121
2122
def add_begin_body(document):
    r"""Wrap the body in '\begin_body' / '\end_body'.

    '\begin_body' and an empty line are put at the very top of the body;
    '\end_body' is inserted in front of the '\end_document' line."""
    document.body[0:0] = ['\\begin_body', '']
    end_document = find_token(document.body, "\\end_document", 0)
    document.body.insert(end_document, '\\end_body')
2129
def remove_begin_body(document):
    r"""Delete the '\begin_body' line (together with an empty line that
    directly follows it) and the '\end_body' line from the body."""
    body = document.body

    start = find_token(body, "\\begin_body", 0)
    if start != -1:
        body.pop(start)
        # The line that moved into this slot is dropped too if it is empty.
        if not body[start]:
            body.pop(start)

    end = find_token(body, "\\end_body", 0)
    if end != -1:
        body.pop(end)
2140
2141
def normalize_papersize(document):
    r"""Lower-case the '\papersize' values 'Default' and 'Custom'.

    Any other value is left as it is; nothing happens if the header has
    no '\papersize' line."""
    where = find_token(document.header, '\\papersize', 0)
    if where == -1:
        return

    replacements = {"Default": '\\papersize default',
                    "Custom": '\\papersize custom'}
    size = document.header[where].split()[1]
    if size in replacements:
        document.header[where] = replacements[size]
2154
2155
def denormalize_papersize(document):
    r"""Turn '\papersize custom' back into '\papersize Custom'.

    Any other value is left as it is; nothing happens if the header has
    no '\papersize' line."""
    where = find_token(document.header, '\\papersize', 0)
    if where != -1 and document.header[where].split()[1] == "custom":
        document.header[where] = '\\papersize Custom'
2165
2166
def strip_end_space(document):
    """Strip surrounding whitespace from every body line that starts with
    a backslash (i.e. a command line).  The body list is modified in
    place; other lines are not touched."""
    lines = document.body
    for idx, line in enumerate(lines):
        if line.startswith('\\'):
            lines[idx] = line.strip()
2172
2173
def use_x_boolean(document):
    r"""Rewrite the values of \use_geometry, \use_bibtopic and
    \tracking_changes in the header from 0/1 to false/true.  Tokens that
    are not present are skipped."""
    bin2bool = {'0': 'false', '1': 'true'}
    for token in ('\\use_geometry', '\\use_bibtopic', '\\tracking_changes'):
        where = find_token(document.header, token, 0)
        if where != -1:
            fields = document.header[where].split()
            document.header[where] = '%s %s' % (fields[0], bin2bool[fields[1]])
2183
2184
def use_x_binary(document):
    r"""Rewrite the values of \use_geometry, \use_bibtopic and
    \tracking_changes in the header from false/true to 0/1.  Tokens that
    are not present are skipped."""
    bool2bin = {'false': '0', 'true': '1'}
    for token in ('\\use_geometry', '\\use_bibtopic', '\\tracking_changes'):
        where = find_token(document.header, token, 0)
        if where != -1:
            fields = document.header[where].split()
            document.header[where] = '%s %s' % (fields[0], bool2bin[fields[1]])
2194
2195
def normalize_paragraph_params(document):
    r"""Put every paragraph parameter on a line of its own.

    After each '\begin_layout' line the following lines are examined as
    long as they are empty or start with one of the known paragraph
    parameters.  Such a line is split in front of the next backslash
    found after its first character, so that a second parameter on the
    same line ends up on the following line."""
    lines = document.body

    known_parameters = ('\\paragraph_spacing', '\\noindent',
                        '\\align', '\\labelwidthstring',
                        "\\start_of_appendix", "\\leftindent")

    cur = 0
    while True:
        cur = find_token(lines, '\\begin_layout', cur)
        if cur == -1:
            return

        cur += 1
        while True:
            line = lines[cur]
            # The first non-empty line that is not a paragraph parameter
            # ends the parameter section of this paragraph.
            if line.strip() and line.split()[0] not in known_parameters:
                break

            split_at = line.find('\\', 1)
            if split_at != -1:
                # The remainder is examined in the next iteration.
                lines[cur:cur+1] = [line[:split_at].strip(), line[split_at:]]

            cur += 1
2221
2222
def convert_output_changes (document):
    r"""Add '\output_changes true' to the header, directly after the
    '\tracking_changes' line.  Warns and does nothing if that line is
    missing."""
    anchor = find_token(document.header, '\\tracking_changes', 0)
    if anchor != -1:
        document.header.insert(anchor + 1, '\\output_changes true')
        return
    document.warning("Malformed lyx document: Missing '\\tracking_changes'.")
2230
2231
def revert_output_changes (document):
    r"""Delete the '\output_changes' line from the header, if there is
    one."""
    where = find_token(document.header, '\\output_changes', 0)
    if where != -1:
        del document.header[where]
2238
2239
def convert_ert_paragraphs(document):
    r""" Convert paragraph breaks and sanitize paragraphs.

    For every ERT inset in the body, four passes are made over the lines
    between the inset start (i) and its end (j):
      1. every '\begin_layout' line is reset to the default layout,
      2. lines starting with a paragraph parameter or font setting are
         deleted,
      3. an empty default-layout paragraph is inserted before every
         paragraph except the first,
      4. every '\newline' is replaced by a paragraph break.
    j is adjusted whenever lines are added or removed so that it keeps
    pointing at the end of the inset.
    """
    forbidden_settings = [
                          # paragraph parameters
                          '\\paragraph_spacing', '\\labelwidthstring',
                          '\\start_of_appendix', '\\noindent',
                          '\\leftindent', '\\align',
                          # font settings
                          '\\family', '\\series', '\\shape', '\\size',
                          '\\emph', '\\numeric', '\\bar', '\\noun',
                          '\\color', '\\lang']
    i = 0
    while 1:
        i = find_token(document.body, '\\begin_inset ERT', i)
        if i == -1:
            return
        j = find_end_of_inset(document.body, i)
        if j == -1:
            document.warning("Malformed lyx document: Missing '\\end_inset'.")
            i = i + 1
            continue

        # convert non-standard paragraphs to standard
        k = i
        while 1:
            k = find_token(document.body, "\\begin_layout", k, j)
            if k == -1:
                break
            document.body[k] = '\\begin_layout %s' % document.default_layout
            k = k + 1

        # remove all paragraph parameters and font settings
        k = i
        while k < j:
            if (document.body[k].strip() and
                document.body[k].split()[0] in forbidden_settings):
                # k is not advanced: the next line has moved into slot k
                del document.body[k]
                j = j - 1
            else:
                k = k + 1

        # insert an empty paragraph before each paragraph but the first
        k = i
        first_pagraph = 1
        while 1:
            k = find_token(document.body, "\\begin_layout", k, j)
            if k == -1:
                break
            if first_pagraph:
                first_pagraph = 0
                k = k + 1
                continue
            document.body[k:k] = ['\\begin_layout %s' % document.default_layout, "",
                              "\\end_layout", ""]
            # skip the four inserted lines and the '\begin_layout' line
            # that was found
            k = k + 5
            j = j + 4

        # convert \\newline to new paragraph
        k = i
        while 1:
            k = find_token(document.body, "\\newline", k, j)
            if k == -1:
                break
            # one line is replaced by three: net growth of two lines
            document.body[k:k+1] = ["\\end_layout", "", '\\begin_layout %s' % document.default_layout]
            k = k + 3
            j = j + 2
            # We need an empty line if document.default_layout == ''
            if document.body[k] != '':
                document.body.insert(k, '')
                k = k + 1
                j = j + 1
        i = i + 1
2312
2313
def revert_ert_paragraphs(document):
    r""" Remove double paragraph breaks.

    For every ERT inset in the body, two passes are made over the lines
    between the inset start (i) and its end (j):
      1. every span from an '\end_layout' line to the next
         '\begin_layout' line is replaced by a single '\newline',
      2. two '\newline' lines that are separated only by empty lines are
         replaced by a paragraph break using the default layout.
    j is adjusted whenever the number of lines changes.
    """
    i = 0
    while 1:
        i = find_token(document.body, '\\begin_inset ERT', i)
        if i == -1:
            return
        j = find_end_of_inset(document.body, i)
        if j == -1:
            document.warning("Malformed lyx document: Missing '\\end_inset'.")
            i = i + 1
            continue

        # replace paragraph breaks with \newline
        k = i
        while 1:
            k = find_token(document.body, "\\end_layout", k, j)
            l = find_token(document.body, "\\begin_layout", k, j)
            if k == -1 or l == -1:
                break
            # lines k..l (l - k + 1 lines) collapse into one line
            document.body[k:l+1] = ["\\newline"]
            j = j - l + k
            k = k + 1

        # replace double \newlines with paragraph breaks
        k = i
        while 1:
            k = find_token(document.body, "\\newline", k, j)
            if k == -1:
                break
            # l: first non-empty line after the \newline at k
            l = k + 1
            while document.body[l] == "":
                l = l + 1
            if document.body[l].strip() and document.body[l].split()[0] == "\\newline":
                # lines k..l (l - k + 1 lines) are replaced by three lines
                document.body[k:l+1] = ["\\end_layout", "",
                                    '\\begin_layout %s' % document.default_layout]
                j = j - l + k + 2
                k = k + 3
                # We need an empty line if document.default_layout == ''
                # NOTE(review): l still holds the index from before the
                # replacement above, while the line following the new
                # '\begin_layout' is now at k -- confirm that l+1 is the
                # intended position here.
                if document.body[l+1] != '':
                    document.body.insert(l+1, '')
                    k = k + 1
                    j = j + 1
            else:
                k = k + 1
        i = i + 1
2360
2361
def convert_french(document):
    """Rename the language ``frenchb`` to ``french``.

    The first matching ``\\language`` line of ``document.header`` and every
    matching ``\\lang`` line of ``document.body`` are rewritten in place.
    """
    header_pattern = re.compile(r'^\\language\s+frenchb')
    pos = find_re(document.header, header_pattern, 0)
    if pos != -1:
        document.header[pos] = "\\language french"

    # Change language in the document body
    body_pattern = re.compile(r'^\\lang\s+frenchb')
    pos = find_re(document.body, body_pattern, 0)
    while pos != -1:
        document.body[pos] = "\\lang french"
        pos = find_re(document.body, body_pattern, pos + 1)
2378
2379
def remove_paperpackage(document):
    """Remove the ``\\paperpackage`` header line.

    The line is always deleted from ``document.header``.  When its value is
    ``a4``, ``a4wide`` or ``widemarginsa4`` the equivalent ``\\usepackage``
    command is put at the very start of ``document.preamble`` and an
    existing ``\\papersize`` header line is reset to ``default``.  Any other
    value, or a line that carries no value at all, is simply dropped.
    """
    i = find_token(document.header, '\\paperpackage', 0)
    if i == -1:
        return

    tokens = document.header[i].split()
    del document.header[i]

    # A line without a value used to raise IndexError; treat it like an
    # unsupported package instead.
    if len(tokens) < 2:
        return

    conv = {"a4": "\\usepackage{a4}", "a4wide": "\\usepackage{a4wide}",
            "widemarginsa4": "\\usepackage[widemargins]{a4}"}
    usepackage = conv.get(tokens[1])
    if usepackage is None:
        return

    # for compatibility we ensure it is the first entry in preamble
    document.preamble[0:0] = [usepackage]

    i = find_token(document.header, '\\papersize', 0)
    if i != -1:
        document.header[i] = "\\papersize default"
2402
2403
def remove_quotestimes(document):
    """Delete the first ``\\quotes_times`` line from ``document.header``, if any."""
    pos = find_token(document.header, '\\quotes_times', 0)
    if pos != -1:
        del document.header[pos]
2410
2411
def convert_sgml_paragraphs(document):
    """Wrap the content of SGML paragraphs in an ERT inset.

    Does nothing unless ``document.backend`` is ``"docbook"``.  Otherwise
    every ``\\begin_layout SGML`` paragraph in ``document.body`` becomes a
    ``Standard`` paragraph whose former content sits inside an inlined ERT
    inset.  A paragraph without a closing ``\\end_layout`` is reported
    through ``document.warning`` and left unchanged.
    """
    if document.backend != "docbook":
        return

    i = 0
    while 1:
        i = find_token(document.body, "\\begin_layout SGML", i)

        if i == -1:
            return

        j = find_token(document.body, "\\end_layout", i)
        if j == -1:
            # Without this check the closing lines would be inserted at the
            # top of the body (index -1 + 1 == 0) and corrupt the document.
            document.warning("Malformed lyx document: Missing '\\end_layout'.")
            i = i + 1
            continue

        document.body[i] = "\\begin_layout Standard"

        # Insert behind the paragraph end first so that index i stays valid.
        document.body[j+1:j+1] = ['','\\end_inset','','','\\end_layout']
        document.body[i+1:i+1] = ['\\begin_inset ERT','status inlined','','\\begin_layout Standard','']

        # Ten lines were added; none of them starts another SGML paragraph.
        i = i + 10
2431
2432 ##
2433 # Conversion hub
2434 #
2435
# Version strings listed for this module: "1.4.0", "1.4.1", "1.4.2" and
# plain "1.4".
supported_versions = ["1.4.%d" % i for i in range(3)] + ["1.4"]
# Forward table: a list of [number, [functions]] entries with the numbers
# ascending from 222 to 245.
# NOTE(review): the number is presumably the file format reached once the
# listed functions have been applied in order -- confirm against the
# lyx2lyx driver that consumes this table.
convert = [[222, [insert_tracking_changes, add_end_header, convert_amsmath]],
           [223, [remove_color_default, convert_spaces, convert_bibtex, remove_insetparent]],
           [224, [convert_external, convert_comment]],
           [225, [add_end_layout, layout2begin_layout, convert_end_document,
                  convert_table_valignment_middle, convert_breaks]],
           [226, [convert_note]],
           [227, [convert_box]],
           [228, [convert_collapsable, convert_ert]],
           [229, [convert_minipage]],
           [230, [convert_jurabib]],
           [231, [convert_float]],
           [232, [convert_bibtopic]],
           [233, [convert_graphics, convert_names]],
           [234, [convert_cite_engine]],
           [235, [convert_paperpackage]],
           [236, [convert_bullets, add_begin_header, add_begin_body,
                  normalize_papersize, strip_end_space]],
           [237, [use_x_boolean]],
           [238, [update_latexaccents]],
           [239, [normalize_paragraph_params]],
           [240, [convert_output_changes]],
           [241, [convert_ert_paragraphs]],
           [242, [convert_french]],
           [243, [remove_paperpackage]],
           [244, [rename_spaces]],
           [245, [remove_quotestimes, convert_sgml_paragraphs]]]

# Backward table: same [number, [functions]] layout, numbers descending
# from 244 to 221.  An empty function list means no function is registered
# for that entry.
# NOTE(review): presumably each number is the format produced by the
# reversion step -- confirm against the lyx2lyx driver.
revert =  [[244, []],
           [243, [revert_space_names]],
           [242, []],
           [241, []],
           [240, [revert_ert_paragraphs]],
           [239, [revert_output_changes]],
           [238, []],
           [237, []],
           [236, [use_x_binary]],
           [235, [denormalize_papersize, remove_begin_body,remove_begin_header,
                  revert_bullets]],
           [234, [revert_paperpackage]],
           [233, [revert_cite_engine]],
           [232, [revert_names]],
           [231, [revert_bibtopic]],
           [230, [revert_float]],
           [229, [revert_jurabib]],
           [228, []],
           [227, [revert_collapsable, revert_ert]],
           [226, [revert_box, revert_external_2]],
           [225, [revert_note]],
           [224, [rm_end_layout, begin_layout2layout, revert_end_document,
                  revert_valignment_middle, revert_breaks, convert_frameless_box,
                  remove_branches]],
           [223, [revert_external_2, revert_comment, revert_eqref]],
           [222, [revert_spaces, revert_bibtex]],
           [221, [revert_amsmath, rm_end_header, rm_tracking_changes, rm_body_changes]]]
2491
2492
if __name__ == "__main__":
    # Running this module directly does nothing.
    pass