lib/lyx2lyx/lyxconvert_218.py

   1 # This file is part of lyx2lyx
   2 # Copyright (C) 2002 Dekel Tsur <dekel@lyx.org>
   3 #
   4 # This program is free software; you can redistribute it and/or
   5 # modify it under the terms of the GNU General Public License
   6 # as published by the Free Software Foundation; either version 2
   7 # of the License, or (at your option) any later version.
   8 #
   9 # This program is distributed in the hope that it will be useful,
  10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
  11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  12 # GNU General Public License for more details.
  13 #
  14 # You should have received a copy of the GNU General Public License
  15 # along with this program; if not, write to the Free Software
  16 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
  17
  18
  19 import sys,string,re
  20 from parser_tools import *
  21
  22 floats = {
  23     "footnote": ["\\begin_inset Foot",
  24                  "collapsed true"],
  25     "margin":   ["\\begin_inset Marginal",
  26                  "collapsed true"],
  27     "fig":      ["\\begin_inset Float figure",
  28                  "placement htbp",
  29                  "wide false",
  30                  "collapsed false"],
  31     "tab":      ["\\begin_inset Float table",
  32                  "placement htbp",
  33                  "wide false",
  34                  "collapsed false"],
  35     "alg":      ["\\begin_inset Float algorithm",
  36                  "placement htbp",
  37                  "wide false",
  38                  "collapsed false"],
  39     "wide-fig": ["\\begin_inset Float figure",
  40                  "placement htbp",
  41                  "wide true",
  42                  "collapsed false"],
  43     "wide-tab": ["\\begin_inset Float table",
  44                  "placement htbp",
  45                  "wide true",
  46                  "collapsed false"]
  47 }
  48
  49 font_tokens = ["\\family", "\\series", "\\shape", "\\size", "\\emph",
  50                "\\bar", "\\noun", "\\color", "\\lang", "\\latex"]
  51
  52 #
  53 # Change \begin_float .. \end_float into \begin_inset Float .. \end_inset
  54 #
  55
  56 def remove_oldfloat(lines, language):
  57     i = 0
  58     while 1:
  59         i = find_token(lines, "\\begin_float", i)
  60         if i == -1:
  61             break
  62         # There are no nested floats, so finding the end of the float is simple
  63         j = find_token(lines, "\\end_float", i+1)
  64
  65         floattype = string.split(lines[i])[1]
  66         if not floats.has_key(floattype):
  67             sys.stderr.write("Error! Unknown float type "+floattype+"\n")
  68             floattype = "fig"
  69
  70         # skip \end_deeper tokens
  71         i2 = i+1
  72         while check_token(lines[i2], "\\end_deeper"):
  73             i2 = i2+1
  74         if i2 > i+1:
  75             j2 = get_next_paragraph(lines, j+1)
  76             lines[j2:j2] = ["\\end_deeper "]*(i2-(i+1))
  77
  78         new = floats[floattype]+[""]
  79         new = new+lines[i2:j]+["\\end_inset ", ""]
  80
  81         # After a float, all font attribute are reseted.
  82         # We need to output '\foo default' for every attribute foo
  83         # whose value is not default before the float.
  84         # The check here is not accurate, but it doesn't matter
  85         # as extra '\foo default' commands are ignored.
  86         # In fact, it might be safer to output '\foo default' for all
  87         # font attributes.
  88         k = get_paragraph(lines, i)
  89         flag = 0
  90         for token in font_tokens:
  91             if find_token(lines, token, k, i) != -1:
  92                 if not flag:
  93                     # This is not necessary, but we want the output to be
  94                     # as similar as posible to the lyx format
  95                     flag = 1
  96                     new.append("")
  97                 if token == "\\lang":
  98                     new.append(token+" "+language)
  99                 else:
 100                     new.append(token+" default ")
 101
 102         lines[i:j+1] = new
 103         i = i+1
 104
 105 def remove_oldminipage(lines):
 106     i = 0
 107     flag = 0
 108     while 1:
 109         i = find_token(lines, "\\pextra_type 2", i)
 110         if i == -1:
 111             break
 112         hfill = 0
 113         line = string.split(lines[i])
 114         if line[4] == "\\pextra_hfill":
 115             hfill = 1
 116             line[4:6] = []
 117         if line[4] == "\\pextra_start_minipage":
 118             # We just ignore this
 119             line[4:6] = []
 120
 121         position = line[3]
 122         width = line[5]
 123         if line[4] == "\\pextra_widthp":
 124             width = line[5]+"col%"
 125
 126
 127         start = ["\\begin_inset Minipage",
 128                  "position " + position,
 129                  "inner_position 0",
 130                  'height "0pt"',
 131                  'width "%s"' % width,
 132                  "collapsed false"
 133                  ]
 134         if flag:
 135             flag = 0
 136             if hfill:
 137                 start = ["","\hfill",""]+start
 138         else:
 139             start = ["\\layout Standard"] + start
 140
 141         j = find_token_backwards(lines,"\\layout", i-1)
 142         j0 = j
 143         mid = lines[j:i]
 144
 145         j = find_tokens(lines, ["\\layout", "\\end_float"], i+1)
 146         # j can be -1, but this is still ok
 147         mid = mid+lines[i+1:j]
 148
 149         count = 0
 150         while 1:
 151             # collect more paragraphs to the minipage
 152             count = count+1
 153             if j == -1 or not check_token(lines[j], "\\layout"):
 154                 break
 155             i = find_tokens(lines, ["\\layout", "\\pextra_type"], j+1)
 156             if i == -1 or not check_token(lines[i], "\\pextra_type"):
 157                 break
 158             line = string.split(lines[i])
 159             if line[4] == "\\pextra_hfill":
 160                 line[4:6] = []
 161             if line[4] == "\\pextra_start_minipage" and line[5] == "1":
 162                 flag = 1
 163                 break
 164             j = find_token_backwards(lines,"\\layout", i-1)
 165             mid = mid+lines[j:i]
 166             j = find_tokens(lines, ["\\layout", "\\end_float"], i+1)
 167             mid = mid+lines[i+1:j]
 168
 169         end = ["\\end_inset "]
 170
 171         lines[j0:j] = start+mid+end
 172         i = i+1
 173
 174 def is_empty(lines):
 175     return filter(is_nonempty_line, lines) == []
 176
 177 font_rexp =  re.compile(r"\\(family|series|shape|size|emph|numeric|bar|noun)")
 178 ert_rexp = re.compile(r"\\begin_inset|.*\\SpecialChar")
 179 spchar_rexp = re.compile(r"(.*)(\\SpecialChar.*)")
 180 ert_begin = ["\\begin_inset ERT",
 181              "status Collapsed",
 182              "",
 183              "\\layout Standard"]
 184
 185 def remove_oldert(lines):
 186     i = 0
 187     while 1:
 188         i = find_tokens(lines, ["\\latex latex", "\\layout LaTeX"], i)
 189         if i == -1:
 190             break
 191         j = i+1
 192         while 1:
 193             j = find_tokens(lines, ["\\latex default", "\\begin_inset", "\\layout", "\\end_float", "\\the_end"],
 194                             j)
 195             if check_token(lines[j], "\\begin_inset"):
 196                 j = find_end_of_inset(lines, j)
 197             else:
 198                 break
 199
 200         if check_token(lines[j], "\\layout"):
 201             while j-1 >= 0 and check_token(lines[j-1], "\\begin_deeper"):
 202                 j = j-1
 203
 204         # We need to remove insets, special chars & font commands from ERT text
 205         new = []
 206         new2 = []
 207         if check_token(lines[i], "\\layout LaTeX"):
 208             new = ["\layout Standard", "", ""]
 209             # We have a problem with classes in which Standard is not the default layout!
 210
 211         k = i+1
 212         while 1:
 213             k2 = find_re(lines, ert_rexp, k, j)
 214             inset = specialchar = 0
 215             if k2 == -1:
 216                 k2 = j
 217             elif check_token(lines[k2], "\\begin_inset"):
 218                 inset = 1
 219             else:
 220                 specialchar = 1
 221                 mo = spchar_rexp.match(lines[k2])
 222                 lines[k2] = mo.group(1)
 223                 specialchar_str = mo.group(2)
 224                 k2 = k2+1
 225
 226             tmp = []
 227             for line in lines[k:k2]:
 228                 if font_rexp.match(line):
 229                     if new2 == []:
 230                         # This is not necessary, but we want the output to be
 231                         # as similar as posible to the lyx format
 232                         new2 = [""]
 233                     new2.append(line)
 234                 elif not check_token(line, "\\latex"):
 235                     tmp.append(line)
 236
 237             if is_empty(tmp):
 238                 if filter(lambda x:x != "", tmp) != []:
 239                     if new == []:
 240                         # This is not necessary, but we want the output to be
 241                         # as similar as posible to the lyx format
 242                         lines[i-1] = lines[i-1]+" "
 243                     else:
 244                         new = new+[" "]
 245             else:
 246                 new = new+ert_begin+tmp+["\\end_inset ", ""]
 247
 248             if inset:
 249                 k3 = find_end_of_inset(lines, k2)
 250                 new = new+[""]+lines[k2:k3+1]+[""] # Put an empty line after \end_inset
 251                 k = k3+1
 252                 # Skip the empty line after \end_inset
 253                 if not is_nonempty_line(lines[k]):
 254                     k = k+1
 255                     new.append("")
 256             elif specialchar:
 257                 if new == []:
 258                     # This is not necessary, but we want the output to be
 259                     # as similar as posible to the lyx format
 260                     lines[i-1] = lines[i-1]+specialchar_str
 261                     new = [""]
 262                 else:
 263                     new = new+[specialchar_str, ""]
 264                 k = k2
 265             else:
 266                 break
 267
 268         new = new+new2
 269         if not check_token(lines[j], "\\latex default"):
 270             new = new+[""]+[lines[j]]
 271         lines[i:j+1] = new
 272         i = i+1
 273
 274 def remove_oldertinset(lines):
 275     i = 0
 276     while 1:
 277         i = find_token(lines, "\\begin_inset ERT", i)
 278         if i == -1:
 279             break
 280         j = find_end_of_inset(lines, i)
 281         k = find_token(lines, "\\layout", i+1)
 282         l = get_paragraph(lines, i)
 283         if lines[k] == lines[l]: # same layout
 284             k = k+1
 285         new = lines[k:j]
 286         lines[i:j+1] = new
 287         i = i+1
 288
 289 def is_ert_paragraph(lines, i):
 290     i = find_nonempty_line(lines, i+1)
 291     if not check_token(lines[i], "\\begin_inset ERT"):
 292         return 0
 293     j = find_end_of_inset(lines, i)
 294     k = find_nonempty_line(lines, j+1)
 295     return check_token(lines[k], "\\layout")
 296
 297 def combine_ert(lines):
 298     i = 0
 299     while 1:
 300         i = find_token(lines, "\\begin_inset ERT", i)
 301         if i == -1:
 302             break
 303         j = find_token_backwards(lines,"\\layout", i-1)
 304         count = 0
 305         text = []
 306         while is_ert_paragraph(lines, j):
 307
 308             count = count+1
 309             i2 = find_token(lines, "\\layout", j+1)
 310             k = find_token(lines, "\\end_inset", i2+1)
 311             text = text+lines[i2:k]
 312             j = find_token(lines, "\\layout", k+1)
 313             if j == -1:
 314                 break
 315
 316         if count >= 2:
 317             j = find_token(lines, "\\layout", i+1)
 318             lines[j:k] = text
 319
 320         i = i+1
 321
 322 oldunits = ["pt", "cm", "in", "text%", "col%"]
 323
 324 def get_length(lines, name, start, end):
 325     i = find_token(lines, name, start, end)
 326     if i == -1:
 327         return ""
 328     x = string.split(lines[i])
 329     return x[2]+oldunits[int(x[1])]
 330
 331 def append(x, token, value):
 332     if value != "":
 333         x.append("\t"+token+" "+value)
 334
 335 def remove_figinset(lines):
 336     i = 0
 337     while 1:
 338         i = find_token(lines, "\\begin_inset Figure", i)
 339         if i == -1:
 340             break
 341         j = find_end_of_inset(lines, i)
 342
 343         lyxwidth = string.split(lines[i])[3]+"pt"
 344         lyxheight = string.split(lines[i])[4]+"pt"
 345
 346         filename = get_value(lines, "file", i+1, j)
 347
 348         width = get_length(lines, "width", i+1, j)
 349         # what does width=5 mean ?
 350         height = get_length(lines, "height", i+1, j)
 351         rotateAngle = get_value(lines, "angle", i+1, j)
 352         if width == "" and height == "":
 353             size_type = "0"
 354         else:
 355             size_type = "1"
 356
 357         flags = get_value(lines, "flags", i+1, j)
 358         x = int(flags)%4
 359         if x == 1:
 360             display = "monochrome"
 361         elif x == 2:
 362             display = "gray"
 363         else:
 364             display = "color"
 365
 366         subcaptionText = get_value(lines, "subcaption", i+1, j)
 367         if subcaptionText != "":
 368             subcaptionText = '"'+subcaptionText+'"'
 369         k = find_token(lines, "subfigure", i+1,j)
 370         if k == -1:
 371             subcaption = 0
 372         else:
 373             subcaption = 1
 374
 375         new = ["\\begin_inset Graphics FormatVersion 1"]
 376         append(new, "filename", filename)
 377         append(new, "display", display)
 378         if subcaption:
 379             new.append("\tsubcaption")
 380         append(new, "subcaptionText", subcaptionText)
 381         append(new, "size_type", size_type)
 382         append(new, "width", width)
 383         append(new, "height", height)
 384         if rotateAngle != "":
 385             new.append("\trotate")
 386             append(new, "rotateAngle", rotateAngle)
 387         new.append("\trotateOrigin center")
 388         new.append("\tlyxsize_type 1")
 389         append(new, "lyxwidth", lyxwidth)
 390         append(new, "lyxheight", lyxheight)
 391         new = new + ["\end_inset"]
 392         lines[i:j+1] = new
 393
 394 def change_preamble(lines):
 395     i = find_token(lines, "\\use_amsmath", 0)
 396     if i == -1:
 397         return
 398     lines[i+1:i+1] = ["\\use_natbib 0",
 399                       "\use_numerical_citations 0"]
 400
 401 def convert(header, body):
 402     language = get_value(header, "\\language", 0)
 403     if language == "":
 404         language = "english"
 405
 406     change_preamble(header)
 407     remove_oldminipage(body)
 408     remove_oldfloat(body, language)
 409     remove_figinset(body)
 410     remove_oldertinset(body)
 411     remove_oldert(body)
 412     combine_ert(body)
 413
# Running this file directly does nothing.
if __name__ == "__main__":
    pass