1 # This file is part of lyx2lyx
2 # Copyright (C) 2002 Dekel Tsur <dekel@lyx.org>
4 # This program is free software; you can redistribute it and/or
5 # modify it under the terms of the GNU General Public License
6 # as published by the Free Software Foundation; either version 2
7 # of the License, or (at your option) any later version.
9 # This program is distributed in the hope that it will be useful,
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 # GNU General Public License for more details.
14 # You should have received a copy of the GNU General Public License
15 # along with this program; if not, write to the Free Software
16 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
20 from parser_tools import *
# First line of the new-format inset that replaces each old float type.
# NOTE(review): presumably these are the entries of the `floats` table that
# remove_oldfloat() indexes by float type; the line opening the table and the
# remaining lines of every entry are not visible in this view.
23 "footnote": ["\\begin_inset Foot",
25 "margin": ["\\begin_inset Marginal",
27 "fig": ["\\begin_inset Float figure",
30 "tab": ["\\begin_inset Float table",
33 "alg": ["\\begin_inset Float algorithm",
36 "wide-fig": ["\\begin_inset Float figure",
39 "wide-tab": ["\\begin_inset Float table",
# Font attribute tokens; remove_oldfloat() emits a reset for each one that
# occurs in the paragraph before a float.
font_tokens = [
    "\\family", "\\series", "\\shape", "\\size", "\\emph",
    "\\bar", "\\noun", "\\color", "\\lang", "\\latex",
]

# Matches (from the start of a line) any line containing "\pextra_type 3".
pextra_type3_rexp = re.compile(r".*\\pextra_type\s+3")

# Matches a "\pextra_type" token together with its optional parameters.
# Groups: 1 = type, 3 = alignment, 5 = hfill, 7 = start_minipage,
# 9 = width keyword ("\pextra_width" or "\pextra_widthp"), 10 = width value.
# The pieces are joined by implicit literal concatenation inside the
# parentheses, so no backslash continuations or runtime "+" are needed.
pextra_rexp = re.compile(
    r"\\pextra_type\s+(\S+)"
    r"(\s+\\pextra_alignment\s+(\S+))?"
    r"(\s+\\pextra_hfill\s+(\S+))?"
    r"(\s+\\pextra_start_minipage\s+(\S+))?"
    r"(\s+(\\pextra_widthp?)\s+(\S*))?"
)
# A width given with the "\pextra_widthp" keyword (group 9 of pextra_rexp) is
# returned as its value (group 10) with the "col%" unit appended.
# NOTE(review): the def line and the other branches of this function are not
# visible in this view.
56 if mo.group(9) == "\\pextra_widthp":
57 return mo.group(10)+"col%"
64 # Change \begin_float .. \end_float into \begin_inset Float .. \end_inset
#
# lines:    list of body lines, modified in place.
# language: language name written after "\lang" when the font attributes are
#           reset behind the float.
# NOTE(review): the embedded line numbers jump in several places, so the loop
# header and some branches of this function are not visible in this view.
67 def remove_oldfloat(lines, language):
70 i = find_token(lines, "\\begin_float", i)
73 # There are no nested floats, so finding the end of the float is simple
74 j = find_token(lines, "\\end_float", i+1)
# The float type is the second whitespace-separated word of the
# \begin_float line.
76 floattype = string.split(lines[i])[1]
77 if not floats.has_key(floattype):
78 sys.stderr.write("Error! Unknown float type "+floattype+"\n")
81 # skip \end_deeper tokens
83 while check_token(lines[i2], "\\end_deeper"):
# Insert i2-(i+1) "\end_deeper " lines at index j2, the position returned by
# get_next_paragraph() for the line after \end_float.
86 j2 = get_next_paragraph(lines, j+1)
87 lines[j2:j2] = ["\\end_deeper "]*(i2-(i+1))
# Opening lines of the replacement inset, followed by an empty line.
89 new = floats[floattype]+[""]
91 # Check if the float is floatingfigure
92 k = find_re(lines, pextra_type3_rexp, i, j)
94 mo = pextra_rexp.search(lines[k])
# Strip the \pextra_* parameters from the line; the float is then opened as a
# "Wrap figure" inset instead.
96 lines[k] = re.sub(pextra_rexp, "", lines[k])
97 new = ["\\begin_inset Wrap figure",
# Float contents (lines[i2:j]) followed by the closing \end_inset.
102 new = new+lines[i2:j]+["\\end_inset ", ""]
104 # After a float, all font attributes are reset.
105 # We need to output '\foo default' for every attribute foo
106 # whose value is not default before the float.
107 # The check here is not accurate, but it doesn't matter
108 # as extra '\foo default' commands are ignored.
109 # In fact, it might be safer to output '\foo default' for all
111 k = get_paragraph(lines, i)
113 for token in font_tokens:
# Only tokens found between index k and the float start are reset.
114 if find_token(lines, token, k, i) != -1:
116 # This is not necessary, but we want the output to be
117 # as similar as possible to the lyx format
# "\lang" is reset to the document language rather than to "default".
120 if token == "\\lang":
121 new.append(token+" "+language)
123 new.append(token+" default ")
# Matches (from the start of a line) a line containing "\pextra_type 1" or
# "\pextra_type 2".
pextra_type2_rexp = re.compile(
    r".*\\pextra_type\s+[12]"
)

# Matches (from the start of a line) a line containing either "\layout" or
# "\pextra_type 2"; group 1 is whichever of the two was found.
pextra_type2_rexp2 = re.compile(
    r".*(\\layout|\\pextra_type\s+2)"
)
# Convert the old "\pextra_type" paragraph parameters: type 1 becomes a
# "\leftindent" token, type 2 becomes a Minipage inset.
# lines: list of body lines, modified in place.
# NOTE(review): the embedded line numbers jump in several places, so loop
# headers, else-branches and the tails of some list literals are not visible
# in this view.
131 def remove_pextra(lines):
135 i = find_re(lines, pextra_type2_rexp, i)
139 mo = pextra_rexp.search(lines[i])
140 width = get_width(mo)
142 if mo.group(1) == "1":
143 # handle \pextra_type 1 (indented paragraph)
# NOTE(review): the replacement string contains the sequence "\l"; since
# Python 3.7 re.sub() rejects unknown letter escapes in a replacement.
144 lines[i] = re.sub(pextra_rexp, "\\leftindent "+width+" ", lines[i])
148 # handle \pextra_type 2 (minipage)
# Group 3 of pextra_rexp is the \pextra_alignment value.
149 position = mo.group(3)
151 lines[i] = re.sub(pextra_rexp, "", lines[i])
153 start = ["\\begin_inset Minipage",
154 "position " + position,
157 'width "%s"' % width,
# NOTE(review): "\hfill" has a single backslash and relies on "\h" not being
# an escape sequence; the other literals in this file double the backslash.
163 start = ["","\hfill",""]+start
165 start = ["\\layout Standard"] + start
167 j = find_token_backwards(lines,"\\layout", i-1)
170 j = find_tokens(lines, ["\\layout", "\\end_float"], i+1)
175 # collect more paragraphs to the minipage
177 if j == -1 or not check_token(lines[j], "\\layout"):
179 i = find_re(lines, pextra_type2_rexp2, j+1)
182 mo = pextra_rexp.search(lines[i])
# Group 7 of pextra_rexp is the \pextra_start_minipage value.
185 if mo.group(7) == "1":
188 lines[i] = re.sub(pextra_rexp, "", lines[i])
189 j = find_tokens(lines, ["\\layout", "\\end_float"], i+1)
192 end = ["\\end_inset "]
# Replace lines[j0:j] with the inset opening, the collected contents and the
# inset end.
194 lines[j0:j] = start+mid+end
# True when no element of `lines` passes is_nonempty_line.
# NOTE(review): the comparison with [] relies on filter() returning a list
# (Python 2 behaviour). The def line of this function is not visible in this
# view.
198 return filter(is_nonempty_line, lines) == []
# Lines starting with one of these tokens are the ones remove_oldert() tests
# with move_rexp.match() when deciding what to move outside the ERT inset.
200 move_rexp = re.compile(r"\\(family|series|shape|size|emph|numeric|bar|noun|end_deeper)")
# A line that starts with \begin_inset, or that contains \SpecialChar.
201 ert_rexp = re.compile(r"\\begin_inset|.*\\SpecialChar")
# Group 1: text before the last \SpecialChar on the line; group 2: that
# \SpecialChar token and the rest of the line.
202 spchar_rexp = re.compile(r"(.*)(\\SpecialChar.*)")
# Lines that open an ERT inset.
# NOTE(review): the rest of this list literal is not visible in this view.
203 ert_begin = ["\\begin_inset ERT",
# Convert old-style ERT text (text after "\latex latex" or in a
# "\layout LaTeX" paragraph) into ERT insets.
# lines: list of body lines, modified in place.
# NOTE(review): the embedded line numbers jump in many places, so loop
# headers, several branches and the final replacement of the old lines are not
# visible in this view; the comments below cover only the visible statements.
208 def remove_oldert(lines):
211 i = find_tokens(lines, ["\\latex latex", "\\layout LaTeX"], i)
216 # \end_inset is for ert inside a tabular cell. The other tokens
218 j = find_tokens(lines, ["\\latex default", "\\layout", "\\begin_inset", "\\end_inset", "\\end_float", "\\the_end"],
# When the text is ended by an inset, continue behind the end of that inset.
220 if check_token(lines[j], "\\begin_inset"):
221 j = find_end_of_inset(lines, j)+1
# Look at the \begin_deeper lines directly before a closing \layout line.
225 if check_token(lines[j], "\\layout"):
226 while j-1 >= 0 and check_token(lines[j-1], "\\begin_deeper"):
229 # We need to remove insets, special chars & font commands from ERT text
232 if check_token(lines[i], "\\layout LaTeX"):
# NOTE(review): "\layout Standard" has a single backslash and relies on "\l"
# not being an escape sequence.
233 new = ["\layout Standard", "", ""]
234 # We have a problem with classes in which Standard is not the default layout!
# k2 is the next line in [k, j) that starts an inset or contains a
# \SpecialChar.
238 k2 = find_re(lines, ert_rexp, k, j)
239 inset = specialchar = 0
242 elif check_token(lines[k2], "\\begin_inset"):
# Split the line at the \SpecialChar: the text before it stays in lines[k2],
# the token and the rest of the line are kept in specialchar_str.
246 mo = spchar_rexp.match(lines[k2])
247 lines[k2] = mo.group(1)
248 specialchar_str = mo.group(2)
252 for line in lines[k:k2]:
253 # Move some lines outside the ERT inset:
254 if move_rexp.match(line):
256 # This is not necessary, but we want the output to be
257 # as similar as possible to the lyx format
260 elif not check_token(line, "\\latex"):
# Only emit an ERT inset when tmp holds at least one non-empty string.
264 if filter(lambda x:x != "", tmp) != []:
266 # This is not necessary, but we want the output to be
267 # as similar as possible to the lyx format
268 lines[i-1] = lines[i-1]+" "
272 new = new+ert_begin+tmp+["\\end_inset ", ""]
# Copy the whole inset starting at k2 unchanged.
275 k3 = find_end_of_inset(lines, k2)
276 new = new+[""]+lines[k2:k3+1]+[""] # Put an empty line after \end_inset
278 # Skip the empty line after \end_inset
279 if not is_nonempty_line(lines[k]):
284 # This is not necessary, but we want the output to be
285 # as similar as possible to the lyx format
286 lines[i-1] = lines[i-1]+specialchar_str
289 new = new+[specialchar_str, ""]
# Keep the terminating line unless it is a "\latex " token.
295 if not check_token(lines[j], "\\latex "):
296 new = new+[""]+[lines[j]]
300 # Delete remaining "\latex xxx" tokens
303 i = find_token(lines, "\\latex ", i)
308 # ERT insets are a hidden feature of lyx 1.1.6. This might be removed in the future.
# NOTE(review): the loop header and the statements executed in the
# "same layout" case are not visible in this view.
309 def remove_oldertinset(lines):
312 i = find_token(lines, "\\begin_inset ERT", i)
315 j = find_end_of_inset(lines, i)
# k: first \layout line after the inset start; l: index returned by
# get_paragraph() for the inset.
316 k = find_token(lines, "\\layout", i+1)
317 l = get_paragraph(lines, i)
318 if lines[k] == lines[l]: # same layout
# Check whether lines[i] is a "\layout Standard" line whose next non-empty
# line opens an ERT inset, and whether the next non-empty line after the end
# of that inset is a "\layout" line (the result of that last check is
# returned).
# NOTE(review): the statements under the two "if not" tests are not visible
# in this view; presumably they return a false value.
324 def is_ert_paragraph(lines, i):
325 if not check_token(lines[i], "\\layout Standard"):
328 i = find_nonempty_line(lines, i+1)
329 if not check_token(lines[i], "\\begin_inset ERT"):
332 j = find_end_of_inset(lines, i)
333 k = find_nonempty_line(lines, j+1)
334 return check_token(lines[k], "\\layout")
# Collect the contents of consecutive ERT paragraphs.
# NOTE(review): the loop header, the initialisation of `text` and the code
# that uses the collected text are not visible in this view.
336 def combine_ert(lines):
339 i = find_token(lines, "\\begin_inset ERT", i)
342 j = get_paragraph(lines, i)
# For as long as j starts an ERT paragraph: append the lines from the next
# \layout line after j up to (not including) the following \end_inset, then
# move j to the next \layout line.
345 while is_ert_paragraph(lines, j):
348 i2 = find_token(lines, "\\layout", j+1)
349 k = find_token(lines, "\\end_inset", i2+1)
350 text = text+lines[i2:k]
351 j = find_token(lines, "\\layout", k+1)
356 j = find_token(lines, "\\layout", i+1)
# Unit suffixes, indexed by the numeric unit code stored in the old format.
oldunits = ["pt", "cm", "in", "text%", "col%"]


def get_length(lines, name, start, end):
    """Return the length stored on the *name* line as "<value><unit>".

    The line is located with find_token(lines, name, start, end).  Its
    second word is a numeric unit code indexing oldunits and its third word
    is the value.  Returns "" when find_token reports no match (-1), which
    is the value callers compare against for "not set".
    """
    i = find_token(lines, name, start, end)
    if i == -1:
        # Without this guard lines[-1] would be parsed instead.
        return ""
    fields = lines[i].split()
    return fields[2] + oldunits[int(fields[1])]
def write_attribute(x, token, value):
    """Append the attribute line "<TAB><token> <value>" to the list *x*.

    Nothing is appended when *value* is the empty string, so that unset
    attributes do not produce a line with a name but no value.
    """
    if value != "":
        x.append("\t" + token + " " + value)
# Replace old "\begin_inset Figure" insets by "Graphics FormatVersion 1"
# insets.
# lines: list of body lines.
# NOTE(review): the embedded line numbers jump in several places, so the loop
# header, several branches and the final replacement of the old inset are not
# visible in this view.
374 def remove_figinset(lines):
377 i = find_token(lines, "\\begin_inset Figure", i)
380 j = find_end_of_inset(lines, i)
# Words 3 and 4 of the \begin_inset line are taken as on-screen width and
# height, with "pt" appended.
# NOTE(review): the test only requires more than two words although indexes
# 3 and 4 are read.
382 if ( len(string.split(lines[i])) > 2 ):
383 lyxwidth = string.split(lines[i])[3]+"pt"
384 lyxheight = string.split(lines[i])[4]+"pt"
# Read the old attributes from the lines between the inset start and its end.
389 filename = get_value(lines, "file", i+1, j)
391 width = get_length(lines, "width", i+1, j)
392 # what does width=5 mean ?
393 height = get_length(lines, "height", i+1, j)
394 rotateAngle = get_value(lines, "angle", i+1, j)
# NOTE(review): the statements guarded by this test are not visible in this
# view; `size_type`, written further below, is presumably set here.
395 if width == "" and height == "":
400 flags = get_value(lines, "flags", i+1, j)
403 display = "monochrome"
# A non-empty subcaption is wrapped in double quotes.
409 subcaptionText = get_value(lines, "subcaption", i+1, j)
410 if subcaptionText != "":
411 subcaptionText = '"'+subcaptionText+'"'
412 k = find_token(lines, "subfigure", i+1,j)
# Build the lines of the new Graphics inset.
418 new = ["\\begin_inset Graphics FormatVersion 1"]
419 write_attribute(new, "filename", filename)
420 write_attribute(new, "display", display)
422 new.append("\tsubcaption")
423 write_attribute(new, "subcaptionText", subcaptionText)
424 write_attribute(new, "size_type", size_type)
425 write_attribute(new, "width", width)
426 write_attribute(new, "height", height)
427 if rotateAngle != "":
428 new.append("\trotate")
429 write_attribute(new, "rotateAngle", rotateAngle)
430 write_attribute(new, "rotateOrigin", "leftBaseline")
431 write_attribute(new, "lyxsize_type", "1")
432 write_attribute(new, "lyxwidth", lyxwidth)
433 write_attribute(new, "lyxheight", lyxheight)
# NOTE(review): "\end_inset" has a single backslash and relies on "\e" not
# being an escape sequence; the other literals double the backslash.
434 new = new + ["\end_inset"]
# An attribute, including its leading space, whose value is "false", "0" or
# empty.
attr_re = re.compile(
    r' \w*="(false|0|)"'
)

# A line beginning with a <features>, <column>, <row> or <cell> tag.
line_re = re.compile(
    r'<(features|column|row|cell)'
)
# Update the lines of every Tabular inset: bump the format version, give
# empty column widths an explicit value and drop attributes with default
# values.
# lines: list of body lines, modified in place.
# NOTE(review): the loop header and some statements are not visible in this
# view.
440 def update_tabular(lines):
443 i = find_token(lines, '\\begin_inset Tabular', i)
447 for k in get_tabular_lines(lines, i):
448 if check_token(lines[k], "<lyxtabular"):
449 lines[k] = string.replace(lines[k], 'version="2"', 'version="3"')
450 elif check_token(lines[k], "<column"):
451 lines[k] = string.replace(lines[k], 'width=""', 'width="0pt"')
# On <features>, <column>, <row> and <cell> lines, remove every attribute
# whose value is "false", "0" or empty.
453 if line_re.match(lines[k]):
454 lines[k] = re.sub(attr_re, "", lines[k])
458 # Figure insets are a hidden feature of lyx 1.1.6. This might be removed in the future.
# Insert a "wide false" line in front of the "collapsed" line that follows a
# "\begin_inset Float " line.
# lines: list of body lines, modified in place.
# NOTE(review): the loop header and the not-found handling are not visible in
# this view.
459 def fix_oldfloatinset(lines):
462 i = find_token(lines, "\\begin_inset Float ", i)
465 j = find_token(lines, "collapsed", i)
467 lines[j:j] = ["wide false"]
# Turn "\begin_inset LatexCommand \listof..." lines into
# "\begin_inset FloatList <type>" lines.
# lines: list of body lines, modified in place.
# NOTE(review): the loop header and the not-found handling are not visible in
# this view.
470 def change_listof(lines):
473 i = find_token(lines, "\\begin_inset LatexCommand \\listof", i)
# The float type is the word following "listof" without its last character
# (e.g. "figures" gives "figure").  Note that the local name `type` shadows
# the builtin.
476 type = re.search(r"listof(\w*)", lines[i]).group(1)[:-1]
477 lines[i] = "\\begin_inset FloatList "+type
def change_preamble(lines):
    """Add the natbib settings directly after the use_amsmath header line.

    *lines* (the header lines) is modified in place.  Nothing is changed
    when find_token reports no use_amsmath line (-1).
    """
    i = find_token(lines, "\\use_amsmath", 0)
    if i == -1:
        # Without this guard the two lines would be inserted at index 0.
        return
    # Both backslashes are doubled: a single "\u" is rejected as a truncated
    # unicode escape by Python 3, and doubling matches every other token
    # literal in this file.  The resulting strings are unchanged on Python 2.
    lines[i+1:i+1] = ["\\use_natbib 0",
                      "\\use_numerical_citations 0"]
# Entry point of the conversion: run the individual conversion steps.
# header: list of header lines, modified in place by change_preamble().
# body:   list of body lines, passed to the body conversion steps.
# NOTE(review): the embedded line numbers show that further calls between the
# visible ones are missing from this view.
487 def convert(header, body):
# The document language is needed by remove_oldfloat() for the "\lang" reset.
488 language = get_value(header, "\\language", 0)
492 change_preamble(header)
494 fix_oldfloatinset(body)
497 remove_oldfloat(body, language)
498 remove_figinset(body)
499 remove_oldertinset(body)
503 if __name__ == "__main__":