1 # This file is part of lyx2lyx
2 # -*- coding: iso-8859-1 -*-
3 # Copyright (C) 2002 Dekel Tsur <dekel@lyx.org>
4 # Copyright (C) 2004 José Matos <jamatos@lyx.org>
6 # This program is free software; you can redistribute it and/or
7 # modify it under the terms of the GNU General Public License
8 # as published by the Free Software Foundation; either version 2
9 # of the License, or (at your option) any later version.
11 # This program is distributed in the hope that it will be useful,
12 # but WITHOUT ANY WARRANTY; without even the implied warranty of
13 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 # GNU General Public License for more details.
16 # You should have received a copy of the GNU General Public License
17 # along with this program; if not, write to the Free Software
18 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
23 from parser_tools import find_token, find_token_backwards, get_next_paragraph,\
24 find_tokens, find_end_of_inset, find_re, \
25 is_nonempty_line, get_paragraph, find_nonempty_line, \
26 get_value, get_tabular_lines, check_token
# NOTE(review): these look like the entries of the `floats` table that
# remove_oldfloat indexes with the word following \begin_float; each key maps
# to a list beginning with the \begin_inset line shown.  The assignment line
# itself is not visible here -- confirm.
29 "footnote": ["\\begin_inset Foot",
31 "margin": ["\\begin_inset Marginal",
33 "fig": ["\\begin_inset Float figure",
36 "tab": ["\\begin_inset Float table",
39 "alg": ["\\begin_inset Float algorithm",
42 "wide-fig": ["\\begin_inset Float figure",
45 "wide-tab": ["\\begin_inset Float table",
# Font-attribute tokens.  remove_oldfloat searches for each of these between
# the index returned by get_paragraph and the float, and appends a reset line
# to the converted float for every token it finds.
50 font_tokens = ["\\family", "\\series", "\\shape", "\\size", "\\emph",
51 "\\bar", "\\noun", "\\color", "\\lang", "\\latex"]
# Matches any line that carries "\pextra_type 3"; remove_oldfloat uses it to
# decide whether a float becomes a "Wrap figure" inset.
53 pextra_type3_rexp = re.compile(r".*\\pextra_type\s+3")
# Parses a \pextra_type setting plus its optional trailing settings.
# Capture groups: 1 = type, 3 = alignment value, 5 = hfill value,
# 7 = start_minipage value, 9 = width keyword (\pextra_width or
# \pextra_widthp), 10 = width value (may be empty).
54 pextra_rexp = re.compile(r"\\pextra_type\s+(\S+)"+\
55 r"(\s+\\pextra_alignment\s+(\S+))?"+\
56 r"(\s+\\pextra_hfill\s+(\S+))?"+\
57 r"(\s+\\pextra_start_minipage\s+(\S+))?"+\
58 r"(\s+(\\pextra_widthp?)\s+(\S*))?")
# NOTE(review): the def line enclosing these two statements is not visible
# here; remove_oldfloat and remove_pextra call get_width(mo) with a
# pextra_rexp match, so this is presumably part of that helper -- confirm.
# Group 9 of pextra_rexp is the width keyword and group 10 its value: a
# \pextra_widthp value gets the "col%" unit appended.
63 if mo.group(9) == "\\pextra_widthp":
64 return mo.group(10)+"col%"
72 # Change \begin_float .. \end_float into \begin_inset Float .. \end_inset
#
# lines -- list of document lines; it is modified in place.
# opt   -- object providing warning(msg), called for a float type that is
#          not a key of `floats`, and a `language` attribute, used when
#          resetting \lang after the float.
74 def remove_oldfloat(lines, opt):
77 i = find_token(lines, "\\begin_float", i)
80 # There are no nested floats, so finding the end of the float is simple
81 j = find_token(lines, "\\end_float", i+1)
# The float type is the second whitespace-separated word of the
# \begin_float line.
83 floattype = string.split(lines[i])[1]
84 if not floats.has_key(floattype):
85 opt.warning("Error! Unknown float type " + floattype)
88 # skip \end_deeper tokens
90 while check_token(lines[i2], "\\end_deeper"):
# Insert one "\end_deeper " per skipped line at the index that
# get_next_paragraph returns for the position after \end_float.
93 j2 = get_next_paragraph(lines, j+1)
94 lines[j2:j2] = ["\\end_deeper "]*(i2-(i+1))
# Default replacement header: the table entry for this float type followed
# by an empty line.
96 new = floats[floattype]+[""]
98 # Check if the float is floatingfigure
99 k = find_re(lines, pextra_type3_rexp, i, j)
# Take the width from the \pextra settings on line k, strip those settings
# from the line, and start a "Wrap figure" inset header instead.
101 mo = pextra_rexp.search(lines[k])
102 width = get_width(mo)
103 lines[k] = re.sub(pextra_rexp, "", lines[k])
104 new = ["\\begin_inset Wrap figure",
105 'width "%s"' % width,
# Float content (starting after any skipped \end_deeper lines) followed by
# the inset terminator and an empty line.
109 new = new+lines[i2:j]+["\\end_inset ", ""]
111 # After a float, all font attributes are reset.
112 # We need to output '\foo default' for every attribute foo
113 # whose value is not default before the float.
114 # The check here is not accurate, but it doesn't matter
115 # as extra '\foo default' commands are ignored.
116 # In fact, it might be safer to output '\foo default' for all
118 k = get_paragraph(lines, i)
120 for token in font_tokens:
121 if find_token(lines, token, k, i) != -1:
123 # This is not necessary, but we want the output to be
124 # as similar as possible to the lyx format
# \lang is reset to opt.language rather than to "default".
127 if token == "\\lang":
128 new.append(token+" "+ opt.language)
130 new.append(token+" default ")
# Matches a line carrying \pextra_type 1 or 2 (despite the "type2" name, the
# character class is [12]).
136 pextra_type2_rexp = re.compile(r".*\\pextra_type\s+[12]")
# Matches a line containing either \layout or \pextra_type 2; used below when
# looking for further paragraphs of the same minipage.
137 pextra_type2_rexp2 = re.compile(r".*(\\layout|\\pextra_type\s+2)")
# Rewrite old \pextra_type 1 / 2 paragraph settings found in `lines`
# (modified in place): type 1 becomes a \leftindent setting, type 2 becomes a
# Minipage inset.
139 def remove_pextra(lines):
143 i = find_re(lines, pextra_type2_rexp, i)
147 mo = pextra_rexp.search(lines[i])
148 width = get_width(mo)
150 if mo.group(1) == "1":
151 # handle \pextra_type 1 (indented paragraph)
# NOTE(review): the replacement template begins with a literal "\l".
# Python 2's re.sub leaves unknown escapes alone; newer Python 3 releases
# reject them -- confirm before porting.
152 lines[i] = re.sub(pextra_rexp, "\\leftindent "+width+" ", lines[i])
156 # handle \pextra_type 2 (minipage)
# Group 3 is the \pextra_alignment value; it becomes the inset position.
157 position = mo.group(3)
159 lines[i] = re.sub(pextra_rexp, "", lines[i])
161 start = ["\\begin_inset Minipage",
162 "position " + position,
165 'width "%s"' % width,
171 start = ["","\hfill",""]+start
173 start = ["\\layout Standard"] + start
# j0: the \layout line at or before i-1; j: index from get_next_paragraph.
175 j0 = find_token_backwards(lines,"\\layout", i-1)
176 j = get_next_paragraph(lines, i)
180 # collect more paragraphs to the minipage
182 if j == -1 or not check_token(lines[j], "\\layout"):
184 i = find_re(lines, pextra_type2_rexp2, j+1)
187 mo = pextra_rexp.search(lines[i])
# Group 7 is the \pextra_start_minipage value.
190 if mo.group(7) == "1":
193 lines[i] = re.sub(pextra_rexp, "", lines[i])
194 j = find_tokens(lines, ["\\layout", "\\end_float"], i+1)
197 end = ["\\end_inset "]
# Replace the span from the paragraph's \layout line up to (not including) j
# with the assembled inset.
199 lines[j0:j] = start+mid+end
# NOTE(review): the def line for this statement is not visible here.
# True when no element of `lines` satisfies is_nonempty_line.  The comparison
# with [] relies on filter() returning a list, as it does in Python 2.
204 return filter(is_nonempty_line, lines) == []
# Commands that remove_oldert treats as lines to be moved outside the ERT
# inset (font settings and \end_deeper).
207 move_rexp = re.compile(r"\\(family|series|shape|size|emph|numeric|bar|noun|end_deeper)")
# Things that interrupt a run of ERT text: an inset start, \hfill, or any
# line containing \SpecialChar.
208 ert_rexp = re.compile(r"\\begin_inset|\\hfill|.*\\SpecialChar")
# Splits a line into the text before \SpecialChar (group 1) and the
# \SpecialChar command with whatever follows it (group 2).
209 spchar_rexp = re.compile(r"(.*)(\\SpecialChar.*)")
210 ert_begin = ["\\begin_inset ERT",
# Convert old-style ERT regions in `lines` -- those introduced by
# "\latex latex" or "\layout LaTeX" -- into ERT insets.
216 def remove_oldert(lines):
219 i = find_tokens(lines, ["\\latex latex", "\\layout LaTeX"], i)
224 # \end_inset is for ert inside a tabular cell. The other tokens
226 j = find_tokens(lines, ["\\latex default", "\\layout", "\\begin_inset", "\\end_inset", "\\end_float", "\\the_end"],
# If the candidate end is the start of a nested inset, move j to the line
# after that inset's end.
228 if check_token(lines[j], "\\begin_inset"):
229 j = find_end_of_inset(lines, j)+1
233 if check_token(lines[j], "\\layout"):
234 while j-1 >= 0 and check_token(lines[j-1], "\\begin_deeper"):
237 # We need to remove insets, special chars & font commands from ERT text
# A "\layout LaTeX" paragraph is re-emitted as a Standard paragraph.
240 if check_token(lines[i], "\\layout LaTeX"):
241 new = ["\layout Standard", "", ""]
242 # We have a problem with classes in which Standard is not the default layout!
# k2: next interrupting token (see ert_rexp) in the range [k, j).
246 k2 = find_re(lines, ert_rexp, k, j)
247 inset = hfill = specialchar = 0
250 elif check_token(lines[k2], "\\begin_inset"):
252 elif check_token(lines[k2], "\\hfill"):
# Keep only the text before \SpecialChar on line k2 and remember the
# command itself for later output.
258 mo = spchar_rexp.match(lines[k2])
259 lines[k2] = mo.group(1)
260 specialchar_str = mo.group(2)
264 for line in lines[k:k2]:
265 # Move some lines outside the ERT inset:
266 if move_rexp.match(line):
268 # This is not necessary, but we want the output to be
269 # as similar as possible to the lyx format
272 elif not check_token(line, "\\latex"):
# True when tmp holds at least one non-empty string (Python 2 filter()
# returns a list).
276 if filter(lambda x:x != "", tmp) != []:
278 # This is not necessary, but we want the output to be
279 # as similar as possible to the lyx format
280 lines[i-1] = lines[i-1]+" "
# Wrap the collected text in an ERT inset.
284 new = new+ert_begin+tmp+["\\end_inset ", ""]
# Copy the nested inset (lines k2..k3 inclusive) through unchanged.
287 k3 = find_end_of_inset(lines, k2)
288 new = new+[""]+lines[k2:k3+1]+[""] # Put an empty line after \end_inset
290 # Skip the empty line after \end_inset
291 if not is_nonempty_line(lines[k]):
295 new = new+["\hfill", ""]
299 # This is not necessary, but we want the output to be
300 # as similar as possible to the lyx format
301 lines[i-1] = lines[i-1]+specialchar_str
304 new = new+[specialchar_str, ""]
# Keep the terminating line unless it is itself a \latex token.
310 if not check_token(lines[j], "\\latex "):
311 new = new+[""]+[lines[j]]
315 # Delete remaining "\latex xxx" tokens
318 i = find_token(lines, "\\latex ", i)
324 # ERT insets are a hidden feature of lyx 1.1.6. This might be removed in the future.
#
# For each "\begin_inset ERT" in `lines`, the visible code finds the inset's
# end (j), the first \layout line after the inset start (k) and the index
# returned by get_paragraph for the inset (l), then compares the two lines.
# NOTE(review): the statements that act on that comparison and rewrite
# `lines` are not visible here -- confirm against the full file.
325 def remove_oldertinset(lines):
328 i = find_token(lines, "\\begin_inset ERT", i)
331 j = find_end_of_inset(lines, i)
332 k = find_token(lines, "\\layout", i+1)
333 l = get_paragraph(lines, i)
334 if lines[k] == lines[l]: # same layout
# Test whether the paragraph starting at lines[i] consists of a single ERT
# inset: line i must be "\layout Standard", the next non-empty line must open
# an ERT inset, and the next non-empty line after that inset's end must be a
# \layout token.  The final result is the value check_token returns for that
# last test.
# NOTE(review): what is returned when one of the first two checks fails is
# not visible here.
341 def is_ert_paragraph(lines, i):
342 if not check_token(lines[i], "\\layout Standard"):
345 i = find_nonempty_line(lines, i+1)
346 if not check_token(lines[i], "\\begin_inset ERT"):
349 j = find_end_of_inset(lines, i)
350 k = find_nonempty_line(lines, j+1)
351 return check_token(lines[k], "\\layout")
# For each "\begin_inset ERT" found in `lines`, start from the index that
# get_paragraph returns for it and, while is_ert_paragraph holds there,
# gather ERT content into `text`.
# NOTE(review): how `text` is initialised and what is finally written back to
# `lines` is not visible here.
354 def combine_ert(lines):
357 i = find_token(lines, "\\begin_inset ERT", i)
360 j = get_paragraph(lines, i)
363 while is_ert_paragraph(lines, j):
# Collect the span from the next \layout line after j up to (not including)
# the following \end_inset, then advance j to the next \layout after it.
366 i2 = find_token(lines, "\\layout", j+1)
367 k = find_token(lines, "\\end_inset", i2+1)
368 text = text+lines[i2:k]
369 j = find_token(lines, "\\layout", k+1)
374 j = find_token(lines, "\\layout", i+1)
# Unit suffixes, indexed by the numeric unit code that get_length reads from
# a line.
380 oldunits = ["pt", "cm", "in", "text%", "col%"]
# Look for a line starting with token `name` between `start` and `end` and
# return its length as "<value><unit>".  The line is split on whitespace:
# field 1 is the integer index into oldunits, field 2 is the value.
# NOTE(review): the handling of "token not found" is not visible here;
# remove_figinset compares the result with "", so presumably "" is returned.
382 def get_length(lines, name, start, end):
383 i = find_token(lines, name, start, end)
386 x = string.split(lines[i])
387 return x[2]+oldunits[int(x[1])]
# Append the line "<TAB><token> <value>" to the list `x`.
# NOTE(review): a line between the def and the append is not visible here, so
# the append may be conditional -- confirm.
390 def write_attribute(x, token, value):
392 x.append("\t"+token+" "+value)
# For each "\begin_inset Figure" block in `lines`, read its settings and
# build the lines of a "\begin_inset Graphics FormatVersion 1" block in `new`.
# NOTE(review): the statement that stores `new` back into `lines` is not
# visible here.
395 def remove_figinset(lines):
398 i = find_token(lines, "\\begin_inset Figure", i)
401 j = find_end_of_inset(lines, i)
# The on-screen size comes from the inset's header line: whitespace-separated
# fields 3 and 4, with "pt" appended.
# NOTE(review): the guard only checks for more than 2 fields, yet fields 3
# and 4 are read -- a header with 3 or 4 fields would raise IndexError.
403 if ( len(string.split(lines[i])) > 2 ):
404 lyxwidth = string.split(lines[i])[3]+"pt"
405 lyxheight = string.split(lines[i])[4]+"pt"
# The remaining settings are looked up inside the inset, between i+1 and j.
410 filename = get_value(lines, "file", i+1, j)
412 width = get_length(lines, "width", i+1, j)
413 # what does width=5 mean ?
414 height = get_length(lines, "height", i+1, j)
415 rotateAngle = get_value(lines, "angle", i+1, j)
416 if width == "" and height == "":
421 flags = get_value(lines, "flags", i+1, j)
424 display = "monochrome"
# The caption text is whatever follows the first 11 characters of the
# subcaption line; a non-empty caption is wrapped in double quotes.
431 subcaptionLine = find_token(lines, "subcaption", i+1, j)
432 if subcaptionLine != -1:
433 subcaptionText = lines[subcaptionLine][11:]
434 if subcaptionText != "":
435 subcaptionText = '"'+subcaptionText+'"'
437 k = find_token(lines, "subfigure", i+1,j)
# Assemble the replacement inset.
443 new = ["\\begin_inset Graphics FormatVersion 1"]
444 write_attribute(new, "filename", filename)
445 write_attribute(new, "display", display)
447 new.append("\tsubcaption")
448 write_attribute(new, "subcaptionText", subcaptionText)
449 write_attribute(new, "size_type", size_type)
450 write_attribute(new, "width", width)
451 write_attribute(new, "height", height)
# The rotation attributes are only attempted when an angle was given.
452 if rotateAngle != "":
453 new.append("\trotate")
454 write_attribute(new, "rotateAngle", rotateAngle)
455 write_attribute(new, "rotateOrigin", "leftBaseline")
456 write_attribute(new, "lyxsize_type", "1")
457 write_attribute(new, "lyxwidth", lyxwidth)
458 write_attribute(new, "lyxheight", lyxheight)
459 new = new + ["\end_inset"]
# Matches an attribute (with its leading space) whose value is "false", "0"
# or empty.
463 attr_re = re.compile(r' \w*="(false|0|)"')
# Matches the start of a <features>, <column>, <row> or <cell> tag.
464 line_re = re.compile(r'<(features|column|row|cell)')
# Update every "\begin_inset Tabular" block in `lines` in place: bump the
# <lyxtabular> version attribute from 2 to 3, give <column> tags with an
# empty width the value "0pt", and strip attributes matched by attr_re from
# lines matched by line_re.
466 def update_tabular(lines):
469 i = find_token(lines, '\\begin_inset Tabular', i)
473 for k in get_tabular_lines(lines, i):
474 if check_token(lines[k], "<lyxtabular"):
475 lines[k] = string.replace(lines[k], 'version="2"', 'version="3"')
476 elif check_token(lines[k], "<column"):
477 lines[k] = string.replace(lines[k], 'width=""', 'width="0pt"')
479 if line_re.match(lines[k]):
480 lines[k] = re.sub(attr_re, "", lines[k])
485 # Figure insets are a hidden feature of lyx 1.1.6. This might be removed in the future.
#
# For each "\begin_inset Float " in `lines`, find the next line starting with
# "collapsed" and insert a "wide false" line just before it (in place).
# NOTE(review): any condition guarding the insertion is not visible here.
486 def fix_oldfloatinset(lines):
489 i = find_token(lines, "\\begin_inset Float ", i)
492 j = find_token(lines, "collapsed", i)
494 lines[j:j] = ["wide false"]
# Replace each "\begin_inset LatexCommand \listof..." line in `lines` with a
# "\begin_inset FloatList <type>" line (in place).
498 def change_listof(lines):
501 i = find_token(lines, "\\begin_inset LatexCommand \\listof", i)
# The float type is the word captured after "listof" with its last character
# dropped (e.g. "figures" -> "figure").  Note that the local name `type`
# shadows the builtin inside this function.
504 type = re.search(r"listof(\w*)", lines[i]).group(1)[:-1]
505 lines[i] = "\\begin_inset FloatList "+type
# For each "\begin_inset Info" block in `lines`, build the lines of a
# collapsed "\begin_inset Note" in `new`, with one Standard paragraph per
# line of the original text.
# NOTE(review): the statement that stores `new` back into `lines` is not
# visible here.
509 def change_infoinset(lines):
512 i = find_token(lines, "\\begin_inset Info", i)
# Text on the header line itself: everything after its first 18 characters,
# with leading whitespace removed.
515 txt = string.lstrip(lines[i][18:])
516 new = ["\\begin_inset Note", "collapsed true", ""]
517 j = find_token(lines, "\\end_inset", i)
521 note_lines = lines[i+1:j]
523 note_lines = [txt]+note_lines
525 for line in note_lines:
526 new = new + ["\layout Standard", ""]
# Split the line at literal backslashes; a "\backslash " line is emitted in
# front of a piece (x) in the statement below.
527 tmp = string.split(line, '\\')
530 new = new + ["\\backslash ", x]
# Insert "\use_natbib 0" and "\use_numerical_citations 0" immediately after
# the \use_amsmath line of `lines` (in place).
# NOTE(review): the handling of a missing \use_amsmath line is not visible
# here.
# NOTE(review): the second literal below uses a single backslash, unlike the
# doubled form used elsewhere in this file.  In a Python 2 byte string "\u"
# is not an escape, so the value is the same, but Python 3 would reject it.
535 def change_preamble(lines):
536 i = find_token(lines, "\\use_amsmath", 0)
539 lines[i+1:i+1] = ["\\use_natbib 0",
540 "\use_numerical_citations 0"]
# NOTE(review): the def lines enclosing the statements below are not visible
# here.  The first call works on file.header and the rest on file.body, in
# the order listed; remove_oldfloat also receives `file` itself, from which
# it uses warning() and language.
544 change_preamble(file.header)
545 change_listof(file.body)
546 fix_oldfloatinset(file.body)
547 update_tabular(file.body)
548 remove_pextra(file.body)
549 remove_oldfloat(file.body, file)
550 remove_figinset(file.body)
551 remove_oldertinset(file.body)
552 remove_oldert(file.body)
553 combine_ert(file.body)
554 change_infoinset(file.body)
# Reports through file.error that converting to an older format is not
# implemented; file.format is interpolated into the message.
559 file.error("The convertion to an older format (%s) is not implemented." % file.format)
562 if __name__ == "__main__":