1 # This file is part of lyx2lyx
2 # Copyright (C) 2002 Dekel Tsur <dekel@lyx.org>
4 # This program is free software; you can redistribute it and/or
5 # modify it under the terms of the GNU General Public License
6 # as published by the Free Software Foundation; either version 2
7 # of the License, or (at your option) any later version.
9 # This program is distributed in the hope that it will be useful,
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 # GNU General Public License for more details.
14 # You should have received a copy of the GNU General Public License
15 # along with this program; if not, write to the Free Software
16 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
20 from parser_tools import *
# Float-type table entries: each key is an old float type name and each value
# begins with the "\begin_inset ..." line that opens its replacement inset.
# The "wide-" variants open the same inset line as their plain counterparts.
# NOTE(review): presumably these belong to the `floats` table indexed by
# remove_oldfloat; only the first line of each entry is visible here.
23 "footnote": ["\\begin_inset Foot",
25 "margin": ["\\begin_inset Marginal",
27 "fig": ["\\begin_inset Float figure",
30 "tab": ["\\begin_inset Float table",
33 "alg": ["\\begin_inset Float algorithm",
36 "wide-fig": ["\\begin_inset Float figure",
39 "wide-tab": ["\\begin_inset Float table",
# Font-attribute tokens. remove_oldfloat searches for each of these in the
# text preceding a float and appends a reset line for every one it finds.
44 font_tokens = ["\\family", "\\series", "\\shape", "\\size", "\\emph",
45 "\\bar", "\\noun", "\\color", "\\lang", "\\latex"]
48 # Change \begin_float .. \end_float into \begin_inset Float .. \end_inset
# Convert an old-style "\begin_float <type> ... \end_float" region. The
# replacement is assembled in `new`: the inset opening lines looked up in
# `floats`, the float's content, a closing "\end_inset ", and font reset lines.
#   lines    -- list of lines (convert() passes the document body)
#   language -- text appended after a font token in one of the reset lines
#               (convert() passes the header's "\language" value)
51 def remove_oldfloat(lines, language):
# Locate the next old-style float opener, searching from i.
54 i = find_token(lines, "\\begin_float", i)
57 # There are no nested floats, so finding the end of the float is simple
58 j = find_token(lines, "\\end_float", i+1)
# The second whitespace-separated word of the opener line is the float type.
60 floattype = string.split(lines[i])[1]
# Types missing from the `floats` table are reported on stderr.
61 if not floats.has_key(floattype):
62 sys.stderr.write("Error! Unknown float type "+floattype+"\n")
65 # skip \end_deeper tokens
67 while check_token(lines[i2], "\\end_deeper"):
# Insert i2-(i+1) "\end_deeper " lines at j2, the index that
# get_next_paragraph returns for the text following the float.
70 j2 = get_next_paragraph(lines, j+1)
71 lines[j2:j2] = ["\\end_deeper "]*(i2-(i+1))
# Replacement: inset opening lines, a blank line, the float content
# lines[i2:j], then the inset terminator and a trailing blank line.
73 new = floats[floattype]+[""]
74 new = new+lines[i2:j]+["\\end_inset ", ""]
76 # After a float, all font attributes are reset.
77 # We need to output '\foo default' for every attribute foo
78 # whose value is not default before the float.
79 # The check here is not accurate, but it doesn't matter
80 # as extra '\foo default' commands are ignored.
81 # In fact, it might be safer to output '\foo default' for all
# k is the index get_paragraph returns for line i; the token search below
# is bounded by k and i.
83 k = get_paragraph(lines, i)
85 for token in font_tokens:
86 if find_token(lines, token, k, i) != -1:
88 # This is not necessary, but we want the output to be
89 # as similar as possible to the lyx format
# NOTE(review): the condition that selects between the two appends below
# is not visible in this extract.
93 new.append(token+" "+language)
95 new.append(token+" default ")
# Convert text flagged with "\pextra_type 2" into a "\begin_inset Minipage"
# inset. The replacement is assembled as start + mid + end and spliced over
# lines[j0:j].
#   lines -- list of lines (convert() passes the document body); modified in place
100 def remove_oldminipage(lines):
104 i = find_token(lines, "\\pextra_type 2", i)
# Split the \pextra line into words; the checks below inspect words 4 and 5
# for optional fields.
108 line = string.split(lines[i])
109 if line[4] == "\\pextra_hfill":
112 if line[4] == "\\pextra_start_minipage":
113 # We just ignore this
# A "\pextra_widthp" value is turned into a width with the "col%" unit suffix.
118 if line[4] == "\\pextra_widthp":
119 width = line[5]+"col%"
# Header lines of the new Minipage inset.
122 start = ["\\begin_inset Minipage",
123 "position " + position,
126 'width "%s"' % width,
# Two header variants: one prefixed with an "\hfill" line, one prefixed with
# a "\layout Standard" line.
# NOTE(review): the conditions selecting them are not visible in this extract.
132 start = ["","\hfill",""]+start
134 start = ["\\layout Standard"] + start
136 j = find_token_backwards(lines,"\\layout", i-1)
# The content of this paragraph runs up to the next "\layout" or "\end_float".
140 j = find_tokens(lines, ["\\layout", "\\end_float"], i+1)
141 # j can be -1, but this is still ok
142 mid = mid+lines[i+1:j]
146 # collect more paragraphs to the minipage
148 if j == -1 or not check_token(lines[j], "\\layout"):
150 i = find_tokens(lines, ["\\layout", "\\pextra_type"], j+1)
151 if i == -1 or not check_token(lines[i], "\\pextra_type"):
# Same field inspection as above, applied to the following \pextra line.
153 line = string.split(lines[i])
154 if line[4] == "\\pextra_hfill":
156 if line[4] == "\\pextra_start_minipage" and line[5] == "1":
159 j = find_token_backwards(lines,"\\layout", i-1)
161 j = find_tokens(lines, ["\\layout", "\\end_float"], i+1)
162 mid = mid+lines[i+1:j]
164 end = ["\\end_inset "]
# Splice the assembled inset over the original lines.
166 lines[j0:j] = start+mid+end
170 return filter(is_nonempty_line, lines) == []
# font_rexp: matches a line starting with one of the listed font commands.
172 font_rexp = re.compile(r"\\(family|series|shape|size|emph|numeric|bar|noun)")
# ert_rexp: matches a line that starts with "\begin_inset" or that contains
# "\SpecialChar" anywhere.
173 ert_rexp = re.compile(r"\\begin_inset|.*\\SpecialChar")
# spchar_rexp: group 1 is the text before "\SpecialChar", group 2 is the
# special char and the rest of the line.
174 spchar_rexp = re.compile(r"(.*)(\\SpecialChar.*)")
# Opening lines of an ERT inset, prepended to collected ERT text in remove_oldert.
175 ert_begin = ["\\begin_inset ERT",
# Convert old LaTeX-mode text ("\latex latex" runs and "\layout LaTeX"
# paragraphs) into "\begin_inset ERT" insets. As the comment in the body says,
# insets, special chars and font commands have to be kept out of the ERT text;
# the output for each region is accumulated in `new`.
#   lines -- list of lines to convert
180 def remove_oldert(lines):
# Start of the next LaTeX-mode region.
183 i = find_tokens(lines, ["\\latex latex", "\\layout LaTeX"], i)
# Candidate terminators of the region.
188 j = find_tokens(lines, ["\\latex default", "\\begin_inset", "\\layout", "\\end_float", "\\the_end"],
# When the terminator found is an inset opener, move j to that inset's end.
190 if check_token(lines[j], "\\begin_inset"):
191 j = find_end_of_inset(lines, j)
# When it is a "\layout" line, look at preceding "\begin_deeper" lines.
195 if check_token(lines[j], "\\layout"):
196 while j-1 >= 0 and check_token(lines[j-1], "\\begin_deeper"):
199 # We need to remove insets, special chars & font commands from ERT text
# A "\layout LaTeX" paragraph is restarted as a Standard paragraph.
202 if check_token(lines[i], "\\layout LaTeX"):
203 new = ["\layout Standard", "", ""]
204 # We have a problem with classes in which Standard is not the default layout!
# k2: next line between k and j that opens an inset or holds a "\SpecialChar".
208 k2 = find_re(lines, ert_rexp, k, j)
209 inset = specialchar = 0
212 elif check_token(lines[k2], "\\begin_inset"):
# Split a special-char line: the text before it stays in lines[k2], the
# special char itself is kept aside in specialchar_str.
216 mo = spchar_rexp.match(lines[k2])
217 lines[k2] = mo.group(1)
218 specialchar_str = mo.group(2)
# Go through the chunk lines[k:k2], treating font-command lines and "\latex"
# lines separately from the remaining lines.
222 for line in lines[k:k2]:
223 if font_rexp.match(line):
225 # This is not necessary, but we want the output to be
226 # as similar as possible to the lyx format
229 elif not check_token(line, "\\latex"):
# Only act when tmp holds at least one non-empty string.
233 if filter(lambda x:x != "", tmp) != []:
235 # This is not necessary, but we want the output to be
236 # as similar as possible to the lyx format
237 lines[i-1] = lines[i-1]+" "
# Wrap the collected text in an ERT inset.
241 new = new+ert_begin+tmp+["\\end_inset ", ""]
# Copy a nested inset (opener through its end) to the output as-is.
244 k3 = find_end_of_inset(lines, k2)
245 new = new+[""]+lines[k2:k3+1]+[""] # Put an empty line after \end_inset
247 # Skip the empty line after \end_inset
248 if not is_nonempty_line(lines[k]):
253 # This is not necessary, but we want the output to be
254 # as similar as possible to the lyx format
# The special char is either appended to the line before the region or
# emitted as its own output line.
# NOTE(review): the condition selecting between the two is not visible here.
255 lines[i-1] = lines[i-1]+specialchar_str
258 new = new+[specialchar_str, ""]
# A terminator line that is not a "\latex " token is carried into the output.
264 if not check_token(lines[j], "\\latex "):
265 new = new+[""]+[lines[j]]
# Look for a "\latex " token, searching from i.
271 i = find_token(lines, "\\latex ", i)
# Examine "\begin_inset ERT" insets: for each one, compare the first "\layout"
# line found after the inset opener with the line get_paragraph returns for
# the inset.
# NOTE(review): what is done when the two layouts match is not visible here.
#   lines -- list of lines (convert() passes the document body)
277 def remove_oldertinset(lines):
280 i = find_token(lines, "\\begin_inset ERT", i)
283 j = find_end_of_inset(lines, i)
# k: first "\layout" line at or after i+1; l: index returned by get_paragraph.
284 k = find_token(lines, "\\layout", i+1)
285 l = get_paragraph(lines, i)
286 if lines[k] == lines[l]: # same layout
# Check the shape of the paragraph that starts at line i: look at the first
# non-empty line after i, which is tested for being an ERT inset opener, and
# return whether the first non-empty line after that inset's end is a
# "\layout" token.
#   lines -- list of lines
#   i     -- index of the paragraph's first line (combine_ert passes the
#            index of a "\layout" line)
292 def is_ert_paragraph(lines, i):
293 i = find_nonempty_line(lines, i+1)
294 if not check_token(lines[i], "\\begin_inset ERT"):
296 j = find_end_of_inset(lines, i)
297 k = find_nonempty_line(lines, j+1)
298 return check_token(lines[k], "\\layout")
# Gather the text of consecutive ERT-only paragraphs: starting from the
# "\layout" line that precedes an ERT inset, keep collecting lines into `text`
# for as long as is_ert_paragraph holds for the current paragraph.
# NOTE(review): how `text` is written back is not visible in this extract.
#   lines -- list of lines
300 def combine_ert(lines):
303 i = find_token(lines, "\\begin_inset ERT", i)
# j: the "\layout" line at or before i-1, i.e. the start of the paragraph.
306 j = find_token_backwards(lines,"\\layout", i-1)
309 while is_ert_paragraph(lines, j):
# Collect from the first "\layout" after j up to (not including) the
# next "\end_inset", then advance j to the following "\layout" line.
312 i2 = find_token(lines, "\\layout", j+1)
313 k = find_token(lines, "\\end_inset", i2+1)
314 text = text+lines[i2:k]
315 j = find_token(lines, "\\layout", k+1)
320 j = find_token(lines, "\\layout", i+1)
# Unit suffixes, indexed by the integer unit code that get_length reads from
# an old length field.
325 oldunits = ["pt", "cm", "in", "text%", "col%"]
# Read an old-format length attribute and return it as "<value><unit>".
#   lines      -- list of lines
#   name       -- token to look for
#   start, end -- bounds passed to find_token for the search
# The matching line is split on whitespace: word 1 is an integer index into
# oldunits and word 2 is the numeric value.
327 def get_length(lines, name, start, end):
328 i = find_token(lines, name, start, end)
331 x = string.split(lines[i])
332 return x[2]+oldunits[int(x[1])]
# Append a tab-indented "<token> <value>" line to the list x.
#   x     -- list of output lines, modified in place
#   token -- attribute name
#   value -- attribute value (a string)
334 def write_attribute(x, token, value):
336 x.append("\t"+token+" "+value)
# Convert an old "\begin_inset Figure" inset into a
# "\begin_inset Graphics FormatVersion 1" inset. The old attributes are read
# from the lines between the inset opener and its end, and the new inset is
# assembled line by line in `new`.
#   lines -- list of lines (convert() passes the document body)
338 def remove_figinset(lines):
341 i = find_token(lines, "\\begin_inset Figure", i)
344 j = find_end_of_inset(lines, i)
# Words 3 and 4 of the opener line, with "pt" appended, become the
# lyxwidth / lyxheight attributes.
346 lyxwidth = string.split(lines[i])[3]+"pt"
347 lyxheight = string.split(lines[i])[4]+"pt"
349 filename = get_value(lines, "file", i+1, j)
351 width = get_length(lines, "width", i+1, j)
352 # what does width=5 mean ?
353 height = get_length(lines, "height", i+1, j)
354 rotateAngle = get_value(lines, "angle", i+1, j)
355 if width == "" and height == "":
360 flags = get_value(lines, "flags", i+1, j)
363 display = "monochrome"
# A non-empty subcaption is wrapped in double quotes.
369 subcaptionText = get_value(lines, "subcaption", i+1, j)
370 if subcaptionText != "":
371 subcaptionText = '"'+subcaptionText+'"'
372 k = find_token(lines, "subfigure", i+1,j)
# Assemble the replacement Graphics inset.
378 new = ["\\begin_inset Graphics FormatVersion 1"]
379 write_attribute(new, "filename", filename)
380 write_attribute(new, "display", display)
382 new.append("\tsubcaption")
383 write_attribute(new, "subcaptionText", subcaptionText)
384 write_attribute(new, "size_type", size_type)
385 write_attribute(new, "width", width)
386 write_attribute(new, "height", height)
# Rotation attributes are written only when an angle was present.
387 if rotateAngle != "":
388 new.append("\trotate")
389 write_attribute(new, "rotateAngle", rotateAngle)
390 write_attribute(new, "rotateOrigin", "leftBaseline")
391 write_attribute(new, "lyxsize_type", "1")
392 write_attribute(new, "lyxwidth", lyxwidth)
393 write_attribute(new, "lyxheight", lyxheight)
394 new = new + ["\end_inset"]
# attr_re: an attribute (with its leading space) whose quoted value is
# "false", "0" or empty; update_tabular deletes such attributes.
397 attr_re = re.compile(r' \w*="(false|0|)"')
# line_re: a line starting with a features, column, row or cell tag.
398 line_re = re.compile(r'<(features|column|row|cell)')
# Update a "\begin_inset Tabular" inset in place: bump the version attribute
# on the line after the opener from 2 to 3, then adjust the lines up to the
# closing "</lyxtabular>" tag.
#   lines -- list of lines, modified in place
400 def update_tabular(lines):
403 i = find_token(lines, '\\begin_inset Tabular', i)
407 # scan table header meta-info
408 lines[i+1] = string.replace(lines[i+1], 'version="2"', 'version="3"')
410 j = find_token(lines, '</lyxtabular>', i)
414 for k in xrange(i+2,j):
# An empty column width becomes an explicit "0pt".
415 if check_token(lines[k], "<column"):
416 lines[k] = string.replace(lines[k], 'width=""', 'width="0pt"')
# On features/column/row/cell lines, strip attributes whose value is
# "false", "0" or empty.
417 if line_re.match(lines[k]):
418 lines[k] = re.sub(attr_re, "", lines[k])
# Insert the "\use_natbib 0" and "\use_numerical_citations 0" settings
# immediately after the "\use_amsmath" line.
#   lines -- list of lines (convert() passes the document header); modified in place
422 def change_preamble(lines):
423 i = find_token(lines, "\\use_amsmath", 0)
# NOTE(review): the second literal uses a single backslash ("\u"). That is a
# literal backslash in a Python 2 byte string, but Python 3 rejects it as a
# truncated \uXXXX escape; the other tokens in this file use "\\".
426 lines[i+1:i+1] = ["\\use_natbib 0",
427 "\use_numerical_citations 0"]
# Run the conversion steps on a document split into header and body.
#   header -- list of header lines; the "\language" value is read from it and
#             change_preamble updates it
#   body   -- list of body lines, rewritten by the remove_* steps in the order
#             shown below
429 def convert(header, body):
430 language = get_value(header, "\\language", 0)
434 change_preamble(header)
436 remove_oldminipage(body)
# The document language is passed on for the font reset lines.
437 remove_oldfloat(body, language)
438 remove_figinset(body)
439 remove_oldertinset(body)
443 if __name__ == "__main__":