X-Git-Url: https://git.lyx.org/gitweb/?a=blobdiff_plain;f=lib%2Flyx2lyx%2Flyx_1_6.py;h=071280836b670f61213117e800e25e9764eedaaa;hb=0984e113171297e402c88ce048e9ccf1fb3d3619;hp=87d0d4b4a41822f53d9891b53667ee09a5f0612e;hpb=41c028cce511ec3644bcf24ffcb1ea0ac42d0262;p=lyx.git diff --git a/lib/lyx2lyx/lyx_1_6.py b/lib/lyx2lyx/lyx_1_6.py index 87d0d4b4a4..071280836b 100644 --- a/lib/lyx2lyx/lyx_1_6.py +++ b/lib/lyx2lyx/lyx_1_6.py @@ -14,7 +14,7 @@ # # You should have received a copy of the GNU General Public License # along with this program; if not, write to the Free Software -# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. +# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA """ Convert files to the file format generated by lyx 1.6""" @@ -22,11 +22,28 @@ import re import unicodedata import sys, os -from parser_tools import find_token, find_end_of, find_tokens, get_value, get_value_string +from parser_tools import find_token, find_end_of, find_tokens, get_value +from unicode_symbols import read_unicodesymbols #################################################################### # Private helper functions + +def get_value_string(lines, token, start, end = 0, trim = False, default = ""): + """ get_value_string(lines, token, start[[, end], trim, default]) -> string + + Return tokens after token as string, in lines, where + token is the first element. When trim is used, the first and last character + of the string is trimmed.""" + + val = get_value(lines, token, start, end, "") + if not val: + return default + if trim: + return val[1:-1] + return val + + def find_end_of_inset(lines, i): " Find end of inset, where lines[i] is included." return find_end_of(lines, i, "\\begin_inset", "\\end_inset") @@ -35,7 +52,7 @@ def find_end_of_inset(lines, i): # DO NOT do this: # document.body[i] = wrap_insert_ert(...) # wrap_into_ert may returns a multiline string, which should NOT appear -# in document.body. Insetad, do something like this: +# in document.body. Instead, do something like this: # subst = wrap_inset_ert(...) # subst = subst.split('\n') # document.body[i:i+1] = subst @@ -50,6 +67,8 @@ def wrap_into_ert(string, src, dst): + dst + '\n\\end_layout\n\\end_inset\n') def put_cmd_in_ert(string): + for rep in unicode_reps: + string = string.replace(rep[1], rep[0].replace('\\\\', '\\')) string = string.replace('\\', "\\backslash\n") string = "\\begin_inset ERT\nstatus collapsed\n\\begin_layout Standard\n" \ + string + "\n\\end_layout\n\\end_inset" @@ -76,7 +95,7 @@ def convert_len(len): "theight%":"\\backslash\ntextheight", "pheight%":"\\backslash\npageheight"} # Convert LyX units to LaTeX units - for unit in units.keys(): + for unit in list(units.keys()): if len.find(unit) != -1: len = '%f' % (len2value(len) / 100) len = len.strip('0') + units[unit] @@ -127,15 +146,25 @@ def set_option(document, m, option, value): return l -def read_unicodesymbols(): +# FIXME: Remove this function if the version imported from unicode_symbols works. +# This function was the predecessor from that function, that in the meanwhile got +# new fixes. +def read_unicodesymbols2(): " Read the unicodesymbols list of unicode characters and corresponding commands." + + # Provide support for both python 2 and 3 + PY2 = sys.version_info[0] == 2 + if not PY2: + unichr = chr + # End of code to support for both python 2 and 3 + pathname = os.path.abspath(os.path.dirname(sys.argv[0])) fp = open(os.path.join(pathname.strip('lyx2lyx'), 'unicodesymbols')) spec_chars = [] # Two backslashes, followed by some non-word character, and then a character # in brackets. The idea is to check for constructs like: \"{u}, which is how # they are written in the unicodesymbols file; but they can also be written - # as: \"u. + # as: \"u or even \" u. r = re.compile(r'\\\\(\W)\{(\w)\}') for line in fp.readlines(): if line[0] != '#' and line.strip() != "": @@ -156,8 +185,11 @@ def read_unicodesymbols(): # since it is done that way in the LyX file. if m.group(1) == "\"": command += "\\" + commandbl = command command += m.group(1) + m.group(2) + commandbl += m.group(1) + ' ' + m.group(2) spec_chars.append([command, unichr(eval(ucs4))]) + spec_chars.append([commandbl, unichr(eval(ucs4))]) fp.close() return spec_chars @@ -204,7 +236,7 @@ def extract_argument(line): return (line[:pos + 1], line[pos + 1:]) -def latex2ert(line): +def latex2ert(line, isindex): '''Converts LaTeX commands into ERT. line may well be a multi-line string when it is returned.''' if not line: @@ -238,29 +270,40 @@ def latex2ert(line): retval += "\n" + cmd + "\n" line = end m = labelre.match(line) + # put all remaining braces in ERT + line = wrap_into_ert(line, '}', '}') + line = wrap_into_ert(line, '{', '{') + if isindex: + # active character that is not available in all font encodings + line = wrap_into_ert(line, '|', '|') retval += line return retval +unicode_reps = read_unicodesymbols() + #Bug 5022.... #Might should do latex2ert first, then deal with stuff that DOESN'T #end up inside ERT. That routine could be modified so that it returned #a list of lines, and we could then skip ERT bits and only deal with #the other bits. -def latex2lyx(data): +def latex2lyx(data, isindex): '''Takes a string, possibly multi-line, and returns the result of converting LaTeX constructs into LyX constructs. Returns a list of - lines, suitable for insertion into document.body.''' + lines, suitable for insertion into document.body. + The bool isindex specifies whether we are in an index macro (which + has some specific active characters that need to be ERTed).''' + if not data: + return [""] retval = [] # Convert LaTeX to Unicode - reps = read_unicodesymbols() # Commands of this sort need to be checked to make sure they are # followed by a non-alpha character, lest we replace too much. hardone = re.compile(r'^\\\\[a-zA-Z]+$') - for rep in reps: + for rep in unicode_reps: if hardone.match(rep[0]): pos = 0 while True: @@ -277,8 +320,11 @@ def latex2lyx(data): else: data = data.replace(rep[0], rep[1]) - # Generic, \" -> ": + # Generic + # \" -> ": data = wrap_into_ert(data, r'\"', '"') + # \\ -> \: + data = data.replace('\\\\', '\\') # Math: mathre = re.compile('^(.*?)(\$.*?\$)(.*)') @@ -295,94 +341,100 @@ def latex2lyx(data): g = m.group(3) if s: # this is non-math! - s = latex2ert(s) + s = latex2ert(s, isindex) subst = s.split('\n') retval += subst retval.append("\\begin_inset Formula " + f) retval.append("\\end_inset") m = mathre.match(g) # Handle whatever is left, which is just text - g = latex2ert(g) + g = latex2ert(g, isindex) subst = g.split('\n') retval += subst return retval +def lyxline2latex(document, line, inert): + 'Convert some LyX stuff into corresponding LaTeX stuff line-wise, as best we can.' + if line.startswith("\\begin_inset Formula"): + line = line[20:] + elif line.startswith("\\begin_inset Quotes"): + # For now, we do a very basic reversion. Someone who understands + # quotes is welcome to fix it up. + qtype = line[20:].strip() + # lang = qtype[0] + side = qtype[1] + dbls = qtype[2] + if side == "l": + if dbls == "d": + line = "``" + else: + line = "`" + else: + if dbls == "d": + line = "''" + else: + line = "'" + elif line.isspace() or \ + line.startswith("\\begin_layout") or \ + line.startswith("\\end_layout") or \ + line.startswith("\\begin_inset") or \ + line.startswith("\\end_inset") or \ + line.startswith("\\lang") or \ + line.strip() == "status collapsed" or \ + line.strip() == "status open": + #skip all that stuff + return "" + + # this needs to be added to the preamble because of cases like + # \textmu, \textbackslash, etc. + add_to_preamble(document, ['% added by lyx2lyx for converted entries', + '\\@ifundefined{textmu}', + ' {\\usepackage{textcomp}}{}']) + # a lossless reversion is not possible + # try at least to handle some common insets and settings + if inert: + line = line.replace(r'\backslash', '\\') + else: + line = line.replace('&', '\\&{}') + line = line.replace('#', '\\#{}') + line = line.replace('^', '\\^{}') + line = line.replace('%', '\\%{}') + line = line.replace('_', '\\_{}') + line = line.replace('$', '\\${}') + + # Do the LyX text --> LaTeX conversion + for rep in unicode_reps: + line = line.replace(rep[1], rep[0].replace('\\\\', '\\') + "{}") + line = line.replace(r'\backslash', r'\textbackslash{}') + line = line.replace(r'\series bold', r'\bfseries{}').replace(r'\series default', r'\mdseries{}') + line = line.replace(r'\shape italic', r'\itshape{}').replace(r'\shape smallcaps', r'\scshape{}') + line = line.replace(r'\shape slanted', r'\slshape{}').replace(r'\shape default', r'\upshape{}') + line = line.replace(r'\emph on', r'\em{}').replace(r'\emph default', r'\em{}') + line = line.replace(r'\noun on', r'\scshape{}').replace(r'\noun default', r'\upshape{}') + line = line.replace(r'\bar under', r'\underbar{').replace(r'\bar default', r'}') + line = line.replace(r'\family sans', r'\sffamily{}').replace(r'\family default', r'\normalfont{}') + line = line.replace(r'\family typewriter', r'\ttfamily{}').replace(r'\family roman', r'\rmfamily{}') + line = line.replace(r'\InsetSpace ', r'').replace(r'\SpecialChar ', r'') + return line + + def lyx2latex(document, lines): 'Convert some LyX stuff into corresponding LaTeX stuff, as best we can.' # clean up multiline stuff content = "" ert_end = 0 - reps = read_unicodesymbols() for curline in range(len(lines)): - line = lines[curline] - if line.startswith("\\begin_inset ERT"): - # We don't want to replace things inside ERT, so figure out - # where the end of the inset is. - ert_end = find_end_of_inset(lines, curline + 1) - continue - elif line.startswith("\\begin_inset Formula"): - line = line[20:] - elif line.startswith("\\begin_inset Quotes"): - # For now, we do a very basic reversion. Someone who understands - # quotes is welcome to fix it up. - qtype = line[20:].strip() - # lang = qtype[0] - side = qtype[1] - dbls = qtype[2] - if side == "l": - if dbls == "d": - line = "``" - else: - line = "`" - else: - if dbls == "d": - line = "''" - else: - line = "'" - elif line.isspace() or \ - line.startswith("\\begin_layout") or \ - line.startswith("\\end_layout") or \ - line.startswith("\\begin_inset") or \ - line.startswith("\\end_inset") or \ - line.startswith("\\lang") or \ - line.strip() == "status collapsed" or \ - line.strip() == "status open": - #skip all that stuff - continue - - # this needs to be added to the preamble because of cases like - # \textmu, \textbackslash, etc. - add_to_preamble(document, ['% added by lyx2lyx for converted index entries', - '\\@ifundefined{textmu}', - ' {\\usepackage{textcomp}}{}']) - # a lossless reversion is not possible - # try at least to handle some common insets and settings - if ert_end >= curline: - line = line.replace(r'\backslash', r'\\') - else: - line = line.replace('&', '\\&{}') - line = line.replace('#', '\\#{}') - line = line.replace('^', '\\^{}') - line = line.replace('%', '\\%{}') - line = line.replace('_', '\\_{}') - line = line.replace('$', '\\${}') - - # Do the LyX text --> LaTeX conversion - for rep in reps: - line = line.replace(rep[1], rep[0] + "{}") - line = line.replace(r'\backslash', r'\textbackslash{}') - line = line.replace(r'\series bold', r'\bfseries{}').replace(r'\series default', r'\mdseries{}') - line = line.replace(r'\shape italic', r'\itshape{}').replace(r'\shape smallcaps', r'\scshape{}') - line = line.replace(r'\shape slanted', r'\slshape{}').replace(r'\shape default', r'\upshape{}') - line = line.replace(r'\emph on', r'\em{}').replace(r'\emph default', r'\em{}') - line = line.replace(r'\noun on', r'\scshape{}').replace(r'\noun default', r'\upshape{}') - line = line.replace(r'\bar under', r'\underbar{').replace(r'\bar default', r'}') - line = line.replace(r'\family sans', r'\sffamily{}').replace(r'\family default', r'\normalfont{}') - line = line.replace(r'\family typewriter', r'\ttfamily{}').replace(r'\family roman', r'\rmfamily{}') - line = line.replace(r'\InsetSpace ', r'').replace(r'\SpecialChar ', r'') - content += line + line = lines[curline] + if line.startswith("\\begin_inset ERT"): + # We don't want to replace things inside ERT, so figure out + # where the end of the inset is. + ert_end = find_end_of_inset(lines, curline + 1) + continue + inert = ert_end >= curline + content += lyxline2latex(document, lines[curline], inert) + return content @@ -397,6 +449,7 @@ def convert_ltcaption(document): j = find_end_of_inset(document.body, i + 1) if j == -1: document.warning("Malformed LyX document: Could not find end of tabular.") + i += 1 continue nrows = int(document.body[i+1].split('"')[3]) @@ -447,6 +500,7 @@ def revert_ltcaption(document): j = find_end_of_inset(document.body, i + 1) if j == -1: document.warning("Malformed LyX document: Could not find end of tabular.") + i += 1 continue m = i + 1 @@ -487,6 +541,7 @@ def convert_tablines(document): j = find_end_of_inset(document.body, i + 1) if j == -1: document.warning("Malformed LyX document: Could not find end of tabular.") + i += 1 continue m = i + 1 @@ -546,9 +601,10 @@ def revert_tablines(document): i = find_token(document.body, "\\begin_inset Tabular", i) if i == -1: return - j = find_end_of_inset(document.body, i + 1) + j = find_end_of_inset(document.body, i) if j == -1: document.warning("Malformed LyX document: Could not find end of tabular.") + i += 1 continue m = i + 1 @@ -625,6 +681,7 @@ def fix_wrong_tables(document): j = find_end_of_inset(document.body, i + 1) if j == -1: document.warning("Malformed LyX document: Could not find end of tabular.") + i += 1 continue m = i + 1 @@ -747,7 +804,7 @@ def convert_flex(document): document.body[i] = document.body[i].replace('\\begin_inset CharStyle', '\\begin_inset Flex') def revert_flex(document): - "Convert Flex to CharStyle" + "Revert Flex to CharStyle" i = 0 while True: i = find_token(document.body, "\\begin_inset Flex", i) @@ -756,7 +813,6 @@ def revert_flex(document): document.body[i] = document.body[i].replace('\\begin_inset Flex', '\\begin_inset CharStyle') -# Discard PDF options for hyperref def revert_pdf_options(document): "Revert PDF options for hyperref." # store the PDF options and delete the entries from the Lyx file @@ -920,7 +976,7 @@ def revert_pdf_options(document): def remove_inzip_options(document): "Remove inzipName and embed options from the Graphics inset" i = 0 - while 1: + while True: i = find_token(document.body, "\\begin_inset Graphics", i) if i == -1: return @@ -928,6 +984,8 @@ def remove_inzip_options(document): if j == -1: # should not happen document.warning("Malformed LyX document: Could not find end of graphics inset.") + i += 1 + continue # If there's a inzip param, just remove that k = find_token(document.body, "\tinzipName", i + 1, j) if k != -1: @@ -946,7 +1004,7 @@ def convert_inset_command(document): LatexCommand cmd """ i = 0 - while 1: + while True: i = find_token(document.body, "\\begin_inset LatexCommand", i) if i == -1: return @@ -985,7 +1043,7 @@ def revert_inset_command(document): will not be able to recognize. Not sure what to do about that. """ i = 0 - while 1: + while True: i = find_token(document.body, "\\begin_inset CommandInset", i) if i == -1: return @@ -994,6 +1052,7 @@ def revert_inset_command(document): m = r.match(nextline) if not m: document.warning("Malformed LyX document: Missing LatexCommand in " + document.body[i] + ".") + i += 1 continue cmdName = m.group(1) insertion = ["\\begin_inset LatexCommand " + cmdName] @@ -1054,7 +1113,7 @@ def revert_wrapfig_options(document): def convert_latexcommand_index(document): - "Convert from LatexCommand form to collapsable form." + "Convert from LatexCommand form to collapsible form." i = 0 r1 = re.compile('name "(.*)"') while True: @@ -1062,10 +1121,11 @@ def convert_latexcommand_index(document): if i == -1: return if document.body[i + 1] != "LatexCommand index": # Might also be index_print - return - j = find_end_of_inset(document.body, i + 2) + i += 1 + continue + j = find_end_of_inset(document.body, i + 1) if j == -1: - document.warning("Unable to find end of index inset at line " + i + "!") + document.warning("Unable to find end of index inset at line " + str(i) + "!") i += 2 continue m = r1.match(document.body[i + 2]) @@ -1075,7 +1135,7 @@ def convert_latexcommand_index(document): linelist = [""] else: fullcontent = m.group(1) - linelist = latex2lyx(fullcontent) + linelist = latex2lyx(fullcontent, True) #document.warning(fullcontent) linelist = ["\\begin_inset Index", "status collapsed", "\\begin_layout Standard", ""] + \ @@ -1085,7 +1145,7 @@ def convert_latexcommand_index(document): def revert_latexcommand_index(document): - "Revert from collapsable form to LatexCommand form." + "Revert from collapsible form to LatexCommand form." i = 0 while True: i = find_token(document.body, "\\begin_inset Index", i) @@ -1206,7 +1266,7 @@ def revert_japanese_encoding(document): def revert_inset_info(document): 'Replace info inset with its content' i = 0 - while 1: + while True: i = find_token(document.body, '\\begin_inset Info', i) if i == -1: return @@ -1214,11 +1274,22 @@ def revert_inset_info(document): if j == -1: # should not happen document.warning("Malformed LyX document: Could not find end of Info inset.") + i += 1 + continue type = 'unknown' arg = '' for k in range(i, j+1): if document.body[k].startswith("arg"): - arg = document.body[k][3:].strip().strip('"') + arg = document.body[k][3:].strip() + # remove embracing quotation marks + if arg[0] == '"': + arg = arg[1:] + if arg[len(arg) - 1] == '"': + arg = arg[:len(arg) - 1] + # \" to straight quote + arg = arg.replace(r'\"', '"') + # \ to \backslash + arg = arg.replace(r'\\', "\\backslash\n") if document.body[k].startswith("type"): type = document.body[k][4:].strip().strip('"') # I think there is a newline after \\end_inset, which should be removed. @@ -1291,13 +1362,13 @@ def convert_url(document): j = find_token(document.body, "target", i) if j == -1: document.warning("Malformed LyX document: Can't find target for url inset") - i = j + i += 1 continue target = document.body[j][8:-1] k = find_token(document.body, "\\end_inset", j) if k == -1: document.warning("Malformed LyX document: Can't find end of url inset") - i = k + i = j continue newstuff = ["\\begin_inset Flex URL", "status collapsed", "", @@ -1307,7 +1378,7 @@ def convert_url(document): "\\end_layout", ""] document.body[i:k] = newstuff - i = k + i = i + len(newstuff) def convert_ams_classes(document): tc = document.textclass @@ -1536,6 +1607,44 @@ def convert_usorbian(document): j = j + 1 +def convert_macro_global(document): + "Remove TeX code command \global when it is in front of a macro" + # math macros are nowadays already defined \global, so that an additional + # \global would make the document uncompilable, see + # http://www.lyx.org/trac/ticket/5371 + # We're looking for something like this: + # \begin_inset ERT + # status collapsed + # + # \begin_layout Plain Layout + # + # + # \backslash + # global + # \end_layout + # + # \end_inset + # + # + # \begin_inset FormulaMacro + # \renewcommand{\foo}{123} + # \end_inset + i = 0 + while True: + i = find_token(document.body, "\\begin_inset FormulaMacro", i) + if i == -1: + return + # if i <= 13, then there isn't enough room for the ERT + if i <= 12: + i += 1 + continue + if document.body[i-6] == "global": + del document.body[i-13 : i] + i = i - 12 + else: + i += 1 + + def revert_macro_optional_params(document): "Convert macro definitions with optional parameters into ERTs" # Stub to convert macro definitions with one or more optional parameters @@ -1638,7 +1747,7 @@ def convert_serbocroatian(document): def convert_framed_notes(document): "Convert framed notes to boxes. " i = 0 - while 1: + while True: i = find_tokens(document.body, ["\\begin_inset Note Framed", "\\begin_inset Note Shaded"], i) if i == -1: return @@ -1667,7 +1776,7 @@ def convert_module_names(document): return newmodlist = [] for mod in modlist: - if modulemap.has_key(mod): + if mod in modulemap: newmodlist.append(modulemap[mod]) else: document.warning("Can't find module %s in the module map!" % mod) @@ -1686,7 +1795,7 @@ def revert_module_names(document): return newmodlist = [] for mod in modlist: - if modulemap.has_key(mod): + if mod in modulemap: newmodlist.append(modulemap[mod]) else: document.warning("Can't find module %s in the module map!" % mod) @@ -1715,7 +1824,7 @@ def revert_colsep(document): def revert_framed_notes(document): "Revert framed boxes to notes. " i = 0 - while 1: + while True: i = find_tokens(document.body, ["\\begin_inset Box Framed", "\\begin_inset Box Shaded"], i) if i == -1: @@ -1724,19 +1833,24 @@ def revert_framed_notes(document): if j == -1: # should not happen document.warning("Malformed LyX document: Could not find end of Box inset.") + i += 1 + continue k = find_token(document.body, "status", i + 1, j) if k == -1: document.warning("Malformed LyX document: Missing `status' tag in Box inset.") - return + i = j + continue status = document.body[k] l = find_default_layout(document, i + 1, j) if l == -1: document.warning("Malformed LyX document: Missing `\\begin_layout' in Box inset.") - return + i = j + continue m = find_token(document.body, "\\end_layout", i + 1, j) if m == -1: document.warning("Malformed LyX document: Missing `\\end_layout' in Box inset.") - return + i = j + continue ibox = find_token(document.body, "has_inner_box 1", i + 1, k) pbox = find_token(document.body, "use_parbox 1", i + 1, k) if ibox == -1 and pbox == -1: @@ -1756,45 +1870,51 @@ def revert_framed_notes(document): def revert_slash(document): 'Revert \\SpecialChar \\slash{} to ERT' - r = re.compile(r'\\SpecialChar \\slash{}') i = 0 while i < len(document.body): - m = r.match(document.body[i]) + m = re.match(r'(.*)\\SpecialChar \\slash{}(.*)', document.body[i]) if m: - subst = ['\\begin_inset ERT', - 'status collapsed', '', - '\\begin_layout Standard', - '', '', '\\backslash', - 'slash{}', - '\\end_layout', '', - '\\end_inset', ''] - document.body[i: i+1] = subst - i = i + len(subst) + before = m.group(1) + after = m.group(2) + subst = [before, + '\\begin_inset ERT', + 'status collapsed', '', + '\\begin_layout Standard', + '', '', '\\backslash', + 'slash{}', + '\\end_layout', '', + '\\end_inset', '', + after] + document.body[i: i+1] = subst + i = i + len(subst) else: - i = i + 1 + i = i + 1 def revert_nobreakdash(document): 'Revert \\SpecialChar \\nobreakdash- to ERT' i = 0 while i < len(document.body): - line = document.body[i] - r = re.compile(r'\\SpecialChar \\nobreakdash-') - m = r.match(line) + m = re.match(r'(.*)\\SpecialChar \\nobreakdash-(.*)', document.body[i]) if m: - subst = ['\\begin_inset ERT', + before = m.group(1) + after = m.group(2) + subst = [before, + '\\begin_inset ERT', 'status collapsed', '', '\\begin_layout Standard', '', '', '\\backslash', 'nobreakdash-', '\\end_layout', '', - '\\end_inset', ''] - document.body[i:i+1] = subst + '\\end_inset', '', + after] + document.body[i: i+1] = subst i = i + len(subst) j = find_token(document.header, "\\use_amsmath", 0) if j == -1: document.warning("Malformed LyX document: Missing '\\use_amsmath'.") - return + i += 1 + continue document.header[j] = "\\use_amsmath 2" else: i = i + 1 @@ -1822,7 +1942,7 @@ def revert_nocite_key(body, start, end): def revert_nocite(document): "Revert LatexCommand nocite to ERT" i = 0 - while 1: + while True: i = find_token(document.body, "\\begin_inset CommandInset citation", i) if i == -1: return @@ -1940,7 +2060,7 @@ def revert_serbianlatin(document): def revert_rotfloat(document): " Revert sideways custom floats. " i = 0 - while 1: + while True: # whitespace intended (exclude \\begin_inset FloatList) i = find_token(document.body, "\\begin_inset Float ", i) if i == -1: @@ -1968,7 +2088,8 @@ def revert_rotfloat(document): l = find_default_layout(document, i + 1, j) if l == -1: document.warning("Malformed LyX document: Missing `\\begin_layout' in Float inset.") - return + i = j + continue subst = ['\\begin_layout Standard', '\\begin_inset ERT', 'status collapsed', '', @@ -2002,7 +2123,7 @@ def revert_rotfloat(document): def revert_widesideways(document): " Revert wide sideways floats. " i = 0 - while 1: + while True: # whitespace intended (exclude \\begin_inset FloatList) i = find_token(document.body, '\\begin_inset Float ', i) if i == -1: @@ -2030,7 +2151,8 @@ def revert_widesideways(document): l = find_default_layout(document, i + 1, j) if l == -1: document.warning("Malformed LyX document: Missing `\\begin_layout' in Float inset.") - return + i = j + continue subst = ['\\begin_layout Standard', '\\begin_inset ERT', 'status collapsed', '', '\\begin_layout Standard', '', '', '\\backslash', @@ -2053,7 +2175,7 @@ def revert_widesideways(document): def revert_inset_embedding(document, type): ' Remove embed tag from certain type of insets' i = 0 - while 1: + while True: i = find_token(document.body, "\\begin_inset %s" % type, i) if i == -1: return @@ -2078,7 +2200,8 @@ def revert_external_embedding(document): def convert_subfig(document): " Convert subfigures to subfloats. " i = 0 - while 1: + while True: + addedLines = 0 i = find_token(document.body, '\\begin_inset Graphics', i) if i == -1: return @@ -2093,16 +2216,16 @@ def convert_subfig(document): continue l = find_token(document.body, '\tsubcaptionText', i, endInset) if l == -1: - document.warning("Malformed lyx document: Can't find subcaptionText!") - i = endInset - continue - caption = document.body[l][16:].strip('"') - del document.body[l] + caption = "" + else: + caption = document.body[l][16:].strip('"') + del document.body[l] + addedLines -= 1 del document.body[k] - addedLines = -2 + addedLines -= 1 subst = ['\\begin_inset Float figure', 'wide false', 'sideways false', 'status open', '', '\\begin_layout Plain Layout', '\\begin_inset Caption', - '', '\\begin_layout Plain Layout'] + latex2lyx(caption) + \ + '', '\\begin_layout Plain Layout'] + latex2lyx(caption, False) + \ [ '\\end_layout', '', '\\end_inset', '', '\\end_layout', '', '\\begin_layout Plain Layout'] document.body[i : i] = subst @@ -2117,7 +2240,7 @@ def convert_subfig(document): def revert_subfig(document): " Revert subfloats. " i = 0 - while 1: + while True: # whitespace intended (exclude \\begin_inset FloatList) i = find_tokens(document.body, ['\\begin_inset Float ', '\\begin_inset Wrap'], i) if i == -1: @@ -2136,11 +2259,25 @@ def revert_subfig(document): k = find_token(document.body, '\\begin_inset Float ', i + 1, j) if k == -1: break + # is the subfloat aligned? + al = find_token(document.body, '\\align ', k - 1, j) + alignment_beg = "" + alignment_end = "" + if al != -1: + if get_value(document.body, '\\align', al) == "center": + alignment_beg = "\\backslash\nbegin{centering}" + alignment_end = "\\backslash\npar\\backslash\nend{centering}" + elif get_value(document.body, '\\align', al) == "left": + alignment_beg = "\\backslash\nbegin{raggedright}" + alignment_end = "\\backslash\npar\\backslash\nend{raggedright}" + elif get_value(document.body, '\\align', al) == "right": + alignment_beg = "\\backslash\nbegin{raggedleft}" + alignment_end = "\\backslash\npar\\backslash\nend{raggedleft}" l = find_end_of_inset(document.body, k) if l == -1: document.warning("Malformed lyx document: Missing '\\end_inset' (embedded float).") i += 1 - j == -1 + j = -1 continue # escape to the outer loop m = find_default_layout(document, k + 1, l) # caption? @@ -2174,7 +2311,7 @@ def revert_subfig(document): if opt != -1: optend = find_end_of_inset(document.body, opt) if optend == -1: - document.warning("Malformed lyx document: Missing '\\end_inset' (OptArg).") + document.warning("Malformed LyX document: Missing '\\end_inset' (OptArg).") return optc = find_default_layout(document, opt, optend) if optc == -1: @@ -2192,13 +2329,15 @@ def revert_subfig(document): continue elif line in document.body[opt:optend]: continue - elif not line.startswith('\\'): - caption += line.strip() + else: + inert = True + caption += lyxline2latex(document, line, inert) if len(label) > 0: - caption += "\\backslash\nlabel{" + label + "}" - subst = '\\begin_layout Plain Layout\n\\begin_inset ERT\nstatus collapsed\n\n' \ - '\\begin_layout Plain Layout\n\n}\n\\end_layout\n\n\\end_inset\n\n' \ - '\\end_layout\n\n\\begin_layout Plain Layout\n' + caption += "\n\\backslash\nlabel{" + label + "}" + subst = '\\begin_layout PlainLayout\n\\begin_inset ERT\nstatus collapsed\n\n' \ + '\\begin_layout PlainLayout\n\n}' + alignment_end + \ + '\n\\end_layout\n\n\\end_inset\n\n' \ + '\\end_layout\n\n\\begin_layout PlainLayout\n' subst = subst.split('\n') document.body[l : l+1] = subst addedLines = len(subst) - 1 @@ -2209,7 +2348,7 @@ def revert_subfig(document): del document.body[k+1:m-1] addedLines -= (m - 1 - (k + 1)) insertion = '\\begin_inset ERT\nstatus collapsed\n\n' \ - '\\begin_layout Plain Layout\n\n\\backslash\n' \ + '\\begin_layout PlainLayout\n\n' + alignment_beg + '\n\\backslash\n' \ 'subfloat' if len(shortcap) > 0: insertion = insertion + "[" + shortcap + "]" @@ -2219,6 +2358,10 @@ def revert_subfig(document): insertion = insertion.split('\n') document.body[k : k + 1] = insertion addedLines += len(insertion) - 1 + al = find_token(document.body, '\\align ', k - 1, j + addedLines) + if al != -1: + del document.body[al] + addedLines -= 1 add_to_preamble(document, ['\\usepackage{subfig}\n']) i += addedLines + 1 @@ -2236,11 +2379,12 @@ def revert_wrapplacement(document): document.warning("Malformed LyX document: Couldn't find placement parameter of wrap float.") i += 1 continue - r = re.compile("placement (o|i|l|r)") + r = re.compile("placement (o|i|l|r|O|I|L|R)") m = r.match(document.body[j]) if m == None: document.warning("Malformed LyX document: Placement option isn't O|I|R|L!") - document.body[j] = "placement " + m.group(1).lower() + else: + document.body[j] = "placement " + m.group(1).lower() i = j @@ -2277,6 +2421,7 @@ def revert_spaceinset(document): j = find_end_of_inset(document.body, i) if j == -1: document.warning("Malformed LyX document: Could not find end of space inset.") + i += 1 continue document.body[i] = document.body[i].replace('\\begin_inset Space', '\\InsetSpace') del document.body[j] @@ -2379,6 +2524,7 @@ def revert_protected_hfill(document): j = find_end_of_inset(document.body, i) if j == -1: document.warning("Malformed LyX document: Could not find end of space inset.") + i += 1 continue del document.body[j] subst = document.body[i].replace('\\begin_inset Space \\hspace*{\\fill}', \ @@ -2400,6 +2546,7 @@ def revert_leftarrowfill(document): j = find_end_of_inset(document.body, i) if j == -1: document.warning("Malformed LyX document: Could not find end of space inset.") + i += 1 continue del document.body[j] subst = document.body[i].replace('\\begin_inset Space \\leftarrowfill{}', \ @@ -2421,6 +2568,7 @@ def revert_rightarrowfill(document): j = find_end_of_inset(document.body, i) if j == -1: document.warning("Malformed LyX document: Could not find end of space inset.") + i += 1 continue del document.body[j] subst = document.body[i].replace('\\begin_inset Space \\rightarrowfill{}', \ @@ -2442,6 +2590,7 @@ def revert_upbracefill(document): j = find_end_of_inset(document.body, i) if j == -1: document.warning("Malformed LyX document: Could not find end of space inset.") + i += 1 continue del document.body[j] subst = document.body[i].replace('\\begin_inset Space \\upbracefill{}', \ @@ -2463,6 +2612,7 @@ def revert_downbracefill(document): j = find_end_of_inset(document.body, i) if j == -1: document.warning("Malformed LyX document: Could not find end of space inset.") + i += 1 continue del document.body[j] subst = document.body[i].replace('\\begin_inset Space \\downbracefill{}', \ @@ -2530,6 +2680,7 @@ def revert_pagebreaks(document): j = find_end_of_inset(document.body, i) if j == -1: document.warning("Malformed LyX document: Could not find end of Newpage inset.") + i += 1 continue del document.body[j] document.body[i] = document.body[i].replace('\\begin_inset Newpage newpage', '\\newpage') @@ -2566,6 +2717,7 @@ def revert_linebreaks(document): j = find_end_of_inset(document.body, i) if j == -1: document.warning("Malformed LyX document: Could not find end of Newline inset.") + i += 1 continue del document.body[j] document.body[i] = document.body[i].replace('\\begin_inset Newline newline', '\\newline') @@ -2592,7 +2744,7 @@ def convert_japanese_plain(document): def revert_pdfpages(document): ' Revert pdfpages external inset to ERT ' i = 0 - while 1: + while True: i = find_token(document.body, "\\begin_inset External", i) if i == -1: return @@ -2694,7 +2846,7 @@ def revert_master(document): def revert_graphics_group(document): ' Revert group information from graphics insets ' i = 0 - while 1: + while True: i = find_token(document.body, "\\begin_inset Graphics", i) if i == -1: return @@ -2724,7 +2876,7 @@ def update_apa_styles(document): "Paragraph*": "Paragraph", "Subparagraph*": "Subparagraph"} i = 0 - while 1: + while True: i = find_token(document.body, "\\begin_layout", i) if i == -1: return @@ -2738,7 +2890,7 @@ def update_apa_styles(document): def convert_paper_sizes(document): ' exchange size options legalpaper and executivepaper to correct order ' - # routine is needed to fix http://bugzilla.lyx.org/show_bug.cgi?id=4868 + # routine is needed to fix http://www.lyx.org/trac/ticket/4868 i = 0 j = 0 i = find_token(document.header, "\\papersize executivepaper", 0) @@ -2841,7 +2993,7 @@ def convert_plain_layout(document): def revert_plain_layout(document): - " Convert 'PlainLayout' to 'Plain Layout'" + " Revert 'Plain Layout' to 'PlainLayout'" i = 0 while True: i = find_token(document.body, '\\begin_layout Plain Layout', i) @@ -2853,7 +3005,7 @@ def revert_plain_layout(document): def revert_plainlayout(document): - " Convert 'PlainLayout' to 'Plain Layout'" + " Revert 'PlainLayout' to 'Standard'" i = 0 while True: i = find_token(document.body, '\\begin_layout PlainLayout', i) @@ -2955,6 +3107,69 @@ def revert_mongolian(document): j = j + 1 +def revert_default_options(document): + ' Remove param use_default_options ' + i = find_token(document.header, "\\use_default_options", 0) + if i != -1: + del document.header[i] + + +def convert_default_options(document): + ' Add param use_default_options and set it to false ' + i = find_token(document.header, "\\textclass", 0) + if i == -1: + document.warning("Malformed LyX document: Missing `\\textclass'.") + return + document.header.insert(i, '\\use_default_options false') + + +def revert_backref_options(document): + ' Revert option pdf_backref=page to pagebackref ' + i = find_token(document.header, "\\pdf_backref page", 0) + if i != -1: + document.header[i] = "\\pdf_pagebackref true" + + +def convert_backref_options(document): + ' We have changed the option pagebackref to backref=true ' + i = find_token(document.header, "\\pdf_pagebackref true", 0) + if i != -1: + document.header[i] = "\\pdf_backref page" + j = find_token(document.header, "\\pdf_pagebackref false", 0) + if j != -1: + del document.header[j] + # backref=true was not a valid option, we meant backref=section + k = find_token(document.header, "\\pdf_backref true", 0) + if k != -1 and i != -1: + del document.header[k] + elif k != -1 and j != -1: + document.header[k] = "\\pdf_backref section" + + +def convert_charstyle_element(document): + "Convert CharStyle to Element for docbook backend" + if document.backend != "docbook": + return + i = 0 + while True: + i = find_token(document.body, "\\begin_inset Flex CharStyle:", i) + if i == -1: + return + document.body[i] = document.body[i].replace('\\begin_inset Flex CharStyle:', + '\\begin_inset Flex Element:') + +def revert_charstyle_element(document): + "Convert Element to CharStyle for docbook backend" + if document.backend != "docbook": + return + i = 0 + while True: + i = find_token(document.body, "\\begin_inset Flex Element:", i) + if i == -1: + return + document.body[i] = document.body[i].replace('\\begin_inset Flex Element:', + '\\begin_inset Flex CharStyle:') + ## # Conversion hub # @@ -2981,7 +3196,7 @@ convert = [[277, [fix_wrong_tables]], [295, [convert_htmlurl, convert_url]], [296, [convert_include]], [297, [convert_usorbian]], - [298, []], + [298, [convert_macro_global]], [299, []], [300, []], [301, []], @@ -3025,10 +3240,16 @@ convert = [[277, [fix_wrong_tables]], [339, []], [340, [add_plain_layout]], [341, []], - [342, []] + [342, []], + [343, [convert_default_options]], + [344, [convert_backref_options]], + [345, [convert_charstyle_element]] ] -revert = [[341, [revert_mongolian]], +revert = [[344, [revert_charstyle_element]], + [343, [revert_backref_options]], + [342, [revert_default_options]], + [341, [revert_mongolian]], [340, [revert_tabulators, revert_tabsize]], [339, []], [338, [revert_removed_modules]],