]> git.lyx.org Git - lyx.git/blob - src/mathed/MathParser.cpp
Don't create nested text-in-math environments.
[lyx.git] / src / mathed / MathParser.cpp
1 /**
2  * \file MathParser.cpp
3  * This file is part of LyX, the document processor.
4  * Licence details can be found in the file COPYING.
5  *
6  * \author André Pönitz
7  *
8  * Full author contact details are available in file CREDITS.
9  */
10
11 /*
12
13 If someone desperately needs partial "structures" (such as a few
14 cells of an array inset or similar) (s)he could uses the
15 following hack as starting point to write some macros:
16
17   \newif\ifcomment
18   \commentfalse
19   \ifcomment
20           \def\makeamptab{\catcode`\&=4\relax}
21           \def\makeampletter{\catcode`\&=11\relax}
22     \def\b{\makeampletter\expandafter\makeamptab\bi}
23     \long\def\bi#1\e{}
24   \else
25     \def\b{}\def\e{}
26   \fi
27   ...
28
29   \[\begin{array}{ccc}
30 1
31 &
32
33   \end{array}\]
34
35 */
36
37
38 #include <config.h>
39
40 #include "MathParser.h"
41
42 #include "InsetMathArray.h"
43 #include "InsetMathBig.h"
44 #include "InsetMathBrace.h"
45 #include "InsetMathChar.h"
46 #include "InsetMathColor.h"
47 #include "InsetMathComment.h"
48 #include "InsetMathDelim.h"
49 #include "InsetMathEnv.h"
50 #include "InsetMathFrac.h"
51 #include "InsetMathKern.h"
52 #include "MathMacro.h"
53 #include "InsetMathPar.h"
54 #include "InsetMathRef.h"
55 #include "InsetMathRoot.h"
56 #include "InsetMathScript.h"
57 #include "InsetMathSpace.h"
58 #include "InsetMathSplit.h"
59 #include "InsetMathSqrt.h"
60 #include "InsetMathTabular.h"
61 #include "MathMacroTemplate.h"
62 #include "MathFactory.h"
63 #include "MathMacroArgument.h"
64 #include "MathSupport.h"
65
66 #include "Encoding.h"
67 #include "Lexer.h"
68
69 #include "support/debug.h"
70 #include "support/convert.h"
71 #include "support/docstream.h"
72 #include "support/lstrings.h"
73
74 #include <sstream>
75
76 //#define FILEDEBUG
77
78 using namespace std;
79
80 namespace lyx {
81
82 using support::subst;
83
84 namespace {
85
86 InsetMath::mode_type asMode(InsetMath::mode_type oldmode, docstring const & str)
87 {
88         //lyxerr << "handling mode: '" << str << "'" << endl;
89         if (str == "mathmode")
90                 return InsetMath::MATH_MODE;
91         if (str == "textmode" || str == "forcetext")
92                 return InsetMath::TEXT_MODE;
93         return oldmode;
94 }
95
96
97 bool stared(docstring const & s)
98 {
99         size_t const n = s.size();
100         return n && s[n - 1] == '*';
101 }
102
103
104 docstring escapeSpecialChars(docstring const & str, bool textmode)
105 {
106         docstring const backslash = textmode ? from_ascii("\\textbackslash ")
107                                              : from_ascii("\\backslash ");
108         docstring const caret = textmode ? from_ascii("\\textasciicircum ")
109                                          : from_ascii("\\mathcircumflex ");
110
111         return subst(subst(subst(subst(subst(subst(subst(subst(subst(str,
112                         from_ascii("\\"), backslash),
113                         from_ascii("^"), caret),
114                         from_ascii("_"), from_ascii("\\_")),
115                         from_ascii("$"), from_ascii("\\$")),
116                         from_ascii("#"), from_ascii("\\#")),
117                         from_ascii("&"), from_ascii("\\&")),
118                         from_ascii("%"), from_ascii("\\%")),
119                         from_ascii("{"), from_ascii("\\{")),
120                         from_ascii("}"), from_ascii("\\}"));
121 }
122
123
124 /*!
125  * Add the row \p cellrow to \p grid.
126  * \returns wether the row could be added. Adding a row can fail for
127  * environments like "equation" that have a fixed number of rows.
128  */
129 bool addRow(InsetMathGrid & grid, InsetMathGrid::row_type & cellrow,
130             docstring const & vskip, bool allow_newpage_ = true)
131 {
132         ++cellrow;
133         if (cellrow == grid.nrows()) {
134                 //lyxerr << "adding row " << cellrow << endl;
135                 grid.addRow(cellrow - 1);
136                 if (cellrow == grid.nrows()) {
137                         // We can't add a row to this grid, so let's
138                         // append the content of this cell to the previous
139                         // one.
140                         // This does not happen in well formed .lyx files,
141                         // but LyX versions 1.3.x and older could create
142                         // such files and tex2lyx can still do that.
143                         --cellrow;
144                         lyxerr << "ignoring extra row";
145                         if (!vskip.empty())
146                                 lyxerr << " with extra space " << to_utf8(vskip);
147                         if (!allow_newpage_)
148                                 lyxerr << " with no page break allowed";
149                         lyxerr << '.' << endl;
150                         return false;
151                 }
152         }
153         grid.vcrskip(Length(to_utf8(vskip)), cellrow - 1);
154         grid.rowinfo(cellrow - 1).allow_newpage_ = allow_newpage_;
155         return true;
156 }
157
158
159 /*!
160  * Add the column \p cellcol to \p grid.
161  * \returns wether the column could be added. Adding a column can fail for
162  * environments like "eqnarray" that have a fixed number of columns.
163  */
164 bool addCol(InsetMathGrid & grid, InsetMathGrid::col_type & cellcol)
165 {
166         ++cellcol;
167         if (cellcol == grid.ncols()) {
168                 //lyxerr << "adding column " << cellcol << endl;
169                 grid.addCol(cellcol);
170                 if (cellcol == grid.ncols()) {
171                         // We can't add a column to this grid, so let's
172                         // append the content of this cell to the previous
173                         // one.
174                         // This does not happen in well formed .lyx files,
175                         // but LyX versions 1.3.x and older could create
176                         // such files and tex2lyx can still do that.
177                         --cellcol;
178                         lyxerr << "ignoring extra column." << endl;
179                         return false;
180                 }
181         }
182         return true;
183 }
184
185
186 /*!
187  * Check wether the last row is empty and remove it if yes.
188  * Otherwise the following code
189  * \verbatim
190 \begin{array}{|c|c|}
191 \hline
192 1 & 2 \\ \hline
193 3 & 4 \\ \hline
194 \end{array}
195  * \endverbatim
196  * will result in a grid with 3 rows (+ the dummy row that is always present),
197  * because the last '\\' opens a new row.
198  */
199 void delEmptyLastRow(InsetMathGrid & grid)
200 {
201         InsetMathGrid::row_type const row = grid.nrows() - 1;
202         for (InsetMathGrid::col_type col = 0; col < grid.ncols(); ++col) {
203                 if (!grid.cell(grid.index(row, col)).empty())
204                         return;
205         }
206         // Copy the row information of the empty row (which would contain the
207         // last hline in the example above) to the dummy row and delete the
208         // empty row.
209         grid.rowinfo(row + 1) = grid.rowinfo(row);
210         grid.delRow(row);
211 }
212
213
214 // These are TeX's catcodes
215 enum CatCode {
216         catEscape,     // 0    backslash
217         catBegin,      // 1    {
218         catEnd,        // 2    }
219         catMath,       // 3    $
220         catAlign,      // 4    &
221         catNewline,    // 5    ^^M
222         catParameter,  // 6    #
223         catSuper,      // 7    ^
224         catSub,        // 8    _
225         catIgnore,     // 9
226         catSpace,      // 10   space
227         catLetter,     // 11   a-zA-Z
228         catOther,      // 12   none of the above
229         catActive,     // 13   ~
230         catComment,    // 14   %
231         catInvalid     // 15   <delete>
232 };
233
234 CatCode theCatcode[128];
235
236
237 inline CatCode catcode(char_type c)
238 {
239         /* The only characters that are not catOther lie in the pure ASCII
240          * range. Therefore theCatcode has only 128 entries.
241          * TeX itself deals with 8bit characters, so if needed this table
242          * could be enlarged to 256 entries.
243          * Any larger value does not make sense, since the fact that we use
244          * unicode internally does not change Knuth's TeX engine.
245          * Apart from that a table for the full 21bit UCS4 range would waste
246          * too much memory. */
247         if (c >= 128)
248                 return catOther;
249
250         return theCatcode[c];
251 }
252
253
254 enum {
255         FLAG_ALIGN      = 1 << 0,  //  next & or \\ ends the parsing process
256         FLAG_BRACE_LAST = 1 << 1,  //  next closing brace ends the parsing
257         FLAG_RIGHT      = 1 << 2,  //  next \\right ends the parsing process
258         FLAG_END        = 1 << 3,  //  next \\end ends the parsing process
259         FLAG_BRACK_LAST = 1 << 4,  //  next closing bracket ends the parsing
260         FLAG_TEXTMODE   = 1 << 5,  //  we are in a box
261         FLAG_ITEM       = 1 << 6,  //  read a (possibly braced) token
262         FLAG_LEAVE      = 1 << 7,  //  leave the loop at the end
263         FLAG_SIMPLE     = 1 << 8,  //  next $ leaves the loop
264         FLAG_EQUATION   = 1 << 9,  //  next \] leaves the loop
265         FLAG_SIMPLE2    = 1 << 10, //  next \) leaves the loop
266         FLAG_OPTION     = 1 << 11, //  read [...] style option
267         FLAG_BRACED     = 1 << 12  //  read {...} style argument
268 };
269
270
271 //
272 // Helper class for parsing
273 //
274
275 class Token {
276 public:
277         ///
278         Token() : cs_(), char_(0), cat_(catIgnore) {}
279         ///
280         Token(char_type c, CatCode cat) : cs_(), char_(c), cat_(cat) {}
281         ///
282         explicit Token(docstring const & cs) : cs_(cs), char_(0), cat_(catIgnore) {}
283
284         ///
285         docstring const & cs() const { return cs_; }
286         ///
287         CatCode cat() const { return cat_; }
288         ///
289         char_type character() const { return char_; }
290         ///
291         docstring asString() const { return cs_.size() ? cs_ : docstring(1, char_); }
292         ///
293         docstring asInput() const { return cs_.size() ? '\\' + cs_ : docstring(1, char_); }
294
295 private:
296         ///
297         docstring cs_;
298         ///
299         char_type char_;
300         ///
301         CatCode cat_;
302 };
303
304
305 ostream & operator<<(ostream & os, Token const & t)
306 {
307         if (t.cs().size()) {
308                 docstring const & cs = t.cs();
309                 // FIXME: For some strange reason, the stream operator instanciate
310                 // a new Token before outputting the contents of t.cs().
311                 // Because of this the line
312                 //     os << '\\' << cs;
313                 // below becomes recursive.
314                 // In order to avoid that we return early:
315                 if (cs == "\\")
316                         return os;
317                 os << '\\' << to_utf8(cs);
318         }
319         else if (t.cat() == catLetter)
320                 os << t.character();
321         else
322                 os << '[' << t.character() << ',' << t.cat() << ']';
323         return os;
324 }
325
326
327 class Parser {
328 public:
329         ///
330         typedef  InsetMath::mode_type mode_type;
331         ///
332         typedef  Parse::flags parse_mode;
333
334         ///
335         Parser(Lexer & lex, parse_mode mode);
336         /// Only use this for reading from .lyx file format, for the reason
337         /// see Parser::tokenize(istream &).
338         Parser(istream & is, parse_mode mode);
339         ///
340         Parser(docstring const & str, parse_mode mode);
341
342         ///
343         bool parse(MathAtom & at);
344         ///
345         bool parse(MathData & array, unsigned flags, mode_type mode);
346         ///
347         bool parse1(InsetMathGrid & grid, unsigned flags, mode_type mode,
348                 bool numbered);
349         ///
350         MathData parse(unsigned flags, mode_type mode);
351         ///
352         int lineno() const { return lineno_; }
353         ///
354         void putback();
355
356 private:
357         ///
358         void parse2(MathAtom & at, unsigned flags, mode_type mode, bool numbered);
359         /// get arg delimited by 'left' and 'right'
360         docstring getArg(char_type left, char_type right);
361         ///
362         char_type getChar();
363         ///
364         void error(string const & msg);
365         void error(docstring const & msg) { error(to_utf8(msg)); }
366         /// dump contents to screen
367         void dump() const;
368         /// Only use this for reading from .lyx file format (see
369         /// implementation for reason)
370         void tokenize(istream & is);
371         ///
372         void tokenize(docstring const & s);
373         ///
374         void skipSpaceTokens(idocstream & is, char_type c);
375         ///
376         void push_back(Token const & t);
377         ///
378         void pop_back();
379         ///
380         Token const & prevToken() const;
381         ///
382         Token const & nextToken() const;
383         ///
384         Token const & getToken();
385         /// skips spaces if any
386         void skipSpaces();
387         ///
388         void lex(docstring const & s);
389         ///
390         bool good() const;
391         ///
392         docstring parse_verbatim_item();
393         ///
394         docstring parse_verbatim_option();
395
396         ///
397         int lineno_;
398         ///
399         vector<Token> tokens_;
400         ///
401         unsigned pos_;
402         /// Stack of active environments
403         vector<docstring> environments_;
404         ///
405         parse_mode mode_;
406         ///
407         bool success_;
408 };
409
410
411 Parser::Parser(Lexer & lexer, parse_mode mode)
412         : lineno_(lexer.lineNumber()), pos_(0), mode_(mode), success_(true)
413 {
414         tokenize(lexer.getStream());
415         lexer.eatLine();
416 }
417
418
419 Parser::Parser(istream & is, parse_mode mode)
420         : lineno_(0), pos_(0), mode_(mode), success_(true)
421 {
422         tokenize(is);
423 }
424
425
426 Parser::Parser(docstring const & str, parse_mode mode)
427         : lineno_(0), pos_(0), mode_(mode), success_(true)
428 {
429         tokenize(str);
430 }
431
432
433 void Parser::push_back(Token const & t)
434 {
435         tokens_.push_back(t);
436 }
437
438
439 void Parser::pop_back()
440 {
441         tokens_.pop_back();
442 }
443
444
445 Token const & Parser::prevToken() const
446 {
447         static const Token dummy;
448         return pos_ > 0 ? tokens_[pos_ - 1] : dummy;
449 }
450
451
452 Token const & Parser::nextToken() const
453 {
454         static const Token dummy;
455         return good() ? tokens_[pos_] : dummy;
456 }
457
458
459 Token const & Parser::getToken()
460 {
461         static const Token dummy;
462         //lyxerr << "looking at token " << tokens_[pos_] << " pos: " << pos_ << endl;
463         return good() ? tokens_[pos_++] : dummy;
464 }
465
466
467 void Parser::skipSpaces()
468 {
469         while (nextToken().cat() == catSpace || nextToken().cat() == catNewline)
470                 getToken();
471 }
472
473
474 void Parser::putback()
475 {
476         --pos_;
477 }
478
479
480 bool Parser::good() const
481 {
482         return pos_ < tokens_.size();
483 }
484
485
486 char_type Parser::getChar()
487 {
488         if (!good()) {
489                 error("The input stream is not well...");
490                 putback();
491                 return 0;
492         }
493         return tokens_[pos_++].character();
494 }
495
496
497 docstring Parser::getArg(char_type left, char_type right)
498 {
499         skipSpaces();
500
501         docstring result;
502         char_type c = getChar();
503
504         if (c != left)
505                 putback();
506         else
507                 while ((c = getChar()) != right && good())
508                         result += c;
509
510         return result;
511 }
512
513
514 void Parser::skipSpaceTokens(idocstream & is, char_type c)
515 {
516         // skip trailing spaces
517         while (catcode(c) == catSpace || catcode(c) == catNewline)
518                 if (!is.get(c))
519                         break;
520         //lyxerr << "putting back: " << c << endl;
521         is.putback(c);
522 }
523
524
525 void Parser::tokenize(istream & is)
526 {
527         // eat everything up to the next \end_inset or end of stream
528         // and store it in s for further tokenization
529         string s;
530         char c;
531         while (is.get(c)) {
532                 s += c;
533                 if (s.size() >= 10 && s.substr(s.size() - 10) == "\\end_inset") {
534                         s = s.substr(0, s.size() - 10);
535                         break;
536                 }
537         }
538         // Remove the space after \end_inset
539         if (is.get(c) && c != ' ')
540                 is.unget();
541
542         // tokenize buffer
543         tokenize(from_utf8(s));
544 }
545
546
547 void Parser::tokenize(docstring const & buffer)
548 {
549         idocstringstream is(mode_ & Parse::VERBATIM
550                         ? escapeSpecialChars(buffer, mode_ & Parse::TEXTMODE)
551                         : buffer, ios::in | ios::binary);
552
553         char_type c;
554         while (is.get(c)) {
555                 //lyxerr << "reading c: " << c << endl;
556
557                 switch (catcode(c)) {
558                         case catNewline: {
559                                 ++lineno_;
560                                 is.get(c);
561                                 if (catcode(c) == catNewline)
562                                         ; //push_back(Token("par"));
563                                 else {
564                                         push_back(Token('\n', catNewline));
565                                         is.putback(c);
566                                 }
567                                 break;
568                         }
569
570 /*
571                         case catComment: {
572                                 while (is.get(c) && catcode(c) != catNewline)
573                                         ;
574                                 ++lineno_;
575                                 break;
576                         }
577 */
578
579                         case catEscape: {
580                                 is.get(c);
581                                 if (!is) {
582                                         error("unexpected end of input");
583                                 } else {
584                                         docstring s(1, c);
585                                         if (catcode(c) == catLetter) {
586                                                 // collect letters
587                                                 while (is.get(c) && catcode(c) == catLetter)
588                                                         s += c;
589                                                 skipSpaceTokens(is, c);
590                                         }
591                                         push_back(Token(s));
592                                 }
593                                 break;
594                         }
595
596                         case catSuper:
597                         case catSub: {
598                                 push_back(Token(c, catcode(c)));
599                                 is.get(c);
600                                 skipSpaceTokens(is, c);
601                                 break;
602                         }
603
604                         case catIgnore: {
605                                 if (!(mode_ & Parse::QUIET))
606                                         lyxerr << "ignoring a char: " << int(c) << endl;
607                                 break;
608                         }
609
610                         default:
611                                 push_back(Token(c, catcode(c)));
612                 }
613         }
614
615 #ifdef FILEDEBUG
616         dump();
617 #endif
618 }
619
620
621 void Parser::dump() const
622 {
623         lyxerr << "\nTokens: ";
624         for (unsigned i = 0; i < tokens_.size(); ++i) {
625                 if (i == pos_)
626                         lyxerr << " <#> ";
627                 lyxerr << tokens_[i];
628         }
629         lyxerr << " pos: " << pos_ << endl;
630 }
631
632
633 void Parser::error(string const & msg)
634 {
635         success_ = false;
636         if (!(mode_ & Parse::QUIET)) {
637                 lyxerr << "Line ~" << lineno_ << ": Math parse error: "
638                        << msg << endl;
639                 dump();
640         }
641 }
642
643
644 bool Parser::parse(MathAtom & at)
645 {
646         skipSpaces();
647         MathData ar;
648         parse(ar, false, InsetMath::UNDECIDED_MODE);
649         if (ar.size() != 1 || ar.front()->getType() == hullNone) {
650                 if (!(mode_ & Parse::QUIET))
651                         lyxerr << "unusual contents found: " << ar << endl;
652                 at = MathAtom(new InsetMathPar(ar));
653                 //if (at->nargs() > 0)
654                 //      at.nucleus()->cell(0) = ar;
655                 //else
656                 //      lyxerr << "unusual contents found: " << ar << endl;
657                 success_ = false;
658         } else
659                 at = ar[0];
660         return success_;
661 }
662
663
664 docstring Parser::parse_verbatim_option()
665 {
666         skipSpaces();
667         docstring res;
668         if (nextToken().character() == '[') {
669                 Token t = getToken();
670                 for (Token t = getToken(); t.character() != ']' && good(); t = getToken()) {
671                         if (t.cat() == catBegin) {
672                                 putback();
673                                 res += '{' + parse_verbatim_item() + '}';
674                         } else
675                                 res += t.asInput();
676                 }
677         }
678         return res;
679 }
680
681
682 docstring Parser::parse_verbatim_item()
683 {
684         skipSpaces();
685         docstring res;
686         if (nextToken().cat() == catBegin) {
687                 Token t = getToken();
688                 for (Token t = getToken(); t.cat() != catEnd && good(); t = getToken()) {
689                         if (t.cat() == catBegin) {
690                                 putback();
691                                 res += '{' + parse_verbatim_item() + '}';
692                         }
693                         else
694                                 res += t.asInput();
695                 }
696         }
697         return res;
698 }
699
700
701 MathData Parser::parse(unsigned flags, mode_type mode)
702 {
703         MathData ar;
704         parse(ar, flags, mode);
705         return ar;
706 }
707
708
709 bool Parser::parse(MathData & array, unsigned flags, mode_type mode)
710 {
711         InsetMathGrid grid(1, 1);
712         parse1(grid, flags, mode, false);
713         array = grid.cell(0);
714         return success_;
715 }
716
717
718 void Parser::parse2(MathAtom & at, const unsigned flags, const mode_type mode,
719         const bool numbered)
720 {
721         parse1(*(at.nucleus()->asGridInset()), flags, mode, numbered);
722 }
723
724
725 bool Parser::parse1(InsetMathGrid & grid, unsigned flags,
726         const mode_type mode, const bool numbered)
727 {
728         int limits = 0;
729         InsetMathGrid::row_type cellrow = 0;
730         InsetMathGrid::col_type cellcol = 0;
731         MathData * cell = &grid.cell(grid.index(cellrow, cellcol));
732
733         if (grid.asHullInset())
734                 grid.asHullInset()->numbered(cellrow, numbered);
735
736         //dump();
737         //lyxerr << " flags: " << flags << endl;
738         //lyxerr << " mode: " << mode  << endl;
739         //lyxerr << "grid: " << grid << endl;
740
741         while (good()) {
742                 Token const & t = getToken();
743
744 #ifdef FILEDEBUG
745                 lyxerr << "t: " << t << " flags: " << flags << endl;
746                 lyxerr << "mode: " << mode  << endl;
747                 cell->dump();
748                 lyxerr << endl;
749 #endif
750
751                 if (flags & FLAG_ITEM) {
752
753                         if (t.cat() == catBegin) {
754                                 // skip the brace and collect everything to the next matching
755                                 // closing brace
756                                 parse1(grid, FLAG_BRACE_LAST, mode, numbered);
757                                 return success_;
758                         }
759
760                         // handle only this single token, leave the loop if done
761                         flags = FLAG_LEAVE;
762                 }
763
764
765                 if (flags & FLAG_BRACED) {
766                         if (t.cat() == catSpace)
767                                 continue;
768
769                         if (t.cat() != catBegin) {
770                                 error("opening brace expected");
771                                 return success_;
772                         }
773
774                         // skip the brace and collect everything to the next matching
775                         // closing brace
776                         flags = FLAG_BRACE_LAST;
777                 }
778
779
780                 if (flags & FLAG_OPTION) {
781                         if (t.cat() == catOther && t.character() == '[') {
782                                 MathData ar;
783                                 parse(ar, FLAG_BRACK_LAST, mode);
784                                 cell->append(ar);
785                         } else {
786                                 // no option found, put back token and we are done
787                                 putback();
788                         }
789                         return success_;
790                 }
791
792                 //
793                 // cat codes
794                 //
795                 if (t.cat() == catMath) {
796                         if (mode != InsetMath::MATH_MODE) {
797                                 // we are inside some text mode thingy, so opening new math is allowed
798                                 Token const & n = getToken();
799                                 if (n.cat() == catMath) {
800                                         // TeX's $$...$$ syntax for displayed math
801                                         cell->push_back(MathAtom(new InsetMathHull(hullEquation)));
802                                         parse2(cell->back(), FLAG_SIMPLE, InsetMath::MATH_MODE, false);
803                                         getToken(); // skip the second '$' token
804                                 } else {
805                                         // simple $...$  stuff
806                                         putback();
807                                         cell->push_back(MathAtom(new InsetMathHull(hullSimple)));
808                                         parse2(cell->back(), FLAG_SIMPLE, InsetMath::MATH_MODE, false);
809                                 }
810                         }
811
812                         else if (flags & FLAG_SIMPLE) {
813                                 // this is the end of the formula
814                                 return success_;
815                         }
816
817                         else {
818                                 error("something strange in the parser");
819                                 break;
820                         }
821                 }
822
823                 else if (t.cat() == catLetter)
824                         cell->push_back(MathAtom(new InsetMathChar(t.character())));
825
826                 else if (t.cat() == catSpace && mode != InsetMath::MATH_MODE) {
827                         if (cell->empty() || cell->back()->getChar() != ' ')
828                                 cell->push_back(MathAtom(new InsetMathChar(t.character())));
829                 }
830
831                 else if (t.cat() == catNewline && mode != InsetMath::MATH_MODE) {
832                         if (cell->empty() || cell->back()->getChar() != ' ')
833                                 cell->push_back(MathAtom(new InsetMathChar(' ')));
834                 }
835
836                 else if (t.cat() == catParameter) {
837                         Token const & n = getToken();
838                         cell->push_back(MathAtom(new MathMacroArgument(n.character()-'0')));
839                 }
840
841                 else if (t.cat() == catActive)
842                         cell->push_back(MathAtom(new InsetMathChar(t.character())));
843
844                 else if (t.cat() == catBegin) {
845                         MathData ar;
846                         parse(ar, FLAG_BRACE_LAST, mode);
847                         // do not create a BraceInset if they were written by LyX
848                         // this helps to keep the annoyance of  "a choose b"  to a minimum
849                         if (ar.size() == 1 && ar[0]->extraBraces())
850                                 cell->append(ar);
851                         else
852                                 cell->push_back(MathAtom(new InsetMathBrace(ar)));
853                 }
854
855                 else if (t.cat() == catEnd) {
856                         if (flags & FLAG_BRACE_LAST)
857                                 return success_;
858                         error("found '}' unexpectedly");
859                         //LASSERT(false, /**/);
860                         //add(cell, '}', LM_TC_TEX);
861                 }
862
863                 else if (t.cat() == catAlign) {
864                         //lyxerr << " column now " << (cellcol + 1)
865                         //       << " max: " << grid.ncols() << endl;
866                         if (flags & FLAG_ALIGN)
867                                 return success_;
868                         if (addCol(grid, cellcol))
869                                 cell = &grid.cell(grid.index(cellrow, cellcol));
870                 }
871
872                 else if (t.cat() == catSuper || t.cat() == catSub) {
873                         bool up = (t.cat() == catSuper);
874                         // we need no new script inset if the last thing was a scriptinset,
875                         // which has that script already not the same script already
876                         if (!cell->size())
877                                 cell->push_back(MathAtom(new InsetMathScript(up)));
878                         else if (cell->back()->asScriptInset() &&
879                                         !cell->back()->asScriptInset()->has(up))
880                                 cell->back().nucleus()->asScriptInset()->ensure(up);
881                         else if (cell->back()->asScriptInset())
882                                 cell->push_back(MathAtom(new InsetMathScript(up)));
883                         else
884                                 cell->back() = MathAtom(new InsetMathScript(cell->back(), up));
885                         InsetMathScript * p = cell->back().nucleus()->asScriptInset();
886                         // special handling of {}-bases
887                         // Here we could remove the brace inset for things
888                         // like {a'}^2 and add the braces back in
889                         // InsetMathScript::write().
890                         // We do not do it, since it is not possible to detect
891                         // reliably whether the braces are needed because the
892                         // nucleus contains more than one symbol, or whether
893                         // they are needed for unknown commands like \xx{a}_0
894                         // or \yy{a}{b}_0. This was done in revision 14819
895                         // in an unreliable way. See this thread
896                         // http://www.mail-archive.com/lyx-devel%40lists.lyx.org/msg104917.html
897                         // for more details.
898                         parse(p->cell(p->idxOfScript(up)), FLAG_ITEM, mode);
899                         if (limits) {
900                                 p->limits(limits);
901                                 limits = 0;
902                         }
903                 }
904
905                 else if (t.character() == ']' && (flags & FLAG_BRACK_LAST)) {
906                         //lyxerr << "finished reading option" << endl;
907                         return success_;
908                 }
909
910                 else if (t.cat() == catOther) {
911                         char_type c = t.character();
912                         if (c < 0x80 || mode_ & Parse::VERBATIM
913                             || !(mode_ & Parse::USETEXT)
914                             || mode == InsetMath::TEXT_MODE) {
915                                 cell->push_back(MathAtom(new InsetMathChar(c)));
916                         } else {
917                                 MathAtom at = createInsetMath("text");
918                                 at.nucleus()->cell(0).push_back(MathAtom(new InsetMathChar(c)));
919                                 while (nextToken().cat() == catOther
920                                        && nextToken().character() >= 0x80) {
921                                         c = getToken().character();
922                                         at.nucleus()->cell(0).push_back(MathAtom(new InsetMathChar(c)));
923                                 }
924                                 cell->push_back(at);
925                         }
926                 }
927
928                 else if (t.cat() == catComment) {
929                         docstring s;
930                         while (good()) {
931                                 Token const & t = getToken();
932                                 if (t.cat() == catNewline)
933                                         break;
934                                 s += t.asString();
935                         }
936                         cell->push_back(MathAtom(new InsetMathComment(s)));
937                         skipSpaces();
938                 }
939
940                 //
941                 // control sequences
942                 //
943
944                 else if (t.cs() == "lyxlock") {
945                         if (cell->size())
946                                 cell->back().nucleus()->lock(true);
947                 }
948
949                 else if ((t.cs() == "global" && nextToken().cs() == "def") ||
950                          t.cs() == "def") {
951                         if (t.cs() == "global")
952                                 getToken();
953                         
954                         // get name
955                         docstring name = getToken().cs();
956                         
957                         // read parameters
958                         int nargs = 0;
959                         docstring pars;
960                         while (good() && nextToken().cat() != catBegin) {
961                                 pars += getToken().cs();
962                                 ++nargs;
963                         }
964                         nargs /= 2;
965                         
966                         // read definition
967                         MathData def;
968                         parse(def, FLAG_ITEM, InsetMath::UNDECIDED_MODE);
969                         
970                         // is a version for display attached?
971                         skipSpaces();
972                         MathData display;
973                         if (nextToken().cat() == catBegin)
974                                 parse(display, FLAG_ITEM, InsetMath::MATH_MODE);
975                         
976                         cell->push_back(MathAtom(new MathMacroTemplate(name, nargs,
977                                0, MacroTypeDef, vector<MathData>(), def, display)));
978                 }
979                 
980                 else if (t.cs() == "newcommand" ||
981                          t.cs() == "renewcommand" ||
982                          t.cs() == "newlyxcommand") {
983                         // get name
984                         if (getToken().cat() != catBegin) {
985                                 error("'{' in \\newcommand expected (1) ");
986                                 return success_;
987                         }
988                         docstring name = getToken().cs();
989                         if (getToken().cat() != catEnd) {
990                                 error("'}' in \\newcommand expected");
991                                 return success_;
992                         }
993                                 
994                         // get arity
995                         docstring const arg = getArg('[', ']');
996                         int nargs = 0;
997                         if (!arg.empty())
998                                 nargs = convert<int>(arg);
999                                 
1000                         // optional argument given?
1001                         skipSpaces();
1002                         int optionals = 0;
1003                         vector<MathData> optionalValues;
1004                         while (nextToken().character() == '[') {
1005                                 getToken();
1006                                 optionalValues.push_back(MathData());
1007                                 parse(optionalValues[optionals], FLAG_BRACK_LAST, mode);
1008                                 ++optionals;
1009                         }
1010                         
1011                         MathData def;
1012                         parse(def, FLAG_ITEM, InsetMath::UNDECIDED_MODE);
1013                         
1014                         // is a version for display attached?
1015                         skipSpaces();
1016                         MathData display;
1017                         if (nextToken().cat() == catBegin)
1018                                 parse(display, FLAG_ITEM, InsetMath::MATH_MODE);
1019                         
1020                         cell->push_back(MathAtom(new MathMacroTemplate(name, nargs,
1021                                 optionals, MacroTypeNewcommand, optionalValues, def, display)));
1022                         
1023                 }
1024                 
1025                 else if (t.cs() == "newcommandx" ||
1026                          t.cs() == "renewcommandx") {
1027                         // \newcommandx{\foo}[2][usedefault, addprefix=\global,1=default]{#1,#2}
1028                         // get name
1029                         docstring name;
1030                         if (nextToken().cat() == catBegin) {
1031                                 getToken();
1032                                 name = getToken().cs();
1033                                 if (getToken().cat() != catEnd) {
1034                                         error("'}' in \\newcommandx expected");
1035                                         return success_;
1036                                 }
1037                         } else
1038                                 name = getToken().cs();
1039                                 
1040                         // get arity
1041                         docstring const arg = getArg('[', ']');
1042                         if (arg.empty()) {
1043                                 error("[num] in \\newcommandx expected");
1044                                 return success_;
1045                         }
1046                         int nargs = convert<int>(arg);
1047                         
1048                         // get options
1049                         int optionals = 0;
1050                         vector<MathData> optionalValues;
1051                         if (nextToken().character() == '[') {
1052                                 // skip '['
1053                                 getToken();
1054                                         
1055                                 // handle 'opt=value' options, separated by ','.
1056                                 skipSpaces();
1057                                 while (nextToken().character() != ']' && good()) {
1058                                         if (nextToken().character() >= '1'
1059                                             && nextToken().character() <= '9') {
1060                                                 // optional value -> get parameter number
1061                                                 int n = getChar() - '0';
1062                                                 if (n > nargs) {
1063                                                         error("Arity of \\newcommandx too low "
1064                                                               "for given optional parameter.");
1065                                                         return success_;
1066                                                 }
1067                                                 
1068                                                 // skip '='
1069                                                 if (getToken().character() != '=') {
1070                                                         error("'=' and optional parameter value "
1071                                                               "expected for \\newcommandx");
1072                                                         return success_;
1073                                                 }
1074                                                 
1075                                                 // get value
1076                                                 int optNum = max(size_t(n), optionalValues.size());
1077                                                 optionalValues.resize(optNum);
1078                                                 optionalValues[n - 1].clear();
1079                                                 while (nextToken().character() != ']'
1080                                                        && nextToken().character() != ',') {
1081                                                         MathData data;
1082                                                         parse(data, FLAG_ITEM, InsetMath::UNDECIDED_MODE);
1083                                                         optionalValues[n - 1].append(data);
1084                                                 }
1085                                                 optionals = max(n, optionals);
1086                                         } else if (nextToken().cat() == catLetter) {
1087                                                 // we in fact ignore every non-optional
1088                                                 // parameter
1089                                                 
1090                                                 // get option name
1091                                                 docstring opt;
1092                                                 while (nextToken().cat() == catLetter)
1093                                                         opt += getChar();
1094                                         
1095                                                 // value?
1096                                                 skipSpaces();
1097                                                 MathData value;
1098                                                 if (nextToken().character() == '=') {
1099                                                         getToken();
1100                                                         while (nextToken().character() != ']'
1101                                                                 && nextToken().character() != ',')
1102                                                                 parse(value, FLAG_ITEM, 
1103                                                                       InsetMath::UNDECIDED_MODE);
1104                                                 }
1105                                         } else {
1106                                                 error("option for \\newcommandx expected");
1107                                                 return success_;
1108                                         }
1109                                         
1110                                         // skip komma
1111                                         skipSpaces();
1112                                         if (nextToken().character() == ',') {
1113                                                 getChar();
1114                                                 skipSpaces();
1115                                         } else if (nextToken().character() != ']') {
1116                                                 error("Expecting ',' or ']' in options "
1117                                                       "of \\newcommandx");
1118                                                 return success_;
1119                                         }
1120                                 }
1121                                 
1122                                 // skip ']'
1123                                 if (!good())
1124                                         return success_;
1125                                 getToken();
1126                         }
1127
1128                         // get definition
1129                         MathData def;
1130                         parse(def, FLAG_ITEM, InsetMath::UNDECIDED_MODE);
1131
1132                         // is a version for display attached?
1133                         skipSpaces();
1134                         MathData display;
1135                         if (nextToken().cat() == catBegin)
1136                                 parse(display, FLAG_ITEM, InsetMath::MATH_MODE);
1137
1138                         cell->push_back(MathAtom(new MathMacroTemplate(name, nargs,
1139                                 optionals, MacroTypeNewcommandx, optionalValues, def, 
1140                                 display)));
1141                 }
1142
1143                 else if (t.cs() == "(") {
1144                         if (mode == InsetMath::MATH_MODE) {
1145                                 error("bad math environment");
1146                                 break;
1147                         }
1148                         cell->push_back(MathAtom(new InsetMathHull(hullSimple)));
1149                         parse2(cell->back(), FLAG_SIMPLE2, InsetMath::MATH_MODE, false);
1150                 }
1151
1152                 else if (t.cs() == "[") {
1153                         if (mode != InsetMath::UNDECIDED_MODE) {
1154                                 error("bad math environment");
1155                                 break;
1156                         }
1157                         cell->push_back(MathAtom(new InsetMathHull(hullEquation)));
1158                         parse2(cell->back(), FLAG_EQUATION, InsetMath::MATH_MODE, false);
1159                 }
1160
1161                 else if (t.cs() == "protect")
1162                         // ignore \\protect, will hopefully be re-added during output
1163                         ;
1164
1165                 else if (t.cs() == "end") {
1166                         if (flags & FLAG_END) {
1167                                 // eat environment name
1168                                 docstring const name = getArg('{', '}');
1169                                 if (environments_.empty())
1170                                         error("'found \\end{" + name +
1171                                               "}' without matching '\\begin{" +
1172                                               name + "}'");
1173                                 else if (name != environments_.back())
1174                                         error("'\\end{" + name +
1175                                               "}' does not match '\\begin{" +
1176                                               environments_.back() + "}'");
1177                                 else {
1178                                         environments_.pop_back();
1179                                         // Delete empty last row in matrix
1180                                         // like insets.
1181                                         // If you abuse InsetMathGrid for
1182                                         // non-matrix like structures you
1183                                         // probably need to refine this test.
1184                                         // Right now we only have to test for
1185                                         // single line hull insets.
1186                                         if (grid.nrows() > 1)
1187                                                 delEmptyLastRow(grid);
1188                                         return success_;
1189                                 }
1190                         } else
1191                                 error("found 'end' unexpectedly");
1192                 }
1193
1194                 else if (t.cs() == ")") {
1195                         if (flags & FLAG_SIMPLE2)
1196                                 return success_;
1197                         error("found '\\)' unexpectedly");
1198                 }
1199
1200                 else if (t.cs() == "]") {
1201                         if (flags & FLAG_EQUATION)
1202                                 return success_;
1203                         error("found '\\]' unexpectedly");
1204                 }
1205
1206                 else if (t.cs() == "\\") {
1207                         if (flags & FLAG_ALIGN)
1208                                 return success_;
1209                         bool added = false;
1210                         if (nextToken().asInput() == "*") {
1211                                 getToken();
1212                                 added = addRow(grid, cellrow, docstring(), false);
1213                         } else if (good())
1214                                 added = addRow(grid, cellrow, getArg('[', ']'));
1215                         else
1216                                 error("missing token after \\\\");
1217                         if (added) {
1218                                 cellcol = 0;
1219                                 if (grid.asHullInset())
1220                                         grid.asHullInset()->numbered(
1221                                                         cellrow, numbered);
1222                                 cell = &grid.cell(grid.index(cellrow,
1223                                                              cellcol));
1224                         }
1225                 }
1226
1227 #if 0
1228                 else if (t.cs() == "multicolumn") {
1229                         // extract column count and insert dummy cells
1230                         MathData count;
1231                         parse(count, FLAG_ITEM, mode);
1232                         int cols = 1;
1233                         if (!extractNumber(count, cols)) {
1234                                 success_ = false;
1235                                 lyxerr << " can't extract number of cells from " << count << endl;
1236                         }
1237                         // resize the table if necessary
1238                         for (int i = 0; i < cols; ++i) {
1239                                 if (addCol(grid, cellcol)) {
1240                                         cell = &grid.cell(grid.index(
1241                                                         cellrow, cellcol));
1242                                         // mark this as dummy
1243                                         grid.cellinfo(grid.index(
1244                                                 cellrow, cellcol)).dummy_ = true;
1245                                 }
1246                         }
1247                         // the last cell is the real thing, not a dummy
1248                         grid.cellinfo(grid.index(cellrow, cellcol)).dummy_ = false;
1249
1250                         // read special alignment
1251                         MathData align;
1252                         parse(align, FLAG_ITEM, mode);
1253                         //grid.cellinfo(grid.index(cellrow, cellcol)).align_ = extractString(align);
1254
1255                         // parse the remaining contents into the "real" cell
1256                         parse(*cell, FLAG_ITEM, mode);
1257                 }
1258 #endif
1259
1260                 else if (t.cs() == "limits")
1261                         limits = 1;
1262
1263                 else if (t.cs() == "nolimits")
1264                         limits = -1;
1265
1266                 else if (t.cs() == "nonumber") {
1267                         if (grid.asHullInset())
1268                                 grid.asHullInset()->numbered(cellrow, false);
1269                 }
1270
1271                 else if (t.cs() == "number") {
1272                         if (grid.asHullInset())
1273                                 grid.asHullInset()->numbered(cellrow, true);
1274                 }
1275
1276                 else if (t.cs() == "hline") {
1277                         grid.rowinfo(cellrow).lines_ ++;
1278                 }
1279
1280                 else if (t.cs() == "sqrt") {
1281                         MathData ar;
1282                         parse(ar, FLAG_OPTION, mode);
1283                         if (ar.size()) {
1284                                 cell->push_back(MathAtom(new InsetMathRoot));
1285                                 cell->back().nucleus()->cell(0) = ar;
1286                                 parse(cell->back().nucleus()->cell(1), FLAG_ITEM, mode);
1287                         } else {
1288                                 cell->push_back(MathAtom(new InsetMathSqrt));
1289                                 parse(cell->back().nucleus()->cell(0), FLAG_ITEM, mode);
1290                         }
1291                 }
1292
1293                 else if (t.cs() == "unit") {
1294                         // Allowed formats \unit[val]{unit}
1295                         MathData ar;
1296                         parse(ar, FLAG_OPTION, mode);
1297                         if (ar.size()) {
1298                                 cell->push_back(MathAtom(new InsetMathFrac(InsetMathFrac::UNIT)));
1299                                 cell->back().nucleus()->cell(0) = ar;
1300                                 parse(cell->back().nucleus()->cell(1), FLAG_ITEM, mode);
1301                         } else {
1302                                 cell->push_back(MathAtom(new InsetMathFrac(InsetMathFrac::UNIT, 1)));
1303                                 parse(cell->back().nucleus()->cell(0), FLAG_ITEM, mode);
1304                         }
1305                 }
1306
1307                 else if (t.cs() == "unitfrac") {
1308                         // Here allowed formats are \unitfrac[val]{num}{denom}
1309                         MathData ar;
1310                         parse(ar, FLAG_OPTION, mode);
1311                         if (ar.size()) {
1312                                 cell->push_back(MathAtom(new InsetMathFrac(InsetMathFrac::UNITFRAC, 3)));
1313                                 cell->back().nucleus()->cell(2) = ar;
1314                         } else {
1315                                 cell->push_back(MathAtom(new InsetMathFrac(InsetMathFrac::UNITFRAC)));
1316                         }
1317                         parse(cell->back().nucleus()->cell(0), FLAG_ITEM, mode);
1318                         parse(cell->back().nucleus()->cell(1), FLAG_ITEM, mode);
1319                 }
1320
1321                 else if (t.cs() == "cfrac") {
1322                         // Here allowed formats are \cfrac[pos]{num}{denom}
1323                         MathData ar;
1324                         parse(ar, FLAG_OPTION, mode);
1325                         if (ar.size()) {
1326                                 cell->push_back(MathAtom(new InsetMathFrac(InsetMathFrac::CFRAC, 3)));
1327                                 cell->back().nucleus()->cell(2) = ar;
1328                         } else {
1329                                 cell->push_back(MathAtom(new InsetMathFrac(InsetMathFrac::CFRAC)));
1330                         }
1331                         parse(cell->back().nucleus()->cell(0), FLAG_ITEM, mode);
1332                         parse(cell->back().nucleus()->cell(1), FLAG_ITEM, mode);
1333                 }
1334
1335                 else if (t.cs() == "xrightarrow" || t.cs() == "xleftarrow") {
1336                         cell->push_back(createInsetMath(t.cs()));
1337                         parse(cell->back().nucleus()->cell(1), FLAG_OPTION, mode);
1338                         parse(cell->back().nucleus()->cell(0), FLAG_ITEM, mode);
1339                 }
1340
1341                 else if (t.cs() == "ref" || t.cs() == "eqref" || t.cs() == "prettyref"
1342                           || t.cs() == "pageref" || t.cs() == "vpageref" || t.cs() == "vref") {
1343                         cell->push_back(MathAtom(new InsetMathRef(t.cs())));
1344                         parse(cell->back().nucleus()->cell(1), FLAG_OPTION, mode);
1345                         parse(cell->back().nucleus()->cell(0), FLAG_ITEM, mode);
1346                 }
1347
1348                 else if (t.cs() == "left") {
1349                         skipSpaces();
1350                         Token const & tl = getToken();
1351                         // \| and \Vert are equivalent, and InsetMathDelim
1352                         // can't handle \|
1353                         // FIXME: fix this in InsetMathDelim itself!
1354                         docstring const l = tl.cs() == "|" ? from_ascii("Vert") : tl.asString();
1355                         MathData ar;
1356                         parse(ar, FLAG_RIGHT, mode);
1357                         if (!good())
1358                                 break;
1359                         skipSpaces();
1360                         Token const & tr = getToken();
1361                         docstring const r = tr.cs() == "|" ? from_ascii("Vert") : tr.asString();
1362                         cell->push_back(MathAtom(new InsetMathDelim(l, r, ar)));
1363                 }
1364
1365                 else if (t.cs() == "right") {
1366                         if (flags & FLAG_RIGHT)
1367                                 return success_;
1368                         //lyxerr << "got so far: '" << cell << "'" << endl;
1369                         error("Unmatched right delimiter");
1370                         return success_;
1371                 }
1372
1373                 else if (t.cs() == "begin") {
1374                         docstring const name = getArg('{', '}');
1375                         environments_.push_back(name);
1376
1377                         if (name == "array" || name == "subarray") {
1378                                 docstring const valign = parse_verbatim_option() + 'c';
1379                                 docstring const halign = parse_verbatim_item();
1380                                 cell->push_back(MathAtom(new InsetMathArray(name,
1381                                         InsetMathGrid::guessColumns(halign), 1, (char)valign[0], halign)));
1382                                 parse2(cell->back(), FLAG_END, mode, false);
1383                         }
1384
1385                         else if (name == "tabular") {
1386                                 docstring const valign = parse_verbatim_option() + 'c';
1387                                 docstring const halign = parse_verbatim_item();
1388                                 cell->push_back(MathAtom(new InsetMathTabular(name,
1389                                         InsetMathGrid::guessColumns(halign), 1, (char)valign[0], halign)));
1390                                 parse2(cell->back(), FLAG_END, InsetMath::TEXT_MODE, false);
1391                         }
1392
1393                         else if (name == "split" || name == "cases") {
1394                                 cell->push_back(createInsetMath(name));
1395                                 parse2(cell->back(), FLAG_END, mode, false);
1396                         }
1397
1398                         else if (name == "alignedat") {
1399                                 docstring const valign = parse_verbatim_option() + 'c';
1400                                 // ignore this for a while
1401                                 getArg('{', '}');
1402                                 cell->push_back(MathAtom(new InsetMathSplit(name, (char)valign[0])));
1403                                 parse2(cell->back(), FLAG_END, mode, false);
1404                         }
1405
1406                         else if (name == "math") {
1407                                 if (mode == InsetMath::MATH_MODE) {
1408                                         error("bad math environment");
1409                                         break;
1410                                 }
1411                                 cell->push_back(MathAtom(new InsetMathHull(hullSimple)));
1412                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, true);
1413                         }
1414
1415                         else if (name == "equation" || name == "equation*"
1416                                         || name == "displaymath") {
1417                                 if (mode != InsetMath::UNDECIDED_MODE) {
1418                                         error("bad math environment");
1419                                         break;
1420                                 }
1421                                 cell->push_back(MathAtom(new InsetMathHull(hullEquation)));
1422                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, (name == "equation"));
1423                         }
1424
1425                         else if (name == "eqnarray" || name == "eqnarray*") {
1426                                 if (mode != InsetMath::UNDECIDED_MODE) {
1427                                         error("bad math environment");
1428                                         break;
1429                                 }
1430                                 cell->push_back(MathAtom(new InsetMathHull(hullEqnArray)));
1431                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, !stared(name));
1432                         }
1433
1434                         else if (name == "align" || name == "align*") {
1435                                 if (mode != InsetMath::UNDECIDED_MODE) {
1436                                         error("bad math environment");
1437                                         break;
1438                                 }
1439                                 cell->push_back(MathAtom(new InsetMathHull(hullAlign)));
1440                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, !stared(name));
1441                         }
1442
1443                         else if (name == "flalign" || name == "flalign*") {
1444                                 if (mode != InsetMath::UNDECIDED_MODE) {
1445                                         error("bad math environment");
1446                                         break;
1447                                 }
1448                                 cell->push_back(MathAtom(new InsetMathHull(hullFlAlign)));
1449                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, !stared(name));
1450                         }
1451
1452                         else if (name == "alignat" || name == "alignat*") {
1453                                 if (mode != InsetMath::UNDECIDED_MODE) {
1454                                         error("bad math environment");
1455                                         break;
1456                                 }
1457                                 // ignore this for a while
1458                                 getArg('{', '}');
1459                                 cell->push_back(MathAtom(new InsetMathHull(hullAlignAt)));
1460                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, !stared(name));
1461                         }
1462
1463                         else if (name == "xalignat" || name == "xalignat*") {
1464                                 if (mode != InsetMath::UNDECIDED_MODE) {
1465                                         error("bad math environment");
1466                                         break;
1467                                 }
1468                                 // ignore this for a while
1469                                 getArg('{', '}');
1470                                 cell->push_back(MathAtom(new InsetMathHull(hullXAlignAt)));
1471                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, !stared(name));
1472                         }
1473
1474                         else if (name == "xxalignat") {
1475                                 if (mode != InsetMath::UNDECIDED_MODE) {
1476                                         error("bad math environment");
1477                                         break;
1478                                 }
1479                                 // ignore this for a while
1480                                 getArg('{', '}');
1481                                 cell->push_back(MathAtom(new InsetMathHull(hullXXAlignAt)));
1482                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, !stared(name));
1483                         }
1484
1485                         else if (name == "multline" || name == "multline*") {
1486                                 if (mode != InsetMath::UNDECIDED_MODE) {
1487                                         error("bad math environment");
1488                                         break;
1489                                 }
1490                                 cell->push_back(MathAtom(new InsetMathHull(hullMultline)));
1491                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, !stared(name));
1492                         }
1493
1494                         else if (name == "gather" || name == "gather*") {
1495                                 if (mode != InsetMath::UNDECIDED_MODE) {
1496                                         error("bad math environment");
1497                                         break;
1498                                 }
1499                                 cell->push_back(MathAtom(new InsetMathHull(hullGather)));
1500                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, !stared(name));
1501                         }
1502
1503                         else if (latexkeys const * l = in_word_set(name)) {
1504                                 if (l->inset == "matrix") {
1505                                         cell->push_back(createInsetMath(name));
1506                                         parse2(cell->back(), FLAG_END, mode, false);
1507                                 } else if (l->inset == "split") {
1508                                         docstring const valign = parse_verbatim_option() + 'c';
1509                                         cell->push_back(MathAtom(new InsetMathSplit(name, (char)valign[0])));
1510                                         parse2(cell->back(), FLAG_END, mode, false);
1511                                 } else {
1512                                         success_ = false;
1513                                         if (!(mode_ & Parse::QUIET)) {
1514                                                 dump();
1515                                                 lyxerr << "found math environment `"
1516                                                        << to_utf8(name)
1517                                                        << "' in symbols file with unsupported inset `"
1518                                                        << to_utf8(l->inset)
1519                                                        << "'." << endl;
1520                                         }
1521                                         // create generic environment inset
1522                                         cell->push_back(MathAtom(new InsetMathEnv(name)));
1523                                         parse(cell->back().nucleus()->cell(0), FLAG_END, mode);
1524                                 }
1525                         }
1526
1527                         else {
1528                                 success_ = false;
1529                                 if (!(mode_ & Parse::QUIET)) {
1530                                         dump();
1531                                         lyxerr << "found unknown math environment '"
1532                                                << to_utf8(name) << "'" << endl;
1533                                 }
1534                                 // create generic environment inset
1535                                 cell->push_back(MathAtom(new InsetMathEnv(name)));
1536                                 parse(cell->back().nucleus()->cell(0), FLAG_END, mode);
1537                         }
1538                 }
1539
1540                 else if (t.cs() == "kern") {
1541                         // FIXME: A hack...
1542                         docstring s;
1543                         while (true) {
1544                                 Token const & t = getToken();
1545                                 if (!good()) {
1546                                         putback();
1547                                         break;
1548                                 }
1549                                 s += t.character();
1550                                 if (isValidLength(to_utf8(s)))
1551                                         break;
1552                         }
1553                         cell->push_back(MathAtom(new InsetMathKern(s)));
1554                 }
1555
1556                 else if (t.cs() == "label") {
1557                         // FIXME: This is swallowed in inline formulas
1558                         docstring label = parse_verbatim_item();
1559                         MathData ar;
1560                         asArray(label, ar);
1561                         if (grid.asHullInset()) {
1562                                 grid.asHullInset()->label(cellrow, label);
1563                         } else {
1564                                 cell->push_back(createInsetMath(t.cs()));
1565                                 cell->push_back(MathAtom(new InsetMathBrace(ar)));
1566                         }
1567                 }
1568
1569                 else if (t.cs() == "choose" || t.cs() == "over"
1570                                 || t.cs() == "atop" || t.cs() == "brace"
1571                                 || t.cs() == "brack") {
1572                         MathAtom at = createInsetMath(t.cs());
1573                         at.nucleus()->cell(0) = *cell;
1574                         cell->clear();
1575                         parse(at.nucleus()->cell(1), flags, mode);
1576                         cell->push_back(at);
1577                         return success_;
1578                 }
1579
1580                 else if (t.cs() == "color") {
1581                         docstring const color = parse_verbatim_item();
1582                         cell->push_back(MathAtom(new InsetMathColor(true, color)));
1583                         parse(cell->back().nucleus()->cell(0), flags, mode);
1584                         return success_;
1585                 }
1586
1587                 else if (t.cs() == "textcolor") {
1588                         docstring const color = parse_verbatim_item();
1589                         cell->push_back(MathAtom(new InsetMathColor(false, color)));
1590                         parse(cell->back().nucleus()->cell(0), FLAG_ITEM, InsetMath::TEXT_MODE);
1591                 }
1592
1593                 else if (t.cs() == "normalcolor") {
1594                         cell->push_back(createInsetMath(t.cs()));
1595                         parse(cell->back().nucleus()->cell(0), flags, mode);
1596                         return success_;
1597                 }
1598
1599                 else if (t.cs() == "substack") {
1600                         cell->push_back(createInsetMath(t.cs()));
1601                         parse2(cell->back(), FLAG_ITEM, mode, false);
1602                 }
1603
1604                 else if (t.cs() == "xymatrix") {
1605                         odocstringstream os;
1606                         while (good() && nextToken().cat() != catBegin)
1607                                 os << getToken().asInput();
1608                         cell->push_back(createInsetMath(t.cs() + os.str()));
1609                         parse2(cell->back(), FLAG_ITEM, mode, false);
1610                 }
1611
1612                 else if (t.cs() == "framebox" || t.cs() == "makebox") {
1613                         cell->push_back(createInsetMath(t.cs()));
1614                         parse(cell->back().nucleus()->cell(0), FLAG_OPTION, InsetMath::TEXT_MODE);
1615                         parse(cell->back().nucleus()->cell(1), FLAG_OPTION, InsetMath::TEXT_MODE);
1616                         parse(cell->back().nucleus()->cell(2), FLAG_ITEM, InsetMath::TEXT_MODE);
1617                 }
1618
1619                 else if (t.cs() == "tag") {
1620                         if (nextToken().character() == '*') {
1621                                 getToken();
1622                                 cell->push_back(createInsetMath(t.cs() + '*'));
1623                         } else
1624                                 cell->push_back(createInsetMath(t.cs()));
1625                         parse(cell->back().nucleus()->cell(0), FLAG_ITEM, InsetMath::TEXT_MODE);
1626                 }
1627
1628                 else if (t.cs() == "hspace" && nextToken().character() != '*') {
1629                         docstring const name = t.cs();
1630                         docstring const arg = parse_verbatim_item();
1631                         Length length;
1632                         if (isValidLength(to_utf8(arg), &length))
1633                                 cell->push_back(MathAtom(new InsetMathSpace(length)));
1634                         else {
1635                                 // Since the Length class cannot use length variables
1636                                 // we must not create an InsetMathSpace.
1637                                 cell->push_back(MathAtom(new MathMacro(name)));
1638                                 MathData ar;
1639                                 mathed_parse_cell(ar, '{' + arg + '}');
1640                                 cell->append(ar);
1641                         }
1642                 }
1643
1644 #if 0
1645                 else if (t.cs() == "infer") {
1646                         MathData ar;
1647                         parse(ar, FLAG_OPTION, mode);
1648                         cell->push_back(createInsetMath(t.cs()));
1649                         parse2(cell->back(), FLAG_ITEM, mode, false);
1650                 }
1651
1652                 // Disabled
1653                 else if (1 && t.cs() == "ar") {
1654                         auto_ptr<InsetMathXYArrow> p(new InsetMathXYArrow);
1655                         // try to read target
1656                         parse(p->cell(0), FLAG_OTPTION, mode);
1657                         // try to read label
1658                         if (nextToken().cat() == catSuper || nextToken().cat() == catSub) {
1659                                 p->up_ = nextToken().cat() == catSuper;
1660                                 getToken();
1661                                 parse(p->cell(1), FLAG_ITEM, mode);
1662                                 //lyxerr << "read label: " << p->cell(1) << endl;
1663                         }
1664
1665                         cell->push_back(MathAtom(p.release()));
1666                         //lyxerr << "read cell: " << cell << endl;
1667                 }
1668 #endif
1669
1670                 else if (t.cs() == "lyxmathsym") {
1671                         skipSpaces();
1672                         if (getToken().cat() != catBegin) {
1673                                 error("'{' expected in \\" + t.cs());
1674                                 return success_;
1675                         }
1676                         int count = 0;
1677                         docstring cmd;
1678                         CatCode cat = nextToken().cat();
1679                         while (good() && (count || cat != catEnd)) {
1680                                 if (cat == catBegin)
1681                                         ++count;
1682                                 else if (cat == catEnd)
1683                                         --count;
1684                                 cmd += getToken().asInput();
1685                                 cat = nextToken().cat();
1686                         }
1687                         if (getToken().cat() != catEnd) {
1688                                 error("'}' expected in \\" + t.cs());
1689                                 return success_;
1690                         }
1691                         docstring rem;
1692                         do {
1693                                 cmd = Encodings::fromLaTeXCommand(cmd, rem);
1694                                 for (size_t i = 0; i < cmd.size(); ++i)
1695                                         cell->push_back(MathAtom(new InsetMathChar(cmd[i])));
1696                                 if (rem.size()) {
1697                                         char_type c = rem[0];
1698                                         cell->push_back(MathAtom(new InsetMathChar(c)));
1699                                         cmd = rem.substr(1);
1700                                         rem.clear();
1701                                 } else
1702                                         cmd.clear();
1703                         } while (cmd.size());
1704                 }
1705
1706                 else if (t.cs().size()) {
1707                         latexkeys const * l = in_word_set(t.cs());
1708                         if (l) {
1709                                 if (l->inset == "big") {
1710                                         skipSpaces();
1711                                         docstring const delim = getToken().asInput();
1712                                         if (InsetMathBig::isBigInsetDelim(delim))
1713                                                 cell->push_back(MathAtom(
1714                                                         new InsetMathBig(t.cs(), delim)));
1715                                         else {
1716                                                 cell->push_back(createInsetMath(t.cs()));
1717                                                 putback();
1718                                         }
1719                                 }
1720
1721                                 else if (l->inset == "font") {
1722                                         cell->push_back(createInsetMath(t.cs()));
1723                                         parse(cell->back().nucleus()->cell(0),
1724                                                 FLAG_ITEM, asMode(mode, l->extra));
1725                                 }
1726
1727                                 else if (l->inset == "oldfont") {
1728                                         cell->push_back(createInsetMath(t.cs()));
1729                                         parse(cell->back().nucleus()->cell(0),
1730                                                 flags | FLAG_ALIGN, asMode(mode, l->extra));
1731                                         if (prevToken().cat() != catAlign &&
1732                                             prevToken().cs() != "\\")
1733                                                 return success_;
1734                                         putback();
1735                                 }
1736
1737                                 else if (l->inset == "style") {
1738                                         cell->push_back(createInsetMath(t.cs()));
1739                                         parse(cell->back().nucleus()->cell(0),
1740                                                 flags | FLAG_ALIGN, mode);
1741                                         if (prevToken().cat() != catAlign &&
1742                                             prevToken().cs() != "\\")
1743                                                 return success_;
1744                                         putback();
1745                                 }
1746
1747                                 else {
1748                                         MathAtom at = createInsetMath(t.cs());
1749                                         for (InsetMath::idx_type i = 0; i < at->nargs(); ++i)
1750                                                 parse(at.nucleus()->cell(i),
1751                                                         FLAG_ITEM, asMode(mode, l->extra));
1752                                         cell->push_back(at);
1753                                 }
1754                         }
1755
1756                         else {
1757                                 bool is_unicode_symbol = false;
1758                                 if (mode == InsetMath::TEXT_MODE) {
1759                                         int num_tokens = 0;
1760                                         docstring cmd = prevToken().asInput();
1761                                         skipSpaces();
1762                                         CatCode cat = nextToken().cat();
1763                                         if (cat == catBegin) {
1764                                                 int count = 0;
1765                                                 while (good() && (count || cat != catEnd)) {
1766                                                         cat = nextToken().cat();
1767                                                         cmd += getToken().asInput();
1768                                                         ++num_tokens;
1769                                                         if (cat == catBegin)
1770                                                                 ++count;
1771                                                         else if (cat == catEnd)
1772                                                                 --count;
1773                                                 }
1774                                         }
1775                                         bool is_combining;
1776                                         char_type c =
1777                                                 Encodings::fromLaTeXCommand(cmd, is_combining);
1778                                         if (is_combining) {
1779                                                 if (cat == catLetter)
1780                                                         cmd += '{';
1781                                                 cmd += getToken().asInput();
1782                                                 ++num_tokens;
1783                                                 if (cat == catLetter)
1784                                                         cmd += '}';
1785                                                 c = Encodings::fromLaTeXCommand(cmd, is_combining);
1786                                         }
1787                                         if (c) {
1788                                                 is_unicode_symbol = true;
1789                                                 cell->push_back(MathAtom(new InsetMathChar(c)));
1790                                         } else {
1791                                                 while (num_tokens--)
1792                                                         putback();
1793                                         }
1794                                 }
1795                                 if (!is_unicode_symbol) {
1796                                         MathAtom at = createInsetMath(t.cs());
1797                                         InsetMath::mode_type m = mode;
1798                                         //if (m == InsetMath::UNDECIDED_MODE)
1799                                         //lyxerr << "default creation: m1: " << m << endl;
1800                                         if (at->currentMode() != InsetMath::UNDECIDED_MODE)
1801                                                 m = at->currentMode();
1802                                         //lyxerr << "default creation: m2: " << m << endl;
1803                                         InsetMath::idx_type start = 0;
1804                                         // this fails on \bigg[...\bigg]
1805                                         //MathData opt;
1806                                         //parse(opt, FLAG_OPTION, InsetMath::VERBATIM_MODE);
1807                                         //if (opt.size()) {
1808                                         //      start = 1;
1809                                         //      at.nucleus()->cell(0) = opt;
1810                                         //}
1811                                         for (InsetMath::idx_type i = start; i < at->nargs(); ++i) {
1812                                                 parse(at.nucleus()->cell(i), FLAG_ITEM, m);
1813                                                 skipSpaces();
1814                                         }
1815                                         cell->push_back(at);
1816                                 }
1817                         }
1818                 }
1819
1820
1821                 if (flags & FLAG_LEAVE) {
1822                         flags &= ~FLAG_LEAVE;
1823                         break;
1824                 }
1825         }
1826         return success_;
1827 }
1828
1829
1830
1831 } // anonymous namespace
1832
1833
1834 bool mathed_parse_cell(MathData & ar, docstring const & str, Parse::flags f)
1835 {
1836         return Parser(str, f).parse(ar, 0, f & Parse::TEXTMODE ?
1837                                 InsetMath::TEXT_MODE : InsetMath::MATH_MODE);
1838 }
1839
1840
1841 bool mathed_parse_cell(MathData & ar, istream & is, Parse::flags f)
1842 {
1843         return Parser(is, f).parse(ar, 0, f & Parse::TEXTMODE ?
1844                                 InsetMath::TEXT_MODE : InsetMath::MATH_MODE);
1845 }
1846
1847
1848 bool mathed_parse_normal(MathAtom & t, docstring const & str, Parse::flags f)
1849 {
1850         return Parser(str, f).parse(t);
1851 }
1852
1853
1854 bool mathed_parse_normal(MathAtom & t, Lexer & lex, Parse::flags f)
1855 {
1856         return Parser(lex, f).parse(t);
1857 }
1858
1859
1860 bool mathed_parse_normal(InsetMathGrid & grid, docstring const & str, Parse::flags f)
1861 {
1862         return Parser(str, f).parse1(grid, 0, f & Parse::TEXTMODE ?
1863                         InsetMath::TEXT_MODE : InsetMath::MATH_MODE, false);
1864 }
1865
1866
1867 void initParser()
1868 {
1869         fill(theCatcode, theCatcode + 128, catOther);
1870         fill(theCatcode + 'a', theCatcode + 'z' + 1, catLetter);
1871         fill(theCatcode + 'A', theCatcode + 'Z' + 1, catLetter);
1872
1873         theCatcode[int('\\')] = catEscape;
1874         theCatcode[int('{')]  = catBegin;
1875         theCatcode[int('}')]  = catEnd;
1876         theCatcode[int('$')]  = catMath;
1877         theCatcode[int('&')]  = catAlign;
1878         theCatcode[int('\n')] = catNewline;
1879         theCatcode[int('#')]  = catParameter;
1880         theCatcode[int('^')]  = catSuper;
1881         theCatcode[int('_')]  = catSub;
1882         theCatcode[int(0x7f)] = catIgnore;
1883         theCatcode[int(' ')]  = catSpace;
1884         theCatcode[int('\t')] = catSpace;
1885         theCatcode[int('\r')] = catNewline;
1886         theCatcode[int('~')]  = catActive;
1887         theCatcode[int('%')]  = catComment;
1888 }
1889
1890
1891 } // namespace lyx