]> git.lyx.org Git - lyx.git/blob - src/mathed/MathParser.cpp
simplify Lexer use a bit
[lyx.git] / src / mathed / MathParser.cpp
1 /**
2  * \file MathParser.cpp
3  * This file is part of LyX, the document processor.
4  * Licence details can be found in the file COPYING.
5  *
6  * \author André Pönitz
7  *
8  * Full author contact details are available in file CREDITS.
9  */
10
11 /*
12
13 If someone desperately needs partial "structures" (such as a few
14 cells of an array inset or similar) (s)he could use the
15 following hack as starting point to write some macros:
16
17   \newif\ifcomment
18   \commentfalse
19   \ifcomment
20           \def\makeamptab{\catcode`\&=4\relax}
21           \def\makeampletter{\catcode`\&=11\relax}
22     \def\b{\makeampletter\expandafter\makeamptab\bi}
23     \long\def\bi#1\e{}
24   \else
25     \def\b{}\def\e{}
26   \fi
27   ...
28
29   \[\begin{array}{ccc}
30 1
31 &
32
33   \end{array}\]
34
35 */
36
37
38 #include <config.h>
39
40 #include "MathParser.h"
41
42 #include "InsetMathArray.h"
43 #include "InsetMathBig.h"
44 #include "InsetMathBrace.h"
45 #include "InsetMathChar.h"
46 #include "InsetMathColor.h"
47 #include "InsetMathComment.h"
48 #include "InsetMathDelim.h"
49 #include "InsetMathEnv.h"
50 #include "InsetMathFrac.h"
51 #include "InsetMathKern.h"
52 #include "MathMacro.h"
53 #include "InsetMathPar.h"
54 #include "InsetMathRef.h"
55 #include "InsetMathRoot.h"
56 #include "InsetMathScript.h"
57 #include "InsetMathSplit.h"
58 #include "InsetMathSqrt.h"
59 #include "InsetMathTabular.h"
60 #include "MathMacroTemplate.h"
61 #include "MathFactory.h"
62 #include "MathMacroArgument.h"
63 #include "MathSupport.h"
64
65 #include "Lexer.h"
66
67 #include "support/debug.h"
68 #include "support/convert.h"
69 #include "support/docstream.h"
70
71 #include <sstream>
72
73 //#define FILEDEBUG
74
75 using namespace std;
76
77 namespace lyx {
78
79 namespace {
80
81 InsetMath::mode_type asMode(InsetMath::mode_type oldmode, docstring const & str)
82 {
83         //lyxerr << "handling mode: '" << str << "'" << endl;
84         if (str == "mathmode")
85                 return InsetMath::MATH_MODE;
86         if (str == "textmode" || str == "forcetext")
87                 return InsetMath::TEXT_MODE;
88         return oldmode;
89 }
90
91
92 bool stared(docstring const & s)
93 {
94         size_t const n = s.size();
95         return n && s[n - 1] == '*';
96 }
97
98
99 /*!
100  * Add the row \p cellrow to \p grid.
101  * \returns wether the row could be added. Adding a row can fail for
102  * environments like "equation" that have a fixed number of rows.
103  */
104 bool addRow(InsetMathGrid & grid, InsetMathGrid::row_type & cellrow,
105             docstring const & vskip, bool allow_newpage_ = true)
106 {
107         ++cellrow;
108         if (cellrow == grid.nrows()) {
109                 //lyxerr << "adding row " << cellrow << endl;
110                 grid.addRow(cellrow - 1);
111                 if (cellrow == grid.nrows()) {
112                         // We can't add a row to this grid, so let's
113                         // append the content of this cell to the previous
114                         // one.
115                         // This does not happen in well formed .lyx files,
116                         // but LyX versions 1.3.x and older could create
117                         // such files and tex2lyx can still do that.
118                         --cellrow;
119                         lyxerr << "ignoring extra row";
120                         if (!vskip.empty())
121                                 lyxerr << " with extra space " << to_utf8(vskip);
122                         if (!allow_newpage_)
123                                 lyxerr << " with no page break allowed";
124                         lyxerr << '.' << endl;
125                         return false;
126                 }
127         }
128         grid.vcrskip(Length(to_utf8(vskip)), cellrow - 1);
129         grid.rowinfo(cellrow - 1).allow_newpage_ = allow_newpage_;
130         return true;
131 }
132
133
134 /*!
135  * Add the column \p cellcol to \p grid.
136  * \returns wether the column could be added. Adding a column can fail for
137  * environments like "eqnarray" that have a fixed number of columns.
138  */
139 bool addCol(InsetMathGrid & grid, InsetMathGrid::col_type & cellcol)
140 {
141         ++cellcol;
142         if (cellcol == grid.ncols()) {
143                 //lyxerr << "adding column " << cellcol << endl;
144                 grid.addCol(cellcol);
145                 if (cellcol == grid.ncols()) {
146                         // We can't add a column to this grid, so let's
147                         // append the content of this cell to the previous
148                         // one.
149                         // This does not happen in well formed .lyx files,
150                         // but LyX versions 1.3.x and older could create
151                         // such files and tex2lyx can still do that.
152                         --cellcol;
153                         lyxerr << "ignoring extra column." << endl;
154                         return false;
155                 }
156         }
157         return true;
158 }
159
160
161 /*!
162  * Check wether the last row is empty and remove it if yes.
163  * Otherwise the following code
164  * \verbatim
165 \begin{array}{|c|c|}
166 \hline
167 1 & 2 \\ \hline
168 3 & 4 \\ \hline
169 \end{array}
170  * \endverbatim
171  * will result in a grid with 3 rows (+ the dummy row that is always present),
172  * because the last '\\' opens a new row.
173  */
174 void delEmptyLastRow(InsetMathGrid & grid)
175 {
176         InsetMathGrid::row_type const row = grid.nrows() - 1;
177         for (InsetMathGrid::col_type col = 0; col < grid.ncols(); ++col) {
178                 if (!grid.cell(grid.index(row, col)).empty())
179                         return;
180         }
181         // Copy the row information of the empty row (which would contain the
182         // last hline in the example above) to the dummy row and delete the
183         // empty row.
184         grid.rowinfo(row + 1) = grid.rowinfo(row);
185         grid.delRow(row);
186 }
187
188
// TeX's category codes. Each enumerator is given the number TeX itself
// uses for that category.
enum CatCode {
        catEscape    = 0,   // backslash
        catBegin     = 1,   // {
        catEnd       = 2,   // }
        catMath      = 3,   // $
        catAlign     = 4,   // &
        catNewline   = 5,   // ^^M
        catParameter = 6,   // #
        catSuper     = 7,   // ^
        catSub       = 8,   // _
        catIgnore    = 9,
        catSpace     = 10,  // space
        catLetter    = 11,  // a-zA-Z
        catOther     = 12,  // none of the above
        catActive    = 13,  // ~
        catComment   = 14,  // %
        catInvalid   = 15   // <delete>
};
208
209 CatCode theCatcode[128];
210
211
212 inline CatCode catcode(char_type c)
213 {
214         /* The only characters that are not catOther lie in the pure ASCII
215          * range. Therefore theCatcode has only 128 entries.
216          * TeX itself deals with 8bit characters, so if needed this table
217          * could be enlarged to 256 entries.
218          * Any larger value does not make sense, since the fact that we use
219          * unicode internally does not change Knuth's TeX engine.
220          * Apart from that a table for the full 21bit UCS4 range would waste
221          * too much memory. */
222         if (c >= 128)
223                 return catOther;
224
225         return theCatcode[c];
226 }
227
228
229 enum { // bit flags, tested with '&' against the 'flags' argument of Parser::parse1()
230         FLAG_ALIGN      = 1 << 0,  //  next & or \\ ends the parsing process
231         FLAG_BRACE_LAST = 1 << 1,  //  next closing brace ends the parsing
232         FLAG_RIGHT      = 1 << 2,  //  next \right ends the parsing process
233         FLAG_END        = 1 << 3,  //  next \end ends the parsing process
234         FLAG_BRACK_LAST = 1 << 4,  //  next closing bracket ends the parsing
235         FLAG_TEXTMODE   = 1 << 5,  //  we are in a box
236         FLAG_ITEM       = 1 << 6,  //  read a single (possibly braced) token
237         FLAG_LEAVE      = 1 << 7,  //  leave the loop at the end
238         FLAG_SIMPLE     = 1 << 8,  //  next $ leaves the loop
239         FLAG_EQUATION   = 1 << 9,  //  next \] leaves the loop
240         FLAG_SIMPLE2    = 1 << 10, //  next \) leaves the loop
241         FLAG_OPTION     = 1 << 11, //  read [...] style option
242         FLAG_BRACED     = 1 << 12  //  read {...} style argument
243 };
244
245
246 //
247 // Helper class for parsing
248 //
249
250 class Token {
251 public:
252         ///
253         Token() : cs_(), char_(0), cat_(catIgnore) {}
254         ///
255         Token(char_type c, CatCode cat) : cs_(), char_(c), cat_(cat) {}
256         ///
257         explicit Token(docstring const & cs) : cs_(cs), char_(0), cat_(catIgnore) {}
258
259         ///
260         docstring const & cs() const { return cs_; }
261         ///
262         CatCode cat() const { return cat_; }
263         ///
264         char_type character() const { return char_; }
265         ///
266         docstring asString() const { return cs_.size() ? cs_ : docstring(1, char_); }
267         ///
268         docstring asInput() const { return cs_.size() ? '\\' + cs_ : docstring(1, char_); }
269
270 private:
271         ///
272         docstring cs_;
273         ///
274         char_type char_;
275         ///
276         CatCode cat_;
277 };
278
279
280 ostream & operator<<(ostream & os, Token const & t)
281 {
282         if (t.cs().size()) {
283                 docstring const & cs = t.cs();
284                 // FIXME: For some strange reason, the stream operator instanciate
285                 // a new Token before outputting the contents of t.cs().
286                 // Because of this the line
287                 //     os << '\\' << cs;
288                 // below becomes recursive.
289                 // In order to avoid that we return early:
290                 if (cs == "\\")
291                         return os;
292                 os << '\\' << to_utf8(cs);
293         }
294         else if (t.cat() == catLetter)
295                 os << t.character();
296         else
297                 os << '[' << t.character() << ',' << t.cat() << ']';
298         return os;
299 }
300
301
302 class Parser {
303 public:
304         /// Parsing mode type, taken over from InsetMath.
305         typedef  InsetMath::mode_type mode_type;
306
307         /// Tokenize the stream of \p lex (line count starts at lex's line number), then call lex.eatLine().
308         Parser(Lexer & lex);
309         /// Only use this for reading from .lyx file format, for the reason
310         /// see Parser::tokenize(istream &).
311         Parser(istream & is);
312         /// Tokenize the contents of \p str.
313         Parser(docstring const & str);
314
315         /// Parse the token stream into \p at; the implementation always returns true.
316         bool parse(MathAtom & at);
317         /// Parse into \p array; \p flags is a combination of the FLAG_* bits.
318         void parse(MathData & array, unsigned flags, mode_type mode);
319         /// Parse into the cells of \p grid, starting at its first cell.
320         void parse1(InsetMathGrid & grid, unsigned flags, mode_type mode,
321                 bool numbered);
322         /// Like parse(MathData &, unsigned, mode_type), but returns the result by value.
323         MathData parse(unsigned flags, mode_type mode);
324         /// Line counter: starts at the constructor's value, incremented for each newline seen while tokenizing.
325         int lineno() const { return lineno_; }
326         /// Step back one token (decrements the read position).
327         void putback();
328
329 private:
330         /// Parse into the grid inset held by \p at (forwards to parse1()).
331         void parse2(MathAtom & at, unsigned flags, mode_type mode, bool numbered);
332         /// get arg delimited by 'left' and 'right'
333         docstring getArg(char_type left, char_type right);
334         /// Character of the token at the read position, advancing past it; 0 at end of input.
335         char_type getChar();
336         /// Write \p msg as a math parse error to lyxerr, followed by a token dump.
337         void error(string const & msg);
338         void error(docstring const & msg) { error(to_utf8(msg)); }
339         /// dump contents to screen
340         void dump() const;
341         /// Only use this for reading from .lyx file format (see
342         /// implementation for reason)
343         void tokenize(istream & is);
344         /// Split \p s into tokens and append them to the token list.
345         void tokenize(docstring const & s);
346         /// Skip space and newline characters of \p is, starting with \p c; putback() is called on the last character read.
347         void skipSpaceTokens(idocstream & is, char_type c);
348         /// Append \p t to the token list.
349         void push_back(Token const & t);
350         /// Remove the last token from the token list.
351         void pop_back();
352         /// Token before the read position (an empty dummy token at the start).
353         Token const & prevToken() const;
354         /// Token at the read position, without consuming it (empty dummy at the end).
355         Token const & nextToken() const;
356         /// Token at the read position, advancing past it (empty dummy at the end).
357         Token const & getToken();
358         /// skips spaces if any
359         void skipSpaces();
360         /// NOTE(review): no definition of this member is visible in this part of the file.
361         void lex(docstring const & s);
362         /// True while unread tokens remain.
363         bool good() const;
364         /// Collect the text of a {...} group, without the outer braces.
365         docstring parse_verbatim_item();
366         /// Collect the text of a [...] option, without the brackets.
367         docstring parse_verbatim_option();
368
369         /// Line counter, used in error messages.
370         int lineno_;
371         /// Tokens produced by tokenize().
372         vector<Token> tokens_;
373         /// Index into tokens_ of the next token to read.
374         unsigned pos_;
375         /// Stack of active environments
376         vector<docstring> environments_;
377 };
378
379
380 Parser::Parser(Lexer & lexer)
381         : lineno_(lexer.lineNumber()), pos_(0)
382 {
383         tokenize(lexer.getStream());
384         lexer.eatLine();
385 }
386
387
388 Parser::Parser(istream & is)
389         : lineno_(0), pos_(0)
390 {
391         tokenize(is);
392 }
393
394
395 Parser::Parser(docstring const & str)
396         : lineno_(0), pos_(0)
397 {
398         tokenize(str);
399 }
400
401
402 void Parser::push_back(Token const & t)
403 {
404         tokens_.push_back(t);
405 }
406
407
408 void Parser::pop_back()
409 {
410         tokens_.pop_back();
411 }
412
413
414 Token const & Parser::prevToken() const
415 {
416         static const Token dummy;
417         return pos_ > 0 ? tokens_[pos_ - 1] : dummy;
418 }
419
420
421 Token const & Parser::nextToken() const
422 {
423         static const Token dummy;
424         return good() ? tokens_[pos_] : dummy;
425 }
426
427
428 Token const & Parser::getToken()
429 {
430         static const Token dummy;
431         //lyxerr << "looking at token " << tokens_[pos_] << " pos: " << pos_ << endl;
432         return good() ? tokens_[pos_++] : dummy;
433 }
434
435
436 void Parser::skipSpaces()
437 {
438         while (nextToken().cat() == catSpace || nextToken().cat() == catNewline)
439                 getToken();
440 }
441
442
443 void Parser::putback()
444 {
445         --pos_;
446 }
447
448
449 bool Parser::good() const
450 {
451         return pos_ < tokens_.size();
452 }
453
454
455 char_type Parser::getChar()
456 {
457         if (!good()) {
458                 error("The input stream is not well...");
459                 putback();
460                 return 0;
461         }
462         return tokens_[pos_++].character();
463 }
464
465
466 docstring Parser::getArg(char_type left, char_type right)
467 {
468         skipSpaces();
469
470         docstring result;
471         char_type c = getChar();
472
473         if (c != left)
474                 putback();
475         else
476                 while ((c = getChar()) != right && good())
477                         result += c;
478
479         return result;
480 }
481
482
483 void Parser::skipSpaceTokens(idocstream & is, char_type c)
484 {
485         // skip trailing spaces
486         while (catcode(c) == catSpace || catcode(c) == catNewline)
487                 if (!is.get(c))
488                         break;
489         //lyxerr << "putting back: " << c << endl;
490         is.putback(c);
491 }
492
493
494 void Parser::tokenize(istream & is)
495 {
496         // eat everything up to the next \end_inset or end of stream
497         // and store it in s for further tokenization
498         string s;
499         char c;
500         while (is.get(c)) {
501                 s += c;
502                 if (s.size() >= 10 && s.substr(s.size() - 10) == "\\end_inset") {
503                         s = s.substr(0, s.size() - 10);
504                         break;
505                 }
506         }
507         // Remove the space after \end_inset
508         if (is.get(c) && c != ' ')
509                 is.unget();
510
511         // tokenize buffer
512         tokenize(from_utf8(s));
513 }
514
515
516 void Parser::tokenize(docstring const & buffer)
517 {
518         idocstringstream is(buffer, ios::in | ios::binary);
519
520         char_type c;
521         while (is.get(c)) {
522                 //lyxerr << "reading c: " << c << endl;
523
524                 switch (catcode(c)) {
525                         case catNewline: {
526                                 ++lineno_;
527                                 is.get(c);
528                                 if (catcode(c) == catNewline)
529                                         ; //push_back(Token("par"));
530                                 else {
531                                         push_back(Token('\n', catNewline));
532                                         is.putback(c);
533                                 }
534                                 break;
535                         }
536
537 /*
538                         case catComment: {
539                                 while (is.get(c) && catcode(c) != catNewline)
540                                         ;
541                                 ++lineno_;
542                                 break;
543                         }
544 */
545
546                         case catEscape: {
547                                 is.get(c);
548                                 if (!is) {
549                                         error("unexpected end of input");
550                                 } else {
551                                         docstring s(1, c);
552                                         if (catcode(c) == catLetter) {
553                                                 // collect letters
554                                                 while (is.get(c) && catcode(c) == catLetter)
555                                                         s += c;
556                                                 skipSpaceTokens(is, c);
557                                         }
558                                         push_back(Token(s));
559                                 }
560                                 break;
561                         }
562
563                         case catSuper:
564                         case catSub: {
565                                 push_back(Token(c, catcode(c)));
566                                 is.get(c);
567                                 skipSpaceTokens(is, c);
568                                 break;
569                         }
570
571                         case catIgnore: {
572                                 lyxerr << "ignoring a char: " << int(c) << endl;
573                                 break;
574                         }
575
576                         default:
577                                 push_back(Token(c, catcode(c)));
578                 }
579         }
580
581 #ifdef FILEDEBUG
582         dump();
583 #endif
584 }
585
586
587 void Parser::dump() const
588 {
589         lyxerr << "\nTokens: ";
590         for (unsigned i = 0; i < tokens_.size(); ++i) {
591                 if (i == pos_)
592                         lyxerr << " <#> ";
593                 lyxerr << tokens_[i];
594         }
595         lyxerr << " pos: " << pos_ << endl;
596 }
597
598
599 void Parser::error(string const & msg)
600 {
601         lyxerr << "Line ~" << lineno_ << ": Math parse error: " << msg << endl;
602         dump();
603         //exit(1);
604 }
605
606
607 bool Parser::parse(MathAtom & at)
608 {
609         skipSpaces();
610         MathData ar;
611         parse(ar, false, InsetMath::UNDECIDED_MODE);
612         if (ar.size() != 1 || ar.front()->getType() == hullNone) {
613                 lyxerr << "unusual contents found: " << ar << endl;
614                 at = MathAtom(new InsetMathPar(ar));
615                 //if (at->nargs() > 0)
616                 //      at.nucleus()->cell(0) = ar;
617                 //else
618                 //      lyxerr << "unusual contents found: " << ar << endl;
619                 return true;
620         }
621         at = ar[0];
622         return true;
623 }
624
625
626 docstring Parser::parse_verbatim_option()
627 {
628         skipSpaces();
629         docstring res;
630         if (nextToken().character() == '[') {
631                 Token t = getToken();
632                 for (Token t = getToken(); t.character() != ']' && good(); t = getToken()) {
633                         if (t.cat() == catBegin) {
634                                 putback();
635                                 res += '{' + parse_verbatim_item() + '}';
636                         } else
637                                 res += t.asString();
638                 }
639         }
640         return res;
641 }
642
643
644 docstring Parser::parse_verbatim_item()
645 {
646         skipSpaces();
647         docstring res;
648         if (nextToken().cat() == catBegin) {
649                 Token t = getToken();
650                 for (Token t = getToken(); t.cat() != catEnd && good(); t = getToken()) {
651                         if (t.cat() == catBegin) {
652                                 putback();
653                                 res += '{' + parse_verbatim_item() + '}';
654                         }
655                         else
656                                 res += t.asString();
657                 }
658         }
659         return res;
660 }
661
662
663 MathData Parser::parse(unsigned flags, mode_type mode)
664 {
665         MathData ar;
666         parse(ar, flags, mode);
667         return ar;
668 }
669
670
671 void Parser::parse(MathData & array, unsigned flags, mode_type mode)
672 {
673         InsetMathGrid grid(1, 1);
674         parse1(grid, flags, mode, false);
675         array = grid.cell(0);
676 }
677
678
679 void Parser::parse2(MathAtom & at, const unsigned flags, const mode_type mode,
680         const bool numbered)
681 {
682         parse1(*(at.nucleus()->asGridInset()), flags, mode, numbered);
683 }
684
685
686 void Parser::parse1(InsetMathGrid & grid, unsigned flags,
687         const mode_type mode, const bool numbered)
688 {
689         int limits = 0;
690         InsetMathGrid::row_type cellrow = 0;
691         InsetMathGrid::col_type cellcol = 0;
692         MathData * cell = &grid.cell(grid.index(cellrow, cellcol));
693
694         if (grid.asHullInset())
695                 grid.asHullInset()->numbered(cellrow, numbered);
696
697         //dump();
698         //lyxerr << " flags: " << flags << endl;
699         //lyxerr << " mode: " << mode  << endl;
700         //lyxerr << "grid: " << grid << endl;
701
702         while (good()) {
703                 Token const & t = getToken();
704
705 #ifdef FILEDEBUG
706                 lyxerr << "t: " << t << " flags: " << flags << endl;
707                 lyxerr << "mode: " << mode  << endl;
708                 cell->dump();
709                 lyxerr << endl;
710 #endif
711
712                 if (flags & FLAG_ITEM) {
713
714                         if (t.cat() == catBegin) {
715                                 // skip the brace and collect everything to the next matching
716                                 // closing brace
717                                 parse1(grid, FLAG_BRACE_LAST, mode, numbered);
718                                 return;
719                         }
720
721                         // handle only this single token, leave the loop if done
722                         flags = FLAG_LEAVE;
723                 }
724
725
726                 if (flags & FLAG_BRACED) {
727                         if (t.cat() == catSpace)
728                                 continue;
729
730                         if (t.cat() != catBegin) {
731                                 error("opening brace expected");
732                                 return;
733                         }
734
735                         // skip the brace and collect everything to the next matching
736                         // closing brace
737                         flags = FLAG_BRACE_LAST;
738                 }
739
740
741                 if (flags & FLAG_OPTION) {
742                         if (t.cat() == catOther && t.character() == '[') {
743                                 MathData ar;
744                                 parse(ar, FLAG_BRACK_LAST, mode);
745                                 cell->append(ar);
746                         } else {
747                                 // no option found, put back token and we are done
748                                 putback();
749                         }
750                         return;
751                 }
752
753                 //
754                 // cat codes
755                 //
756                 if (t.cat() == catMath) {
757                         if (mode != InsetMath::MATH_MODE) {
758                                 // we are inside some text mode thingy, so opening new math is allowed
759                                 Token const & n = getToken();
760                                 if (n.cat() == catMath) {
761                                         // TeX's $$...$$ syntax for displayed math
762                                         cell->push_back(MathAtom(new InsetMathHull(hullEquation)));
763                                         parse2(cell->back(), FLAG_SIMPLE, InsetMath::MATH_MODE, false);
764                                         getToken(); // skip the second '$' token
765                                 } else {
766                                         // simple $...$  stuff
767                                         putback();
768                                         cell->push_back(MathAtom(new InsetMathHull(hullSimple)));
769                                         parse2(cell->back(), FLAG_SIMPLE, InsetMath::MATH_MODE, false);
770                                 }
771                         }
772
773                         else if (flags & FLAG_SIMPLE) {
774                                 // this is the end of the formula
775                                 return;
776                         }
777
778                         else {
779                                 error("something strange in the parser");
780                                 break;
781                         }
782                 }
783
784                 else if (t.cat() == catLetter)
785                         cell->push_back(MathAtom(new InsetMathChar(t.character())));
786
787                 else if (t.cat() == catSpace && mode != InsetMath::MATH_MODE) {
788                         if (cell->empty() || cell->back()->getChar() != ' ')
789                                 cell->push_back(MathAtom(new InsetMathChar(t.character())));
790                 }
791
792                 else if (t.cat() == catNewline && mode != InsetMath::MATH_MODE) {
793                         if (cell->empty() || cell->back()->getChar() != ' ')
794                                 cell->push_back(MathAtom(new InsetMathChar(' ')));
795                 }
796
797                 else if (t.cat() == catParameter) {
798                         Token const & n = getToken();
799                         cell->push_back(MathAtom(new MathMacroArgument(n.character()-'0')));
800                 }
801
802                 else if (t.cat() == catActive)
803                         cell->push_back(MathAtom(new InsetMathChar(t.character())));
804
805                 else if (t.cat() == catBegin) {
806                         MathData ar;
807                         parse(ar, FLAG_BRACE_LAST, mode);
808                         // do not create a BraceInset if they were written by LyX
809                         // this helps to keep the annoyance of  "a choose b"  to a minimum
810                         if (ar.size() == 1 && ar[0]->extraBraces())
811                                 cell->append(ar);
812                         else
813                                 cell->push_back(MathAtom(new InsetMathBrace(ar)));
814                 }
815
816                 else if (t.cat() == catEnd) {
817                         if (flags & FLAG_BRACE_LAST)
818                                 return;
819                         error("found '}' unexpectedly");
820                         //BOOST_ASSERT(false);
821                         //add(cell, '}', LM_TC_TEX);
822                 }
823
824                 else if (t.cat() == catAlign) {
825                         //lyxerr << " column now " << (cellcol + 1)
826                         //       << " max: " << grid.ncols() << endl;
827                         if (flags & FLAG_ALIGN)
828                                 return;
829                         if (addCol(grid, cellcol))
830                                 cell = &grid.cell(grid.index(cellrow, cellcol));
831                 }
832
833                 else if (t.cat() == catSuper || t.cat() == catSub) {
834                         bool up = (t.cat() == catSuper);
835                         // we need no new script inset if the last thing was a scriptinset,
836                         // which has that script already not the same script already
837                         if (!cell->size())
838                                 cell->push_back(MathAtom(new InsetMathScript(up)));
839                         else if (cell->back()->asScriptInset() &&
840                                         !cell->back()->asScriptInset()->has(up))
841                                 cell->back().nucleus()->asScriptInset()->ensure(up);
842                         else if (cell->back()->asScriptInset())
843                                 cell->push_back(MathAtom(new InsetMathScript(up)));
844                         else
845                                 cell->back() = MathAtom(new InsetMathScript(cell->back(), up));
846                         InsetMathScript * p = cell->back().nucleus()->asScriptInset();
847                         // special handling of {}-bases
848                         // Here we could remove the brace inset for things
849                         // like {a'}^2 and add the braces back in
850                         // InsetMathScript::write().
851                         // We do not do it, since it is not possible to detect
852                         // reliably whether the braces are needed because the
853                         // nucleus contains more than one symbol, or whether
854                         // they are needed for unknown commands like \xx{a}_0
855                         // or \yy{a}{b}_0. This was done in revision 14819
856                         // in an unreliable way. See this thread
857                         // http://www.mail-archive.com/lyx-devel%40lists.lyx.org/msg104917.html
858                         // for more details.
859                         parse(p->cell(p->idxOfScript(up)), FLAG_ITEM, mode);
860                         if (limits) {
861                                 p->limits(limits);
862                                 limits = 0;
863                         }
864                 }
865
866                 else if (t.character() == ']' && (flags & FLAG_BRACK_LAST)) {
867                         //lyxerr << "finished reading option" << endl;
868                         return;
869                 }
870
871                 else if (t.cat() == catOther)
872                         cell->push_back(MathAtom(new InsetMathChar(t.character())));
873
874                 else if (t.cat() == catComment) {
875                         docstring s;
876                         while (good()) {
877                                 Token const & t = getToken();
878                                 if (t.cat() == catNewline)
879                                         break;
880                                 s += t.asString();
881                         }
882                         cell->push_back(MathAtom(new InsetMathComment(s)));
883                         skipSpaces();
884                 }
885
886                 //
887                 // control sequences
888                 //
889
890                 else if (t.cs() == "lyxlock") {
891                         if (cell->size())
892                                 cell->back().nucleus()->lock(true);
893                 }
894
895                 else if ((t.cs() == "global" && nextToken().cs() == "def") ||
896                          t.cs() == "def") {
897                         if (t.cs() == "global")
898                                 getToken();
899                         
900                         // get name
901                         docstring name = getToken().cs();
902                         
903                         // read parameters
904                         int nargs = 0;
905                         docstring pars;
906                         while (good() && nextToken().cat() != catBegin) {
907                                 pars += getToken().cs();
908                                 ++nargs;
909                         }
910                         nargs /= 2;
911                         
912                         // read definition
913                         MathData def;
914                         parse(def, FLAG_ITEM, InsetMath::UNDECIDED_MODE);
915                         
916                         // is a version for display attached?
917                         skipSpaces();
918                         MathData display;
919                         if (nextToken().cat() == catBegin)
920                                 parse(display, FLAG_ITEM, InsetMath::MATH_MODE);
921                         
922                         cell->push_back(MathAtom(new MathMacroTemplate(name, nargs,
923                                0, MacroTypeDef, vector<MathData>(), def, display)));
924                 }
925                 
926                 else if (t.cs() == "newcommand" ||
927                          t.cs() == "renewcommand" ||
928                          t.cs() == "newlyxcommand") {
929                         // get name
930                         if (getToken().cat() != catBegin) {
931                                 error("'{' in \\newcommand expected (1) ");
932                                 return;
933                         }
934                         docstring name = getToken().cs();
935                         if (getToken().cat() != catEnd) {
936                                 error("'}' in \\newcommand expected");
937                                 return;
938                         }
939                                 
940                         // get arity
941                         docstring const arg = getArg('[', ']');
942                         int nargs = 0;
943                         if (!arg.empty())
944                                 nargs = convert<int>(arg);
945                                 
946                         // optional argument given?
947                         skipSpaces();
948                         int optionals = 0;
949                         vector<MathData> optionalValues;
950                         while (nextToken().character() == '[') {
951                                 getToken();
952                                 optionalValues.push_back(MathData());
953                                 parse(optionalValues[optionals], FLAG_BRACK_LAST, mode);
954                                 ++optionals;
955                         }
956                         
957                         MathData def;
958                         parse(def, FLAG_ITEM, InsetMath::UNDECIDED_MODE);
959                         
960                         // is a version for display attached?
961                         skipSpaces();
962                         MathData display;
963                         if (nextToken().cat() == catBegin)
964                                 parse(display, FLAG_ITEM, InsetMath::MATH_MODE);
965                         
966                         cell->push_back(MathAtom(new MathMacroTemplate(name, nargs,
967                                 optionals, MacroTypeNewcommand, optionalValues, def, display)));
968                         
969                 }
970                 
971                 else if (t.cs() == "newcommandx" ||
972                          t.cs() == "renewcommandx") {
973                         // \newcommandx{\foo}[2][usedefault, addprefix=\global,1=default]{#1,#2}
974                         // get name
975                         docstring name;
976                         if (nextToken().cat() == catBegin) {
977                                 getToken();
978                                 name = getToken().cs();
979                                 if (getToken().cat() != catEnd) {
980                                         error("'}' in \\newcommandx expected");
981                                         return;
982                                 }
983                         } else
984                                 name = getToken().cs();
985                                 
986                         // get arity
987                         docstring const arg = getArg('[', ']');
988                         if (arg.empty()) {
989                                 error("[num] in \\newcommandx expected");
990                                 return;
991                         }
992                         int nargs = convert<int>(arg);
993                         
994                         // get options
995                         int optionals = 0;
996                         vector<MathData> optionalValues;
997                         if (nextToken().character() == '[') {
998                                 // skip '['
999                                 getToken();
1000                                         
1001                                 // handle 'opt=value' options, separated by ','.
1002                                 skipSpaces();
1003                                 while (nextToken().character() != ']' && good()) {
1004                                         if (nextToken().character() >= '1'
1005                                             && nextToken().character() <= '9') {
1006                                                 // optional value -> get parameter number
1007                                                 int n = getChar() - '0';
1008                                                 if (n > nargs) {
1009                                                         error("Arity of \\newcommandx too low "
1010                                                               "for given optional parameter.");
1011                                                         return;
1012                                                 }
1013                                                 
1014                                                 // skip '='
1015                                                 if (getToken().character() != '=') {
1016                                                         error("'=' and optional parameter value "
1017                                                               "expected for \\newcommandx");
1018                                                         return;
1019                                                 }
1020                                                 
1021                                                 // get value
1022                                                 int optNum = max(size_t(n), optionalValues.size());
1023                                                 optionalValues.resize(optNum);
1024                                                 optionalValues[n - 1].clear();
1025                                                 while (nextToken().character() != ']'
1026                                                        && nextToken().character() != ',') {
1027                                                         MathData data;
1028                                                         parse(data, FLAG_ITEM, InsetMath::UNDECIDED_MODE);
1029                                                         optionalValues[n - 1].append(data);
1030                                                 }
1031                                                 optionals = max(n, optionals);
1032                                         } else if (nextToken().cat() == catLetter) {
1033                                                 // named options (e.g. usedefault) and their
1034                                                 // values are read here but otherwise ignored
1035                                                 
1036                                                 // get option name
1037                                                 docstring opt;
1038                                                 while (nextToken().cat() == catLetter)
1039                                                         opt += getChar();
1040                                         
1041                                                 // value?
1042                                                 skipSpaces();
1043                                                 MathData value;
1044                                                 if (nextToken().character() == '=') {
1045                                                         getToken();
1046                                                         while (nextToken().character() != ']'
1047                                                                 && nextToken().character() != ',')
1048                                                                 parse(value, FLAG_ITEM, 
1049                                                                       InsetMath::UNDECIDED_MODE);
1050                                                 }
1051                                         } else {
1052                                                 error("option for \\newcommandx expected");
1053                                                 return;
1054                                         }
1055                                         
1056                                         // skip comma
1057                                         skipSpaces();
1058                                         if (nextToken().character() == ',') {
1059                                                 getChar();
1060                                                 skipSpaces();
1061                                         } else if (nextToken().character() != ']') {
1062                                                 error("Expecting ',' or ']' in options "
1063                                                       "of \\newcommandx");
1064                                                 return;
1065                                         }
1066                                 }
1067                                 
1068                                 // skip ']'
1069                                 if (!good())
1070                                         return;
1071                                 getToken();
1072                         }
1073
1074                         // get definition
1075                         MathData def;
1076                         parse(def, FLAG_ITEM, InsetMath::UNDECIDED_MODE);
1077
1078                         // is a version for display attached?
1079                         skipSpaces();
1080                         MathData display;
1081                         if (nextToken().cat() == catBegin)
1082                                 parse(display, FLAG_ITEM, InsetMath::MATH_MODE);
1083
1084                         cell->push_back(MathAtom(new MathMacroTemplate(name, nargs,
1085                                 optionals, MacroTypeNewcommandx, optionalValues, def, 
1086                                 display)));
1087                 }
1088
1089                 else if (t.cs() == "(") {
1090                         cell->push_back(MathAtom(new InsetMathHull(hullSimple)));
1091                         parse2(cell->back(), FLAG_SIMPLE2, InsetMath::MATH_MODE, false);
1092                 }
1093
1094                 else if (t.cs() == "[") {
1095                         cell->push_back(MathAtom(new InsetMathHull(hullEquation)));
1096                         parse2(cell->back(), FLAG_EQUATION, InsetMath::MATH_MODE, false);
1097                 }
1098
1099                 else if (t.cs() == "protect")
1100                         // ignore \\protect, will hopefully be re-added during output
1101                         ;
1102
1103                 else if (t.cs() == "end") {
1104                         if (flags & FLAG_END) {
1105                                 // eat environment name
1106                                 docstring const name = getArg('{', '}');
1107                                 if (environments_.empty())
1108                                         error("'found \\end{" + name +
1109                                               "}' without matching '\\begin{" +
1110                                               name + "}'");
1111                                 else if (name != environments_.back())
1112                                         error("'\\end{" + name +
1113                                               "}' does not match '\\begin{" +
1114                                               environments_.back() + "}'");
1115                                 else {
1116                                         environments_.pop_back();
1117                                         // Delete empty last row in matrix
1118                                         // like insets.
1119                                         // If you abuse InsetMathGrid for
1120                                         // non-matrix like structures you
1121                                         // probably need to refine this test.
1122                                         // Right now we only have to test for
1123                                         // single line hull insets.
1124                                         if (grid.nrows() > 1)
1125                                                 delEmptyLastRow(grid);
1126                                         return;
1127                                 }
1128                         } else
1129                                 error("found 'end' unexpectedly");
1130                 }
1131
1132                 else if (t.cs() == ")") {
1133                         if (flags & FLAG_SIMPLE2)
1134                                 return;
1135                         error("found '\\)' unexpectedly");
1136                 }
1137
1138                 else if (t.cs() == "]") {
1139                         if (flags & FLAG_EQUATION)
1140                                 return;
1141                         error("found '\\]' unexpectedly");
1142                 }
1143
1144                 else if (t.cs() == "\\") {
1145                         if (flags & FLAG_ALIGN)
1146                                 return;
1147                         bool added = false;
1148                         if (nextToken().asInput() == "*") {
1149                                 getToken();
1150                                 added = addRow(grid, cellrow, docstring(), false);
1151                         } else if (good())
1152                                 added = addRow(grid, cellrow, getArg('[', ']'));
1153                         else
1154                                 error("missing token after \\\\");
1155                         if (added) {
1156                                 cellcol = 0;
1157                                 if (grid.asHullInset())
1158                                         grid.asHullInset()->numbered(
1159                                                         cellrow, numbered);
1160                                 cell = &grid.cell(grid.index(cellrow,
1161                                                              cellcol));
1162                         }
1163                 }
1164
1165 #if 0
1166                 else if (t.cs() == "multicolumn") {
1167                         // extract column count and insert dummy cells
1168                         MathData count;
1169                         parse(count, FLAG_ITEM, mode);
1170                         int cols = 1;
1171                         if (!extractNumber(count, cols)) {
1172                                 lyxerr << " can't extract number of cells from " << count << endl;
1173                         }
1174                         // resize the table if necessary
1175                         for (int i = 0; i < cols; ++i) {
1176                                 if (addCol(grid, cellcol)) {
1177                                         cell = &grid.cell(grid.index(
1178                                                         cellrow, cellcol));
1179                                         // mark this as dummy
1180                                         grid.cellinfo(grid.index(
1181                                                 cellrow, cellcol)).dummy_ = true;
1182                                 }
1183                         }
1184                         // the last cell is the real thing, not a dummy
1185                         grid.cellinfo(grid.index(cellrow, cellcol)).dummy_ = false;
1186
1187                         // read special alignment
1188                         MathData align;
1189                         parse(align, FLAG_ITEM, mode);
1190                         //grid.cellinfo(grid.index(cellrow, cellcol)).align_ = extractString(align);
1191
1192                         // parse the remaining contents into the "real" cell
1193                         parse(*cell, FLAG_ITEM, mode);
1194                 }
1195 #endif
1196
1197                 else if (t.cs() == "limits")
1198                         limits = 1;
1199
1200                 else if (t.cs() == "nolimits")
1201                         limits = -1;
1202
1203                 else if (t.cs() == "nonumber") {
1204                         if (grid.asHullInset())
1205                                 grid.asHullInset()->numbered(cellrow, false);
1206                 }
1207
1208                 else if (t.cs() == "number") {
1209                         if (grid.asHullInset())
1210                                 grid.asHullInset()->numbered(cellrow, true);
1211                 }
1212
1213                 else if (t.cs() == "hline") {
1214                         grid.rowinfo(cellrow).lines_ ++;
1215                 }
1216
1217                 else if (t.cs() == "sqrt") {
1218                         MathData ar;
1219                         parse(ar, FLAG_OPTION, mode);
1220                         if (ar.size()) {
1221                                 cell->push_back(MathAtom(new InsetMathRoot));
1222                                 cell->back().nucleus()->cell(0) = ar;
1223                                 parse(cell->back().nucleus()->cell(1), FLAG_ITEM, mode);
1224                         } else {
1225                                 cell->push_back(MathAtom(new InsetMathSqrt));
1226                                 parse(cell->back().nucleus()->cell(0), FLAG_ITEM, mode);
1227                         }
1228                 }
1229
1230                 else if (t.cs() == "unit") {
1231                         // Allowed formats \unit[val]{unit}
1232                         MathData ar;
1233                         parse(ar, FLAG_OPTION, mode);
1234                         if (ar.size()) {
1235                                 cell->push_back(MathAtom(new InsetMathFrac(InsetMathFrac::UNIT)));
1236                                 cell->back().nucleus()->cell(0) = ar;
1237                                 parse(cell->back().nucleus()->cell(1), FLAG_ITEM, mode);
1238                         } else {
1239                                 cell->push_back(MathAtom(new InsetMathFrac(InsetMathFrac::UNIT, 1)));
1240                                 parse(cell->back().nucleus()->cell(0), FLAG_ITEM, mode);
1241                         }
1242                 }
1243                 else if (t.cs() == "unitfrac") {
1244                         // Here allowed formats are \unitfrac[val]{num}{denom}
1245                         MathData ar;
1246                         parse(ar, FLAG_OPTION, mode);
1247                         if (ar.size()) {
1248                                 cell->push_back(MathAtom(new InsetMathFrac(InsetMathFrac::UNITFRAC, 3)));
1249                                 cell->back().nucleus()->cell(2) = ar;
1250                         } else {
1251                                 cell->push_back(MathAtom(new InsetMathFrac(InsetMathFrac::UNITFRAC)));
1252                         }
1253                         parse(cell->back().nucleus()->cell(0), FLAG_ITEM, mode);
1254                         parse(cell->back().nucleus()->cell(1), FLAG_ITEM, mode);
1255                 }
1256
1257                 else if (t.cs() == "xrightarrow" || t.cs() == "xleftarrow") {
1258                         cell->push_back(createInsetMath(t.cs()));
1259                         parse(cell->back().nucleus()->cell(1), FLAG_OPTION, mode);
1260                         parse(cell->back().nucleus()->cell(0), FLAG_ITEM, mode);
1261                 }
1262
1263                 else if (t.cs() == "ref" || t.cs() == "prettyref" ||
1264                                 t.cs() == "pageref" || t.cs() == "vpageref" || t.cs() == "vref") {
1265                         cell->push_back(MathAtom(new InsetMathRef(t.cs())));
1266                         parse(cell->back().nucleus()->cell(1), FLAG_OPTION, mode);
1267                         parse(cell->back().nucleus()->cell(0), FLAG_ITEM, mode);
1268                 }
1269
1270                 else if (t.cs() == "left") {
1271                         skipSpaces();
1272                         Token const & tl = getToken();
1273                         // \| and \Vert are equivalent, and InsetMathDelim
1274                         // can't handle \|
1275                         // FIXME: fix this in InsetMathDelim itself!
1276                         docstring const l = tl.cs() == "|" ? from_ascii("Vert") : tl.asString();
1277                         MathData ar;
1278                         parse(ar, FLAG_RIGHT, mode);
1279                         if (!good())
1280                                 break;
1281                         skipSpaces();
1282                         Token const & tr = getToken();
1283                         docstring const r = tr.cs() == "|" ? from_ascii("Vert") : tr.asString();
1284                         cell->push_back(MathAtom(new InsetMathDelim(l, r, ar)));
1285                 }
1286
1287                 else if (t.cs() == "right") {
1288                         if (flags & FLAG_RIGHT)
1289                                 return;
1290                         //lyxerr << "got so far: '" << cell << "'" << endl;
1291                         error("Unmatched right delimiter");
1292                         return;
1293                 }
1294
1295                 else if (t.cs() == "begin") {
1296                         docstring const name = getArg('{', '}');
1297                         environments_.push_back(name);
1298
1299                         if (name == "array" || name == "subarray") {
1300                                 docstring const valign = parse_verbatim_option() + 'c';
1301                                 docstring const halign = parse_verbatim_item();
1302                                 cell->push_back(MathAtom(new InsetMathArray(name,
1303                                         InsetMathGrid::guessColumns(halign), 1, (char)valign[0], halign)));
1304                                 parse2(cell->back(), FLAG_END, mode, false);
1305                         }
1306
1307                         else if (name == "tabular") {
1308                                 docstring const valign = parse_verbatim_option() + 'c';
1309                                 docstring const halign = parse_verbatim_item();
1310                                 cell->push_back(MathAtom(new InsetMathTabular(name,
1311                                         InsetMathGrid::guessColumns(halign), 1, (char)valign[0], halign)));
1312                                 parse2(cell->back(), FLAG_END, InsetMath::TEXT_MODE, false);
1313                         }
1314
1315                         else if (name == "split" || name == "cases") {
1316                                 cell->push_back(createInsetMath(name));
1317                                 parse2(cell->back(), FLAG_END, mode, false);
1318                         }
1319
1320                         else if (name == "alignedat") {
1321                                 docstring const valign = parse_verbatim_option() + 'c';
1322                                 // ignore this for a while
1323                                 getArg('{', '}');
1324                                 cell->push_back(MathAtom(new InsetMathSplit(name, (char)valign[0])));
1325                                 parse2(cell->back(), FLAG_END, mode, false);
1326                         }
1327
1328                         else if (name == "math") {
1329                                 cell->push_back(MathAtom(new InsetMathHull(hullSimple)));
1330                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, true);
1331                         }
1332
1333                         else if (name == "equation" || name == "equation*"
1334                                         || name == "displaymath") {
1335                                 cell->push_back(MathAtom(new InsetMathHull(hullEquation)));
1336                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, (name == "equation"));
1337                         }
1338
1339                         else if (name == "eqnarray" || name == "eqnarray*") {
1340                                 cell->push_back(MathAtom(new InsetMathHull(hullEqnArray)));
1341                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, !stared(name));
1342                         }
1343
1344                         else if (name == "align" || name == "align*") {
1345                                 cell->push_back(MathAtom(new InsetMathHull(hullAlign)));
1346                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, !stared(name));
1347                         }
1348
1349                         else if (name == "flalign" || name == "flalign*") {
1350                                 cell->push_back(MathAtom(new InsetMathHull(hullFlAlign)));
1351                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, !stared(name));
1352                         }
1353
1354                         else if (name == "alignat" || name == "alignat*") {
1355                                 // ignore this for a while
1356                                 getArg('{', '}');
1357                                 cell->push_back(MathAtom(new InsetMathHull(hullAlignAt)));
1358                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, !stared(name));
1359                         }
1360
1361                         else if (name == "xalignat" || name == "xalignat*") {
1362                                 // ignore this for a while
1363                                 getArg('{', '}');
1364                                 cell->push_back(MathAtom(new InsetMathHull(hullXAlignAt)));
1365                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, !stared(name));
1366                         }
1367
1368                         else if (name == "xxalignat") {
1369                                 // ignore this for a while
1370                                 getArg('{', '}');
1371                                 cell->push_back(MathAtom(new InsetMathHull(hullXXAlignAt)));
1372                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, !stared(name));
1373                         }
1374
1375                         else if (name == "multline" || name == "multline*") {
1376                                 cell->push_back(MathAtom(new InsetMathHull(hullMultline)));
1377                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, !stared(name));
1378                         }
1379
1380                         else if (name == "gather" || name == "gather*") {
1381                                 cell->push_back(MathAtom(new InsetMathHull(hullGather)));
1382                                 parse2(cell->back(), FLAG_END, InsetMath::MATH_MODE, !stared(name));
1383                         }
1384
1385                         else if (latexkeys const * l = in_word_set(name)) {
1386                                 if (l->inset == "matrix") {
1387                                         cell->push_back(createInsetMath(name));
1388                                         parse2(cell->back(), FLAG_END, mode, false);
1389                                 } else if (l->inset == "split") {
1390                                         docstring const valign = parse_verbatim_option() + 'c';
1391                                         cell->push_back(MathAtom(new InsetMathSplit(name, (char)valign[0])));
1392                                         parse2(cell->back(), FLAG_END, mode, false);
1393                                 } else {
1394                                         dump();
1395                                         lyxerr << "found math environment `" << to_utf8(name)
1396                                                << "' in symbols file with unsupported inset `"
1397                                                << to_utf8(l->inset) << "'." << endl;
1398                                         // create generic environment inset
1399                                         cell->push_back(MathAtom(new InsetMathEnv(name)));
1400                                         parse(cell->back().nucleus()->cell(0), FLAG_END, mode);
1401                                 }
1402                         }
1403
1404                         else {
1405                                 dump();
1406                                 lyxerr << "found unknown math environment '" << to_utf8(name)
1407                                         << "'" << endl;
1408                                 // create generic environment inset
1409                                 cell->push_back(MathAtom(new InsetMathEnv(name)));
1410                                 parse(cell->back().nucleus()->cell(0), FLAG_END, mode);
1411                         }
1412                 }
1413
1414                 else if (t.cs() == "kern") {
1415                         // FIXME: A hack...
1416                         docstring s;
1417                         while (true) {
1418                                 Token const & t = getToken();
1419                                 if (!good()) {
1420                                         putback();
1421                                         break;
1422                                 }
1423                                 s += t.character();
1424                                 if (isValidLength(to_utf8(s)))
1425                                         break;
1426                         }
1427                         cell->push_back(MathAtom(new InsetMathKern(s)));
1428                 }
1429
1430                 else if (t.cs() == "label") {
1431                         // FIXME: This is swallowed in inline formulas
1432                         docstring label = parse_verbatim_item();
1433                         MathData ar;
1434                         asArray(label, ar);
1435                         if (grid.asHullInset()) {
1436                                 grid.asHullInset()->label(cellrow, label);
1437                         } else {
1438                                 cell->push_back(createInsetMath(t.cs()));
1439                                 cell->push_back(MathAtom(new InsetMathBrace(ar)));
1440                         }
1441                 }
1442
1443                 else if (t.cs() == "choose" || t.cs() == "over"
1444                                 || t.cs() == "atop" || t.cs() == "brace"
1445                                 || t.cs() == "brack") {
1446                         MathAtom at = createInsetMath(t.cs());
1447                         at.nucleus()->cell(0) = *cell;
1448                         cell->clear();
1449                         parse(at.nucleus()->cell(1), flags, mode);
1450                         cell->push_back(at);
1451                         return;
1452                 }
1453
1454                 else if (t.cs() == "color") {
1455                         docstring const color = parse_verbatim_item();
1456                         cell->push_back(MathAtom(new InsetMathColor(true, color)));
1457                         parse(cell->back().nucleus()->cell(0), flags, mode);
1458                         return;
1459                 }
1460
1461                 else if (t.cs() == "textcolor") {
1462                         docstring const color = parse_verbatim_item();
1463                         cell->push_back(MathAtom(new InsetMathColor(false, color)));
1464                         parse(cell->back().nucleus()->cell(0), FLAG_ITEM, InsetMath::TEXT_MODE);
1465                 }
1466
1467                 else if (t.cs() == "normalcolor") {
1468                         cell->push_back(createInsetMath(t.cs()));
1469                         parse(cell->back().nucleus()->cell(0), flags, mode);
1470                         return;
1471                 }
1472
1473                 else if (t.cs() == "substack") {
1474                         cell->push_back(createInsetMath(t.cs()));
1475                         parse2(cell->back(), FLAG_ITEM, mode, false);
1476                 }
1477
1478                 else if (t.cs() == "xymatrix") {
1479                         odocstringstream os;
1480                         while (good() && nextToken().cat() != catBegin)
1481                                 os << getToken().asInput();
1482                         cell->push_back(createInsetMath(t.cs() + os.str()));
1483                         parse2(cell->back(), FLAG_ITEM, mode, false);
1484                 }
1485
1486                 else if (t.cs() == "framebox" || t.cs() == "makebox") {
1487                         cell->push_back(createInsetMath(t.cs()));
1488                         parse(cell->back().nucleus()->cell(0), FLAG_OPTION, InsetMath::TEXT_MODE);
1489                         parse(cell->back().nucleus()->cell(1), FLAG_OPTION, InsetMath::TEXT_MODE);
1490                         parse(cell->back().nucleus()->cell(2), FLAG_ITEM, InsetMath::TEXT_MODE);
1491                 }
1492
1493                 else if (t.cs() == "tag") {
1494                         if (nextToken().character() == '*') {
1495                                 getToken();
1496                                 cell->push_back(createInsetMath(t.cs() + '*'));
1497                         } else
1498                                 cell->push_back(createInsetMath(t.cs()));
1499                         parse(cell->back().nucleus()->cell(0), FLAG_ITEM, InsetMath::TEXT_MODE);
1500                 }
1501
1502 #if 0
1503                 else if (t.cs() == "infer") {
1504                         MathData ar;
1505                         parse(ar, FLAG_OPTION, mode);
1506                         cell->push_back(createInsetMath(t.cs()));
1507                         parse2(cell->back(), FLAG_ITEM, mode, false);
1508                 }
1509
1510                 // Disabled
1511                 else if (1 && t.cs() == "ar") {
1512                         auto_ptr<InsetMathXYArrow> p(new InsetMathXYArrow);
1513                         // try to read target
1514                         parse(p->cell(0), FLAG_OTPTION, mode);
1515                         // try to read label
1516                         if (nextToken().cat() == catSuper || nextToken().cat() == catSub) {
1517                                 p->up_ = nextToken().cat() == catSuper;
1518                                 getToken();
1519                                 parse(p->cell(1), FLAG_ITEM, mode);
1520                                 //lyxerr << "read label: " << p->cell(1) << endl;
1521                         }
1522
1523                         cell->push_back(MathAtom(p.release()));
1524                         //lyxerr << "read cell: " << cell << endl;
1525                 }
1526 #endif
1527
1528                 else if (t.cs().size()) {
1529                         latexkeys const * l = in_word_set(t.cs());
1530                         if (l) {
1531                                 if (l->inset == "big") {
1532                                         skipSpaces();
1533                                         docstring const delim = getToken().asInput();
1534                                         if (InsetMathBig::isBigInsetDelim(delim))
1535                                                 cell->push_back(MathAtom(
1536                                                         new InsetMathBig(t.cs(), delim)));
1537                                         else {
1538                                                 cell->push_back(createInsetMath(t.cs()));
1539                                                 putback();
1540                                         }
1541                                 }
1542
1543                                 else if (l->inset == "font") {
1544                                         cell->push_back(createInsetMath(t.cs()));
1545                                         parse(cell->back().nucleus()->cell(0),
1546                                                 FLAG_ITEM, asMode(mode, l->extra));
1547                                 }
1548
1549                                 else if (l->inset == "oldfont") {
1550                                         cell->push_back(createInsetMath(t.cs()));
1551                                         parse(cell->back().nucleus()->cell(0),
1552                                                 flags | FLAG_ALIGN, asMode(mode, l->extra));
1553                                         if (prevToken().cat() != catAlign &&
1554                                             prevToken().cs() != "\\")
1555                                                 return;
1556                                         putback();
1557                                 }
1558
1559                                 else if (l->inset == "style") {
1560                                         cell->push_back(createInsetMath(t.cs()));
1561                                         parse(cell->back().nucleus()->cell(0),
1562                                                 flags | FLAG_ALIGN, mode);
1563                                         if (prevToken().cat() != catAlign &&
1564                                             prevToken().cs() != "\\")
1565                                                 return;
1566                                         putback();
1567                                 }
1568
1569                                 else {
1570                                         MathAtom at = createInsetMath(t.cs());
1571                                         for (InsetMath::idx_type i = 0; i < at->nargs(); ++i)
1572                                                 parse(at.nucleus()->cell(i),
1573                                                         FLAG_ITEM, asMode(mode, l->extra));
1574                                         cell->push_back(at);
1575                                 }
1576                         }
1577
1578                         else {
1579                                 MathAtom at = createInsetMath(t.cs());
1580                                 InsetMath::mode_type m = mode;
1581                                 //if (m == InsetMath::UNDECIDED_MODE)
1582                                 //lyxerr << "default creation: m1: " << m << endl;
1583                                 if (at->currentMode() != InsetMath::UNDECIDED_MODE)
1584                                         m = at->currentMode();
1585                                 //lyxerr << "default creation: m2: " << m << endl;
1586                                 InsetMath::idx_type start = 0;
1587                                 // this fails on \bigg[...\bigg]
1588                                 //MathData opt;
1589                                 //parse(opt, FLAG_OPTION, InsetMath::VERBATIM_MODE);
1590                                 //if (opt.size()) {
1591                                 //      start = 1;
1592                                 //      at.nucleus()->cell(0) = opt;
1593                                 //}
1594                                 for (InsetMath::idx_type i = start; i < at->nargs(); ++i) {
1595                                         parse(at.nucleus()->cell(i), FLAG_ITEM, m);
1596                                         skipSpaces();
1597                                 }
1598                                 cell->push_back(at);
1599                         }
1600                 }
1601
1602
1603                 if (flags & FLAG_LEAVE) {
1604                         flags &= ~FLAG_LEAVE;
1605                         break;
1606                 }
1607         }
1608 }
1609
1610
1611
1612 } // anonymous namespace
1613
1614
1615 void mathed_parse_cell(MathData & ar, docstring const & str)
1616 {
1617         Parser(str).parse(ar, 0, InsetMath::MATH_MODE);
1618 }
1619
1620
1621 void mathed_parse_cell(MathData & ar, istream & is)
1622 {
1623         Parser(is).parse(ar, 0, InsetMath::MATH_MODE);
1624 }
1625
1626
1627 bool mathed_parse_normal(MathAtom & t, docstring const & str)
1628 {
1629         return Parser(str).parse(t);
1630 }
1631
1632
1633 bool mathed_parse_normal(MathAtom & t, Lexer & lex)
1634 {
1635         return Parser(lex).parse(t);
1636 }
1637
1638
1639 void mathed_parse_normal(InsetMathGrid & grid, docstring const & str)
1640 {
1641         Parser(str).parse1(grid, 0, InsetMath::MATH_MODE, false);
1642 }
1643
1644
1645 void initParser()
1646 {
1647         fill(theCatcode, theCatcode + 128, catOther);
1648         fill(theCatcode + 'a', theCatcode + 'z' + 1, catLetter);
1649         fill(theCatcode + 'A', theCatcode + 'Z' + 1, catLetter);
1650
1651         theCatcode[int('\\')] = catEscape;
1652         theCatcode[int('{')]  = catBegin;
1653         theCatcode[int('}')]  = catEnd;
1654         theCatcode[int('$')]  = catMath;
1655         theCatcode[int('&')]  = catAlign;
1656         theCatcode[int('\n')] = catNewline;
1657         theCatcode[int('#')]  = catParameter;
1658         theCatcode[int('^')]  = catSuper;
1659         theCatcode[int('_')]  = catSub;
1660         theCatcode[int(0x7f)] = catIgnore;
1661         theCatcode[int(' ')]  = catSpace;
1662         theCatcode[int('\t')] = catSpace;
1663         theCatcode[int('\r')] = catNewline;
1664         theCatcode[int('~')]  = catActive;
1665         theCatcode[int('%')]  = catComment;
1666 }
1667
1668
1669 } // namespace lyx