3 * This file is part of LyX, the document processor.
4 * Licence details can be found in the file COPYING.
9 * Full author contact details are available in file CREDITS.
18 #include "LayoutFile.h"
21 #include "TextClass.h"
23 #include "support/convert.h"
24 #include "support/FileName.h"
25 #include "support/filetools.h"
26 #include "support/lstrings.h"
28 #include <boost/regex.hpp>
38 using namespace lyx::support;
// File-level state shared by the preamble helpers below.
44 // special columntypes
// Keyed by the column-type character; parse_preamble() stores one int per
// character here (e.g. 'D' -> 3) -- presumably an argument count, TODO confirm.
45 extern map<char, int> special_columns;
// Package name -> option strings recorded for that package by add_package().
47 map<string, vector<string> > used_packages;
49 // needed to handle encodings with babel
// Set to false by handle_package() when babel is given more than one option;
// checked again when the inputenc package is handled.
50 bool one_language = true;
52 // to avoid that the babel options overwrite the documentclass options
// Set to true by handle_opt() whenever it finds a matching option;
// parse_preamble() resets it to false right before looking for a language
// among the \documentclass options.
53 bool documentclass_language;
// Lookup tables of option/package names. They are passed to handle_opt(),
// delete_opt() and is_known(); handle_opt() and delete_opt() stop at a 0 entry.

// Language names looked for among babel and \documentclass options and
// as package names.
57 const char * const known_languages[] = { "afrikaans", "american", "arabic",
58 "austrian", "bahasa", "basque", "belarusian", "brazil", "breton", "british",
59 "bulgarian", "canadian", "canadien", "catalan", "croatian", "czech", "danish",
60 "dutch", "english", "esperanto", "estonian", "finnish", "francais", "french",
61 "frenchb", "frenchle", "frenchpro", "galician", "german", "germanb", "greek",
62 "hebrew", "icelandic", "irish", "italian", "lsorbian", "magyar", "naustrian",
63 "ngerman", "ngermanb", "norsk", "nynorsk", "polish", "portuges", "romanian",
64 "russian", "russianb", "scottish", "serbian", "slovak", "slovene", "spanish",
65 "swedish", "thai", "turkish", "ukraineb", "ukrainian", "usorbian", "welsh", 0};
67 // Note this when updating to lyxformat 305:
68 // bahasai, indonesian, and indon are equal to bahasa;
69 // malay and meyalu are equal to bahasam.
// Spelling variants of one language. When h_language (or a package name)
// matches one of these lists, the callers set h_language to a single name:
// "french", "german", "ngerman", "russian" or "ukrainian" respectively.
71 const char * const known_french_languages[] = {"french", "frenchb", "francais",
72 "frenchle", "frenchpro", 0};
73 const char * const known_german_languages[] = {"german", "germanb", 0};
74 const char * const known_ngerman_languages[] = {"ngerman", "ngermanb", 0};
75 const char * const known_russian_languages[] = {"russian", "russianb", 0};
76 const char * const known_ukrainian_languages[] = {"ukrainian", "ukraineb", 0};
// Font-size class options; parse_preamble() strips the "pt" suffix from the
// one it finds before storing it in h_paperfontsize.
78 char const * const known_fontsizes[] = { "10pt", "11pt", "12pt", 0 };
// Font package names, one list per font family (roman, sans, typewriter).
80 const char * const known_roman_fonts[] = { "ae", "bookman", "charter",
81 "cmr", "fourier", "lmodern", "mathpazo", "mathptmx", "newcent", 0};
83 const char * const known_sans_fonts[] = { "avant", "berasans", "cmbr", "cmss",
86 const char * const known_typewriter_fonts[] = { "beramono", "cmtl", "cmtt",
87 "courier", "lmtt", "luximono", "fourier", "lmodern", "mathpazo", "mathptmx",
// Paper-size options looked for in the \geometry argument.
90 const char * const known_paper_sizes[] = { "a3paper", "b3paper", "a4paper",
91 "b4paper", "a5paper", "b5paper", "executivepaper", "legalpaper",
// Paper-size options looked for among the \documentclass options.
94 const char * const known_class_paper_sizes[] = { "a4paper", "a5paper",
95 "executivepaper", "legalpaper", "letterpaper", 0};
// Margin keys searched for in the \geometry options ...
97 const char * const known_paper_margins[] = { "lmargin", "tmargin", "rmargin",
98 "bmargin", "headheight", "headsep", "footskip", "columnsep", 0};
// ... and the names written to h_margins for the keys that were found.
// Presumably index-aligned with known_paper_margins -- TODO confirm.
100 const char * const known_coded_paper_margins[] = { "leftmargin", "topmargin",
101 "rightmargin", "bottommargin", "headheight", "headsep", "footskip",
// Header state. Each h_* value starts with the default given here, may be
// overwritten while the preamble is parsed, and is written to the LyX header
// by end_preamble().

// Collected preamble text; end_preamble() emits it between \begin_preamble
// and \end_preamble when it is not empty.
105 ostringstream h_preamble;
106 string h_textclass = "article";
// Class options that were not consumed; only written when not empty.
107 string h_options = string();
108 string h_language = "english";
109 string h_inputencoding = "auto";
110 string h_font_roman = "default";
111 string h_font_sans = "default";
112 string h_font_typewriter = "default";
113 string h_font_default_family = "default";
114 string h_font_sc = "false";
115 string h_font_osf = "false";
// Font scale factors, stored as strings (see scale_as_percentage()).
116 string h_font_sf_scale = "100";
117 string h_font_tt_scale = "100";
118 string h_graphics = "default";
119 string h_paperfontsize = "default";
120 string h_spacing = "single";
121 string h_papersize = "default";
122 string h_use_geometry = "false";
123 string h_use_amsmath = "0";
124 string h_cite_engine = "basic";
125 string h_use_bibtopic = "false";
126 string h_paperorientation = "portrait";
127 string h_secnumdepth = "3";
128 string h_tocdepth = "3";
129 string h_paragraph_separation = "indent";
130 string h_defskip = "medskip";
131 string h_quotes_language = "english";
132 string h_papercolumns = "1";
// Left empty here; parse_preamble() fills it in at the end if still empty.
133 string h_papersides = string();
134 string h_paperpagestyle = "default";
135 string h_tracking_changes = "false";
136 string h_output_changes = "false";
// Accumulates "\<margin name> <value>\n" lines built from \geometry options.
137 string h_margins = "";
// Look for the entries of the 0-terminated list `what` in `opts`.
//   opts   - option strings to search
//   what   - 0-terminated array of known option names
//   target - presumably receives the matching option that occurs last in
//            `opts`; the assignment is not visible here -- TODO confirm
// Side effect: documentclass_language is set to true as soon as any entry of
// `what` is found, whichever list was passed in.
140 void handle_opt(vector<string> & opts, char const * const * what, string & target)
145 // the last language option is the document language (for babel and LyX)
146 // the last size option is the document font size
147 vector<string>::iterator it;
// Iterator used to compare where each match sits within `opts`.
148 vector<string>::iterator position = opts.begin();
149 for (; *what; ++what) {
150 it = find(opts.begin(), opts.end(), *what);
151 if (it != opts.end()) {
152 documentclass_language = true;
// Only a match at or after `position` is considered further.
153 if (it >= position) {
// Look up every entry of the 0-terminated list `what` in `opts`.
// According to the comment below, entries that are found are removed from
// `opts`; the removing statement itself is not visible here -- TODO confirm.
162 void delete_opt(vector<string> & opts, char const * const * what)
167 // remove found options from the list
168 // do this after handle_opt to avoid potential memory leaks and to be able
169 // to find in every case the last language option
170 vector<string>::iterator it;
171 for (; *what; ++what) {
172 it = find(opts.begin(), opts.end(), *what);
173 if (it != opts.end())
180 * Split a package options string (keyval format) into a vector.
182 * authorformat=smallcaps,
184 * titleformat=colonsep,
185 * bibformat={tabular,ibidem,numbered}
// Returns the options collected from `input` as a vector of trimmed strings.
187 vector<string> split_options(string const & input)
189 vector<string> options;
193 Token const & t = p.get_token();
// A "," token ends the current option: store it trimmed.
194 if (t.asInput() == ",") {
195 options.push_back(trim(option));
197 } else if (t.asInput() == "=") {
// A braced value following "=" is appended as one unit, braces included.
200 if (p.next_token().asInput() == "{")
201 option += '{' + p.getArg('{', '}') + '}';
// Space tokens are not copied into the option text.
202 } else if (t.cat() != catSpace)
203 option += t.asInput();
// Store the last option, the one not followed by a ",".
207 options.push_back(trim(option));
214 * Add package \p name with options \p options to used_packages.
215 * Remove options from \p options that we don't want to output.
// Record package `name` and its `options` in used_packages.
//   name    - package name, used as key of used_packages
//   options - in/out: appended to the stored list as given; for "jurabib"
//             the entries "natbiborder" and "jurabiborder" are afterwards
//             removed from the caller's vector
217 void add_package(string const & name, vector<string> & options)
219 // every package inherits the global options
// First time this package is seen: seed its list from the class options.
220 if (used_packages.find(name) == used_packages.end())
221 used_packages[name] = split_options(h_options);
223 vector<string> & v = used_packages[name];
// The stored list gets all options, including the ones removed below.
224 v.insert(v.end(), options.begin(), options.end());
225 if (name == "jurabib") {
226 // Don't output the order argument (see the cite command
227 // handling code in text.cpp).
// Two remove() passes move the surviving options to the front; the erase()
// then drops the leftover tail.
228 vector<string>::iterator end =
229 remove(options.begin(), options.end(), "natbiborder");
230 end = remove(options.begin(), end, "jurabiborder");
231 options.erase(end, options.end());
236 // Given a string like "scaled=0.9", return 0.9 * 100 as a string.
237 string const scale_as_percentage(string const & scale)
239 string::size_type pos = scale.find('=');
240 if (pos != string::npos) {
// Everything after the first '=' is taken as the numeric value.
241 string value = scale.substr(pos + 1);
243 return convert<string>(100 * convert<double>(value));
245 // If the input string didn't match our expectations,
246 // return the default value "100".
// Process one package taken from a \usepackage command.
//   name            - package name
//   opts            - the package's option string, as written
//   in_lyx_preamble - passed in by parse_preamble(); a package without special
//                     handling is copied to h_preamble only when this is false
// The package is recorded through add_package(); packages known here update
// the matching h_* header values. Options still present in `options` at the
// end are reported on cerr as ignored.
251 void handle_package(string const & name, string const & opts,
252 bool in_lyx_preamble)
254 vector<string> options = split_options(opts);
255 add_package(name, options);
// Roman fonts.
259 if (is_known(name, known_roman_fonts))
// Some packages are stored under a different font name than their own.
262 if (name == "fourier") {
263 h_font_roman = "utopia";
264 // when font uses real small capitals
265 if (opts == "expert")
268 if (name == "mathpazo")
269 h_font_roman = "palatino";
271 if (name == "mathptmx")
272 h_font_roman = "times";
// Sans serif fonts; the scale value is stored as a percentage string.
275 if (is_known(name, known_sans_fonts)) {
279 h_font_sf_scale = scale_as_percentage(scale);
// Typewriter fonts; the scale value is stored as a percentage string.
283 if (is_known(name, known_typewriter_fonts)) {
284 h_font_typewriter = name;
287 h_font_tt_scale = scale_as_percentage(scale);
290 // font uses old-style figures
294 else if (name == "amsmath" || name == "amssymb")
297 else if (name == "babel" && !opts.empty()) {
298 // check if more than one option was used - used later for inputenc
299 // in case inputenc is parsed before babel, set the encoding to auto
// True unless `options` holds exactly one element.
300 if (options.begin() != options.end() - 1) {
301 one_language = false;
302 h_inputencoding = "auto";
304 // only set the document language when there was not already one set
305 // via the documentclass options
306 // babel takes the last language given in the documentclass options
307 // as document language. If there is no such language option, the last
308 // option of its \usepackage call is used.
309 if (documentclass_language == false) {
310 handle_opt(options, known_languages, h_language);
311 delete_opt(options, known_languages);
// Collapse spelling variants to a single language name.
312 if (is_known(h_language, known_french_languages))
313 h_language = "french";
314 else if (is_known(h_language, known_german_languages))
315 h_language = "german";
316 else if (is_known(h_language, known_ngerman_languages))
317 h_language = "ngerman";
318 else if (is_known(h_language, known_russian_languages))
319 h_language = "russian";
320 else if (is_known(h_language, known_ukrainian_languages))
321 h_language = "ukrainian";
// The quotes language follows the document language.
322 h_quotes_language = h_language;
325 else if (name == "fontenc")
328 else if (name == "inputenc") {
329 // only set when there is not more than one inputenc option
330 // therefore check for the "," character
331 // also only set when there is not more than one babel language option
332 if (opts.find(",") == string::npos && one_language == true)
334 //change ascii to auto to be in the unicode range, see
335 //http://bugzilla.lyx.org/show_bug.cgi?id=4719
336 h_inputencoding = "auto";
338 h_inputencoding = opts;
341 else if (name == "makeidx")
344 else if (name == "verbatim")
347 else if (name == "color")
348 // with the following command this package is only loaded when needed for
349 // undefined colors, since we only support the predefined colors
350 h_preamble << "\\@ifundefined{definecolor}\n {\\usepackage{color}}{}\n";
352 else if (name == "graphicx")
355 else if (name == "setspace")
358 else if (name == "geometry")
359 ; // Ignore this, the geometry settings are made by the \geometry
360 // command. This command is handled below.
// The package itself is named after a language.
362 else if (is_known(name, known_languages)) {
363 if (is_known(name, known_french_languages))
364 h_language = "french";
365 else if (is_known(name, known_german_languages))
366 h_language = "german";
367 else if (is_known(name, known_ngerman_languages))
368 h_language = "ngerman";
369 else if (is_known(name, known_russian_languages))
370 h_language = "russian";
371 else if (is_known(name, known_ukrainian_languages))
372 h_language = "ukrainian";
375 h_quotes_language = h_language;
377 else if (name == "natbib") {
// "natbib_authoryear" is set first; the "numbers" option switches the
// engine to "natbib_numerical".
378 h_cite_engine = "natbib_authoryear";
379 vector<string>::iterator it =
380 find(options.begin(), options.end(), "authoryear");
381 if (it != options.end())
384 it = find(options.begin(), options.end(), "numbers");
385 if (it != options.end()) {
386 h_cite_engine = "natbib_numerical";
391 else if (name == "jurabib")
392 h_cite_engine = "jurabib";
// Any other package: copy the \usepackage command to the preamble, but
// only outside the LyX-generated part.
393 else if (!in_lyx_preamble) {
395 h_preamble << "\\usepackage{" << name << "}\n";
397 h_preamble << "\\usepackage[" << opts << "]{"
403 // We need to do something with the options...
404 if (!options.empty())
405 cerr << "Ignoring options '" << join(options, ",")
406 << "' of package " << name << '.' << endl;
// Write the LyX file header to `os` from the current h_* values.
//   os - output stream receiving the header
// The TextClass parameter is unnamed and therefore unused.
411 void end_preamble(ostream & os, TextClass const & /*textclass*/)
413 os << "#LyX file created by tex2lyx " << PACKAGE_VERSION << "\n"
414 << "\\lyxformat 247\n"
415 << "\\begin_document\n"
416 << "\\begin_header\n"
417 << "\\textclass " << h_textclass << "\n";
// The preamble block and the class options are written only when non-empty.
418 if (!h_preamble.str().empty())
419 os << "\\begin_preamble\n" << h_preamble.str() << "\n\\end_preamble\n";
420 if (!h_options.empty())
421 os << "\\options " << h_options << "\n";
// The remaining settings, one "\key value" line each.
422 os << "\\language " << h_language << "\n"
423 << "\\inputencoding " << h_inputencoding << "\n"
424 << "\\font_roman " << h_font_roman << "\n"
425 << "\\font_sans " << h_font_sans << "\n"
426 << "\\font_typewriter " << h_font_typewriter << "\n"
427 << "\\font_default_family " << h_font_default_family << "\n"
428 << "\\font_sc " << h_font_sc << "\n"
429 << "\\font_osf " << h_font_osf << "\n"
430 << "\\font_sf_scale " << h_font_sf_scale << "\n"
431 << "\\font_tt_scale " << h_font_tt_scale << "\n"
432 << "\\graphics " << h_graphics << "\n"
433 << "\\paperfontsize " << h_paperfontsize << "\n"
434 << "\\spacing " << h_spacing << "\n"
435 << "\\papersize " << h_papersize << "\n"
436 << "\\use_geometry " << h_use_geometry << "\n"
437 << "\\use_amsmath " << h_use_amsmath << "\n"
438 << "\\cite_engine " << h_cite_engine << "\n"
439 << "\\use_bibtopic " << h_use_bibtopic << "\n"
440 << "\\paperorientation " << h_paperorientation << "\n"
442 << "\\secnumdepth " << h_secnumdepth << "\n"
443 << "\\tocdepth " << h_tocdepth << "\n"
444 << "\\paragraph_separation " << h_paragraph_separation << "\n"
445 << "\\defskip " << h_defskip << "\n"
446 << "\\quotes_language " << h_quotes_language << "\n"
447 << "\\papercolumns " << h_papercolumns << "\n"
448 << "\\papersides " << h_papersides << "\n"
449 << "\\paperpagestyle " << h_paperpagestyle << "\n"
450 << "\\tracking_changes " << h_tracking_changes << "\n"
451 << "\\output_changes " << h_output_changes << "\n"
452 << "\\end_header\n\n"
454 // clear preamble for subdocuments
458 } // anonymous namespace
// Parse the LaTeX preamble read from `p` and write the LyX header to `os`.
//   p          - parser supplying the tokens
//   os         - receives the header written by end_preamble()
//   forceclass - when not empty, replaces the class named by \documentclass
//   tc         - loaded from the layout file found for the final text class
// Commands known here update the h_* header values; other material is
// copied to h_preamble, but only once in_lyx_preamble has become false.
460 void parse_preamble(Parser & p, ostream & os,
461 string const & forceclass, TeX2LyXDocClass & tc)
463 // initialize fixed types
464 special_columns['D'] = 3;
465 bool is_full_document = false;
466 bool is_lyx_file = false;
// Starts out true; cleared when the "User specified LaTeX commands" comment
// is seen (see the catComment branch).
467 bool in_lyx_preamble = true;
469 // determine whether this is a full document or a fragment for inclusion
470 // (a \documentclass command marks a full document)
471 Token const & t = p.get_token();
473 if (t.cat() == catEscape && t.cs() == "documentclass") {
474 is_full_document = true;
// Main loop: one token per iteration, only for full documents.
480 while (is_full_document && p.good()) {
481 Token const & t = p.get_token();
484 cerr << "t: " << t << "\n";
// Tokens of these categories are copied to the preamble as single
// characters once we are outside the LyX-generated part.
490 if (!in_lyx_preamble &&
491 (t.cat() == catLetter ||
492 t.cat() == catSuper ||
494 t.cat() == catOther ||
495 t.cat() == catMath ||
496 t.cat() == catActive ||
497 t.cat() == catBegin ||
499 t.cat() == catAlign ||
500 t.cat() == catParameter))
501 h_preamble << t.character();
// Spaces and newlines are copied as they were written.
503 else if (!in_lyx_preamble &&
504 (t.cat() == catSpace || t.cat() == catNewline))
505 h_preamble << t.asInput();
507 else if (t.cat() == catComment) {
508 // regex to parse comments
509 static regex const islyxfile("%% LyX .* created this file");
510 static regex const usercommands("User specified LaTeX commands");
512 string const comment = t.asInput();
513 cerr << "Seen comment: " << comment << std::endl;
515 if (regex_search(comment, sub, islyxfile))
518 && regex_search(comment, sub, usercommands))
519 in_lyx_preamble = false;
520 else if (!in_lyx_preamble)
521 h_preamble << t.asInput();
522 cerr << "lyx_file: " << is_lyx_file << ", lyx_preamble "
523 << in_lyx_preamble << std::endl;
526 else if (t.cs() == "pagestyle")
527 h_paperpagestyle = p.verbatim_item();
// \makeatletter / \makeatother: always update the catcode of '@'; the
// command is skipped in the output only when this is a LyX file, we are in
// its LyX-generated part, and '@' already has the requested catcode.
529 else if (t.cs() == "makeatletter") {
530 if (!is_lyx_file || !in_lyx_preamble
531 || p.getCatCode('@') != catLetter)
532 h_preamble << "\\makeatletter";
533 p.setCatCode('@', catLetter);
536 else if (t.cs() == "makeatother") {
537 if (!is_lyx_file || !in_lyx_preamble
538 || p.getCatCode('@') != catOther)
539 h_preamble << "\\makeatother";
540 p.setCatCode('@', catOther);
543 else if (t.cs() == "newcommand" || t.cs() == "renewcommand"
544 || t.cs() == "providecommand") {
546 if (p.next_token().character() == '*') {
550 string const name = p.verbatim_item();
551 string const opt1 = p.getOpt();
552 string const opt2 = p.getFullOpt();
553 string const body = p.verbatim_item();
// Redefinitions of the default font commands select the document fonts.
555 if (name == "\\rmdefault")
556 if (is_known(body, known_roman_fonts))
559 if (name == "\\sfdefault")
560 if (is_known(body, known_sans_fonts))
563 if (name == "\\ttdefault")
564 if (is_known(body, known_typewriter_fonts))
565 h_font_typewriter = body;
567 if (name == "\\familydefault") {
568 string family = body;
569 // remove leading "\"
570 h_font_default_family = family.erase(0,1);
572 // only non-lyxspecific stuff
573 if (!in_lyx_preamble) {
575 ss << '\\' << t.cs();
578 ss << '{' << name << '}' << opt1 << opt2
579 << '{' << body << "}";
580 h_preamble << ss.str();
582 // Add the command to the known commands
583 add_known_command(name, opt1, !opt2.empty());
// NOTE(review): `in_preamble` and `opts` are not declared in the visible
// part of this function -- confirm whether the next three lines are live code.
585 ostream & out = in_preamble ? h_preamble : os;
586 out << "\\" << t.cs() << "{" << name << "}"
587 << opts << "{" << body << "}";
592 else if (t.cs() == "documentclass") {
593 vector<string>::iterator it;
594 vector<string> opts = split_options(p.getArg('[', ']'));
595 handle_opt(opts, known_fontsizes, h_paperfontsize);
596 delete_opt(opts, known_fontsizes);
597 // delete "pt" at the end
// (erase(i) removes everything from the first "pt" onwards)
598 string::size_type i = h_paperfontsize.find("pt");
599 if (i != string::npos)
600 h_paperfontsize.erase(i);
601 // to avoid that the babel options overwrite the documentclass options
// Reset here because the font size lookup above may already have set it.
602 documentclass_language = false;
603 handle_opt(opts, known_languages, h_language);
604 delete_opt(opts, known_languages);
// Collapse spelling variants to a single language name.
605 if (is_known(h_language, known_french_languages))
606 h_language = "french";
607 else if (is_known(h_language, known_german_languages))
608 h_language = "german";
609 else if (is_known(h_language, known_ngerman_languages))
610 h_language = "ngerman";
611 else if (is_known(h_language, known_russian_languages))
612 h_language = "russian";
613 else if (is_known(h_language, known_ukrainian_languages))
614 h_language = "ukrainian";
615 h_quotes_language = h_language;
// Options that map directly onto header settings.
617 if ((it = find(opts.begin(), opts.end(), "landscape")) != opts.end()) {
618 h_paperorientation = "landscape";
622 if ((it = find(opts.begin(), opts.end(), "oneside"))
627 if ((it = find(opts.begin(), opts.end(), "twoside"))
633 if ((it = find(opts.begin(), opts.end(), "onecolumn"))
635 h_papercolumns = "1";
638 if ((it = find(opts.begin(), opts.end(), "twocolumn"))
640 h_papercolumns = "2";
644 // some size options are known to any document class, other sizes
645 // are handled by the \geometry command of the geometry package
646 handle_opt(opts, known_class_paper_sizes, h_papersize);
647 delete_opt(opts, known_class_paper_sizes);
648 // the remaining options
649 h_options = join(opts, ",");
650 h_textclass = p.getArg('{', '}');
653 else if (t.cs() == "usepackage") {
654 string const options = p.getArg('[', ']');
655 string const name = p.getArg('{', '}');
// NOTE(review): string::find() returns npos (non-zero) when there is no
// comma and 0 only for a leading comma, so `name.find(',')` is true for
// almost every name; `!= string::npos` was probably intended -- confirm.
656 if (options.empty() && name.find(',')) {
// Several packages in one command: handle each name without options.
657 vector<string> vecnames;
658 split(name, vecnames, ',');
659 vector<string>::const_iterator it = vecnames.begin();
660 vector<string>::const_iterator end = vecnames.end();
661 for (; it != end; ++it)
662 handle_package(trim(*it), string(),
665 handle_package(name, options, in_lyx_preamble);
669 else if (t.cs() == "newenvironment") {
670 string const name = p.getArg('{', '}');
672 ss << "\\newenvironment{" << name << "}";
// The two braced arguments are read and re-emitted verbatim.
675 ss << '{' << p.verbatim_item() << '}';
676 ss << '{' << p.verbatim_item() << '}';
677 if (!in_lyx_preamble)
678 h_preamble << ss.str();
681 else if (t.cs() == "def") {
682 string name = p.get_token().cs();
// Everything up to the next begin-group token is appended to the name.
683 while (p.next_token().cat() != catBegin)
684 name += p.get_token().asString();
685 if (!in_lyx_preamble)
686 h_preamble << "\\def\\" << name << '{'
687 << p.verbatim_item() << "}";
690 else if (t.cs() == "newcolumntype") {
691 string const name = p.getArg('{', '}');
694 string opts = p.getOpt();
// Skip the first character of the optional argument before reading it.
696 istringstream is(string(opts, 1));
// Register the column type under the first character of its name.
699 special_columns[name[0]] = nargs;
700 h_preamble << "\\newcolumntype{" << name << "}";
702 h_preamble << "[" << nargs << "]";
703 h_preamble << "{" << p.verbatim_item() << "}";
706 else if (t.cs() == "setcounter") {
707 string const name = p.getArg('{', '}');
708 string const content = p.getArg('{', '}');
709 if (name == "secnumdepth")
710 h_secnumdepth = content;
711 else if (name == "tocdepth")
712 h_tocdepth = content;
714 h_preamble << "\\setcounter{" << name << "}{" << content << "}";
717 else if (t.cs() == "setlength") {
718 string const name = p.verbatim_item();
719 string const content = p.verbatim_item();
720 // the paragraphs are only not indented when \parindent is set to zero
721 if (name == "\\parindent" && content != "") {
// Only the first character of the value is checked for '0'.
722 if (content[0] == '0')
723 h_paragraph_separation = "skip";
724 } else if (name == "\\parskip") {
725 if (content == "\\smallskipamount")
726 h_defskip = "smallskip";
727 else if (content == "\\medskipamount")
728 h_defskip = "medskip";
729 else if (content == "\\bigskipamount")
730 h_defskip = "bigskip";
734 h_preamble << "\\setlength{" << name << "}{" << content << "}";
737 else if (t.cs() == "onehalfspacing")
738 h_spacing = "onehalf";
740 else if (t.cs() == "doublespacing")
741 h_spacing = "double";
743 else if (t.cs() == "setstretch")
744 h_spacing = "other " + p.verbatim_item();
746 else if (t.cs() == "begin") {
747 string const name = p.getArg('{', '}');
748 if (name == "document")
750 h_preamble << "\\begin{" << name << "}";
753 else if (t.cs() == "geometry") {
754 h_use_geometry = "true";
755 vector<string> opts = split_options(p.getArg('{', '}'));
756 vector<string>::iterator it;
758 if ((it = find(opts.begin(), opts.end(), "landscape")) != opts.end()) {
759 h_paperorientation = "landscape";
763 handle_opt(opts, known_paper_sizes, h_papersize);
764 delete_opt(opts, known_paper_sizes);
766 char const * const * margin = known_paper_margins;
// For each known margin key, scan all options for one containing that key.
768 for (; *margin; ++margin) {
770 // search for the "=" in e.g. "lmargin=2cm" to get the value
771 for(size_t i = 0; i != opts.size(); i++) {
772 if (opts.at(i).find(*margin) != string::npos) {
773 string::size_type pos = opts.at(i).find("=");
774 string value = opts.at(i).substr(pos + 1);
// Store the value under the name from known_coded_paper_margins.
775 string name = known_coded_paper_margins[k];
776 h_margins += "\\" + name + " " + value + "\n";
782 else if (t.cs() == "jurabibsetup") {
783 vector<string> jurabibsetup =
784 split_options(p.getArg('{', '}'));
785 // add jurabibsetup to the jurabib package options
786 add_package("jurabib", jurabibsetup);
// add_package() removed the order options; re-emit whatever is left.
787 if (!jurabibsetup.empty()) {
788 h_preamble << "\\jurabibsetup{"
789 << join(jurabibsetup, ",") << '}';
// Any other control sequence is copied to the preamble outside the
// LyX-generated part.
793 else if (!t.cs().empty() && !in_lyx_preamble)
794 h_preamble << '\\' << t.cs();
798 // Force textclass if the user wanted it
799 if (!forceclass.empty())
800 h_textclass = forceclass;
// In noweb mode the class name gets a "literate-" prefix unless present.
801 if (noweb_mode && !prefixIs(h_textclass, "literate-"))
802 h_textclass.insert(0, "literate-");
803 FileName layoutfilename = libFileSearch("layouts", h_textclass, "layout");
804 if (layoutfilename.empty()) {
805 cerr << "Error: Could not find layout file for textclass \"" << h_textclass << "\"." << endl;
808 tc.read(layoutfilename);
// h_papersides still has its empty default: take the value built in `ss`.
809 if (h_papersides.empty()) {
812 h_papersides = ss.str();
814 end_preamble(os, tc);