CALS tables: base implementation of row separators on the new code from XHTML.

[features.git] / src / lyxfind.cpp
diff --git a/src/lyxfind.cpp b/src/lyxfind.cpp

index 004e10b51ed043fc4423f87d861ee8c7e78a3ce6..53058ddace7f247fceb0448e6a75c663f1ca393e 100644 (file)
--- a/src/lyxfind.cpp
+++ b/src/lyxfind.cpp
@@ -106,6 +106,8 @@ class IgnoreFormats {
         ///
         void setIgnoreDeleted(bool value);
         ///
+       bool getNonContent() const { return searchNonContent_; }
+       ///
         void setIgnoreFormat(string const & type, bool value, bool fromUser = true);
  
  private:
@@ -132,6 +134,8 @@ private:
         bool userSelectedIgnoreLanguage_ = false;
         ///
         bool ignoreDeleted_ = true;
+       ///
+       bool searchNonContent_ = true;
  };
  
  void IgnoreFormats::setIgnoreFormat(string const & type, bool value, bool fromUser)
@@ -177,6 +181,9 @@ void IgnoreFormats::setIgnoreFormat(string const & type, bool value, bool fromUs
         else if (type == "deleted") {
                 ignoreDeleted_ = value;
         }
+       else if (type == "non-output-content") {
+               searchNonContent_ = !value;
+       }
  }
  
  // The global variable that can be changed from outside
@@ -185,7 +192,7 @@ IgnoreFormats ignoreFormats;
  
  void setIgnoreFormat(string const & type, bool value, bool fromUser)
  {
-  ignoreFormats.setIgnoreFormat(type, value, fromUser);
+       ignoreFormats.setIgnoreFormat(type, value, fromUser);
  }
  
  
@@ -823,16 +830,22 @@ string string2regex(string in)
         return temp2;
  }
  
+static void buildAccentsMap();
+
  string correctRegex(string t, bool withformat)
  {
         /* Convert \backslash => \
          * and \{, \}, \[, \] => {, }, [, ]
          */
         string s("");
-       regex wordre("(\\\\)*(\\\\((backslash|mathcircumflex) ?|[\\[\\]\\{\\}]))");
+       regex wordre("(\\\\)*(\\\\(([A-Za-z]+|[\\{\\}])( |\\{\\})?|[\\[\\]\\{\\}]))");
         size_t lastpos = 0;
         smatch sub;
         bool backslashed = false;
+       if (accents.empty())
+               buildAccentsMap();
+
+       //LYXERR0("correctRegex input '" << t << "'");
         for (sregex_iterator it(t.begin(), t.end(), wordre), end; it != end; ++it) {
                 sub = *it;
                 string replace;
@@ -842,9 +855,8 @@ string correctRegex(string t, bool withformat)
                 else {
                         if (sub.str(4) == "backslash") {
                                 replace = "\\";
-                               if (withformat) {
+                               {
                                         // transforms '\backslash \{' into '\{'
-                                       // and '\{' into '{'
                                         string next = t.substr(sub.position(2) + sub.str(2).length(), 2);
                                         if ((next == "\\{") || (next == "\\}")) {
                                                 replace = "";
@@ -856,17 +868,40 @@ string correctRegex(string t, bool withformat)
                                 replace = "^";
                         else if (backslashed) {
                                 backslashed = false;
-                               if (withformat && (sub.str(3) == "{"))
-                                       replace = accents["braceleft"];
-                               else if (withformat && (sub.str(3) == "}"))
-                                       replace = accents["braceright"];
+                               if (withformat) {
+                                       if (sub.str(3) == "{")
+                                               replace = accents["braceleft"];
+                                       else if (sub.str(3) == "}")
+                                               replace = accents["braceright"];
+                                       else {
+                                               // else part should not exist
+                                               LASSERT(1, /**/);
+                                       }
+                               }
                                 else {
-                                       // else part should not exist
-                                       LASSERT(1, /**/);
+                                       if (sub.str(3) == "{")
+                                               replace = "\\{";
+                                       else if (sub.str(3) == "}")
+                                               replace = "\\}";
+                                       else {
+                                               // else part should not exist
+                                               LASSERT(1, /**/);
+                                       }
+                               }
+                       }
+                       else if (sub.str(4) == "{") // transforms '\{' into '{'
+                               replace = "{";
+                       else if (sub.str(4) == "}")
+                                replace = "}";
+                       else {
+                               AccentsIterator it_ac = accents.find(sub.str(4));
+                               if (it_ac == accents.end()) {
+                                       replace = sub.str(2);
+                               }
+                               else {
+                                       replace = it_ac->second;
                                 }
                         }
-                       else
-                               replace = sub.str(3);
                 }
                 if (lastpos < (size_t) sub.position(2))
                         s += t.substr(lastpos, sub.position(2) - lastpos);
@@ -877,6 +912,7 @@ string correctRegex(string t, bool withformat)
                 return t;
         else if (lastpos < t.length())
                 s += t.substr(lastpos, t.length() - lastpos);
+       //LYXERR0("correctRegex output '" << s << "'");
         return s;
  }
  
@@ -898,7 +934,7 @@ string escape_for_regex(string s, bool withformat)
                         if (lastpos == s.size())
                                 break;
                 }
-               size_t end_pos = s.find("\\endregexp{}}", regex_pos + 8);
+               size_t end_pos = s.find("\\endregexp", regex_pos + 8);
                 result += correctRegex(s.substr(regex_pos + 8, end_pos -(regex_pos + 8)), withformat);
                 lastpos = end_pos + 13;
         }
@@ -935,7 +971,7 @@ public:
         int pos_len;
         int searched_size;
         vector <string> result = vector <string>();
-       MatchResult(int len = 0): match_len(len),match_prefix(0),match2end(0), pos(0),leadsize(0),pos_len(-1),searched_size(0) {};
+       MatchResult(int len = 0): match_len(len),match_prefix(0),match2end(0), pos(0),leadsize(0),pos_len(-1),searched_size(0) {}
  };
  
  static MatchResult::range interpretMatch(MatchResult &oldres, MatchResult &newres)
@@ -1001,7 +1037,7 @@ private:
          ** @todo Normalization should also expand macros, if the corresponding
          ** search option was checked.
          **/
-       string normalize(docstring const & s) const;
+       string normalize(docstring const & s, bool ignore_fomat) const;
         // normalized string to search
         string par_as_string;
         // regular expression to use for searching
@@ -1059,6 +1095,9 @@ static docstring buffer_to_latex(Buffer & buffer)
                 runparams.for_searchAdv = OutputParams::SearchWithoutDeleted;
         else
                 runparams.for_searchAdv = OutputParams::SearchWithDeleted;
+       if (ignoreFormats.getNonContent()) {
+               runparams.for_searchAdv |= OutputParams::SearchNonOutput;
+       }
         pit_type const endpit = buffer.paragraphs().size();
         for (pit_type pit = 0; pit != endpit; ++pit) {
                 TeXOnePar(buffer, buffer.text(), pit, os, runparams);
@@ -1067,6 +1106,52 @@ static docstring buffer_to_latex(Buffer & buffer)
         return ods.str();
  }
  
+static string latexNamesToUtf8(docstring strIn)
+{
+       string addtmp = to_utf8(strIn);
+       static regex const rmAcc("(\\\\)*("
+                                        "\\\\([A-Za-z]+\\{.\\})"       // e.g. "ddot{A}" == sub.str(3)
+                                       "|\\\\([A-Za-z]+)( |\\{\\})?"   // e.g. "LyX", "LyX{}", "LyX " == sub.str(4)
+                                       ")"
+                               );
+       size_t lastpos = 0;
+       smatch sub;
+       string replace;
+       string add("");
+       if (accents.empty())
+               buildAccentsMap();
+       for (sregex_iterator it_add(addtmp.begin(), addtmp.end(), rmAcc), end; it_add != end; ++it_add) {
+               sub = *it_add;
+               if ((sub.position(2) - sub.position(0)) % 2 == 1) {
+                       continue;
+               }
+               else {
+                       string key;
+                       if (sub.length(3) > 0)
+                               key = sub.str(3);
+                       else
+                               key = sub.str(4);
+                       AccentsIterator it_ac = accents.find(key);
+                       if (it_ac == accents.end()) {
+                               replace = sub.str(2);
+                       }
+                       else {
+                               replace = it_ac->second;
+                       }
+               }
+               if (lastpos < (size_t) sub.position(2))
+                       add += addtmp.substr(lastpos, sub.position(2) - lastpos);
+               add += replace;
+               lastpos = sub.position(2) + sub.length(2);
+       }
+       if (lastpos == 0)
+               add = addtmp;
+       else if (addtmp.length() > lastpos)
+               add += addtmp.substr(lastpos, addtmp.length() - lastpos);
+       LYXERR(Debug::FIND, "Adding to search string: '"
+                       << add << "'");
+       return add;
+}
  
  static docstring stringifySearchBuffer(Buffer & buffer, FindAndReplaceOptions const & opt)
  {
@@ -1088,19 +1173,20 @@ static docstring stringifySearchBuffer(Buffer & buffer, FindAndReplaceOptions co
                 else {
                         runparams.for_searchAdv = OutputParams::SearchWithDeleted;
                 }
+               if (ignoreFormats.getNonContent()) {
+                       runparams.for_searchAdv |= OutputParams::SearchNonOutput;
+               }
+               string t("");
                 for (pos_type pit = pos_type(0); pit < (pos_type)buffer.paragraphs().size(); ++pit) {
                         Paragraph const & par = buffer.paragraphs().at(pit);
+                       string add = latexNamesToUtf8(par.asString(pos_type(0), par.size(),
+                                                               option,
+                                                               &runparams));
                         LYXERR(Debug::FIND, "Adding to search string: '"
-                              << par.asString(pos_type(0), par.size(),
-                                              option,
-                                              &runparams)
-                              << "'");
-                       str += par.asString(pos_type(0), par.size(),
-                                           option,
-                                           &runparams);
+                               << add << "'");
+                       t += add;
                 }
                 // Even in ignore-format we have to remove "\text{}, \lyxmathsym{}" parts
-               string t = to_utf8(str);
                 while (regex_replace(t, t, "\\\\(text|lyxmathsym|ensuremath)\\{([^\\}]*)\\}", "$2"));
                 str = from_utf8(t);
         }
@@ -1248,7 +1334,7 @@ class KeyInfo {
  
  class Border {
   public:
- Border(int l=0, int u=0) : low(l), upper(u) {};
+ Border(int l=0, int u=0) : low(l), upper(u) {}
    int low;
    int upper;
  };
@@ -1507,12 +1593,18 @@ static void addAccents(string latex_in, string unicode_out)
  
  void static fillMissingUnicodesymbols()
  {
+  addAccents("\\pounds", getutf8(0x00a3));
+  addAccents("\\textsterling", getutf8(0x00a3));
    addAccents("\\textyen", getutf8(0x00a5));
    addAccents("\\yen", getutf8(0x00a5));
    addAccents("\\textsection", getutf8(0x00a7));
    addAccents("\\mathsection", getutf8(0x00a7));
+  addAccents("\\textcopyright", getutf8(0x00a9));
+  addAccents("\\copyright", getutf8(0x00a9));
    addAccents("\\textlnot", getutf8(0x00ac));
    addAccents("\\neg", getutf8(0x00ac));
+  addAccents("\\textregistered", getutf8(0x00ae));
+  addAccents("\\circledR", getutf8(0x00ae));
    addAccents("\\textpm", getutf8(0x00b1));
    addAccents("\\pm", getutf8(0x00b1));
    addAccents("\\textparagraph", getutf8(0x00b6));
@@ -1520,12 +1612,39 @@ void static fillMissingUnicodesymbols()
    addAccents("\\textperiodcentered", getutf8(0x00b7));
    addAccents("\\texttimes", getutf8(0x00d7));
    addAccents("\\times", getutf8(0x00d7));
+  addAccents("\\O", getutf8(0x00d8));
    addAccents("\\dh", getutf8(0x00f0));
    addAccents("\\eth", getutf8(0x00f0));
    addAccents("\\textdiv", getutf8(0x00f7));
    addAccents("\\div", getutf8(0x00f7));
    addAccents("\\o", getutf8(0x00f8));
+  addAccents("\\textcrlambda", getutf8(0x019b));
    addAccents("\\j", getutf8(0x0237));
+  addAccents("\\textrevepsilon", getutf8(0x025c));
+  addAccents("\\textbaru", getutf8(0x0289));
+  addAccents("\\textquoteleft", getutf8(0x02bb));
+  addAccents("\\textGamma", getutf8(0x0393));
+  addAccents("\\Gamma", getutf8(0x0393));
+  addAccents("\\textDelta", getutf8(0x0394));
+  addAccents("\\Delta", getutf8(0x0394));
+  addAccents("\\textTheta", getutf8(0x0398));
+  addAccents("\\Theta", getutf8(0x0398));
+  addAccents("\\textLambda", getutf8(0x039b));
+  addAccents("\\Lambda", getutf8(0x039b));
+  addAccents("\\textXi", getutf8(0x039e));
+  addAccents("\\Xi", getutf8(0x039e));
+  addAccents("\\textPi", getutf8(0x03a0));
+  addAccents("\\Pi", getutf8(0x03a0));
+  addAccents("\\textSigma", getutf8(0x03a3));
+  addAccents("\\Sigma", getutf8(0x03a3));
+  addAccents("\\textUpsilon", getutf8(0x03a5));
+  addAccents("\\Upsilon", getutf8(0x03a5));
+  addAccents("\\textPhi", getutf8(0x03a6));
+  addAccents("\\Phi", getutf8(0x03a6));
+  addAccents("\\textPsi", getutf8(0x03a8));
+  addAccents("\\Psi", getutf8(0x03a8));
+  addAccents("\\textOmega", getutf8(0x03a9));
+  addAccents("\\Omega", getutf8(0x03a9));
    addAccents("\\textalpha", getutf8(0x03b1));
    addAccents("\\alpha", getutf8(0x03b1));
    addAccents("\\textbeta", getutf8(0x03b2));
@@ -1584,6 +1703,30 @@ void static fillMissingUnicodesymbols()
    addAccents("\\gimel", getutf8(0x05d2));
    addAccents("\\hebdalet", getutf8(0x05d3));
    addAccents("\\daleth", getutf8(0x05d3));
+  addAccents("\\hebhe", getutf8(0x05d4));
+  addAccents("\\hebvav", getutf8(0x05d5));
+  addAccents("\\hebzayin", getutf8(0x05d6));
+  addAccents("\\hebhet", getutf8(0x05d7));
+  addAccents("\\hebtet", getutf8(0x05d8));
+  addAccents("\\hebyod", getutf8(0x05d9));
+  addAccents("\\hebfinalkaf", getutf8(0x05da));
+  addAccents("\\hebkaf", getutf8(0x05db));
+  addAccents("\\heblamed", getutf8(0x05dc));
+  addAccents("\\hebfinalmem", getutf8(0x05dd));
+  addAccents("\\hebmem", getutf8(0x05de));
+  addAccents("\\hebfinalnun", getutf8(0x05df));
+  addAccents("\\hebnun", getutf8(0x05e0));
+  addAccents("\\hebsamekh", getutf8(0x05e1));
+  addAccents("\\hebayin", getutf8(0x05e2));
+  addAccents("\\hebfinalpe", getutf8(0x05e3));
+  addAccents("\\hebpe", getutf8(0x05e4));
+  addAccents("\\hebfinaltsadi", getutf8(0x05e5));
+  addAccents("\\hebtsadi", getutf8(0x05e6));
+  addAccents("\\hebqof", getutf8(0x05e7));
+  addAccents("\\hebresh", getutf8(0x05e8));
+  addAccents("\\hebshin", getutf8(0x05e9));
+  addAccents("\\hebtav", getutf8(0x05ea));
+
    // Thai characters
    addAccents("\\thaiKoKai", getutf8(0x0e01));
    addAccents("\\thaiKhoKhai", getutf8(0x0e02));
@@ -1671,19 +1814,25 @@ void static fillMissingUnicodesymbols()
    addAccents("\\thainine", getutf8(0x0e59));
    addAccents("\\thaiAngkhankhu", getutf8(0x0e5a));
    addAccents("\\thaiKhomut", getutf8(0x0e5b));
-
    addAccents("\\dag", getutf8(0x2020));
    addAccents("\\dagger", getutf8(0x2020));
+  addAccents("\\textdagger", getutf8(0x2020));
    addAccents("\\ddag", getutf8(0x2021));
    addAccents("\\ddagger", getutf8(0x2021));
+  addAccents("\\textdaggerdbl", getutf8(0x2021));
    addAccents("\\textbullet", getutf8(0x2022));
    addAccents("\\bullet", getutf8(0x2022));
    addAccents("\\dots", getutf8(0x2026));
    addAccents("\\ldots", getutf8(0x2026));
+  addAccents("\\textellipsis", getutf8(0x2026));
    addAccents("\\textasciiacute", getutf8(0x2032));
    addAccents("\\prime", getutf8(0x2032));
+  addAccents("\\textacutedbl", getutf8(0x2033));
+  addAccents("\\dprime", getutf8(0x2033));
    addAccents("\\textasciigrave", getutf8(0x2035));
    addAccents("\\backprime", getutf8(0x2035));
+  addAccents("\\textsubcircum{ }", getutf8(0x2038));
+  addAccents("\\caretinsert", getutf8(0x2038));
    addAccents("\\textasteriskcentered", getutf8(0x204e));
    addAccents("\\ast", getutf8(0x204e));
    addAccents("\\textmho", getutf8(0x2127));
@@ -1704,6 +1853,14 @@ void static fillMissingUnicodesymbols()
    addAccents("\\surd", getutf8(0x221a));
    addAccents("\\textbigcircle", getutf8(0x25ef));
    addAccents("\\bigcirc", getutf8(0x25ef));
+  addAccents("\\FiveStar", getutf8(0x2605));
+  addAccents("\\bigstar", getutf8(0x2605));
+  addAccents("\\FiveStarOpen", getutf8(0x2606));
+  addAccents("\\bigwhitestar", getutf8(0x2606));
+  addAccents("\\Checkmark", getutf8(0x2713));
+  addAccents("\\checkmark", getutf8(0x2713));
+  addAccents("\\CrossMaltese", getutf8(0x2720));
+  addAccents("\\maltese", getutf8(0x2720));
    addAccents("\\textlangle", getutf8(0x27e8));
    addAccents("\\langle", getutf8(0x27e8));
    addAccents("\\textrangle", getutf8(0x27e9));
@@ -1749,8 +1906,8 @@ static void buildAccentsMap()
    accents["backslash LaTeXe"]        = getutf8(0xf0013);
    accents["backslash lyxarrow"]      = getutf8(0xf0020);
    accents["ddot{\\imath}"] = "ï";
-  buildaccent("ddot", "aAeEhHiIioOtuUwWxXyY",
-                      "Ã¤Ã\84Ã«Ã\8bá¸§á¸¦Ã¯Ã\8fÃ¯Ã¶Ã\96áº\97Ã¼Ã\9cáº\85áº\84áº\8dáº\8cÃ¿Å¸");      // umlaut
+  buildaccent("ddot", "aAeEhHiIoOtuUwWxXyY",
+                      "Ã¤Ã\84Ã«Ã\8bá¸§á¸¦Ã¯Ã\8fÃ¶Ã\96áº\97Ã¼Ã\9cáº\85áº\84áº\8dáº\8cÃ¿Å¸");        // umlaut
    buildaccent("dot|.", "aAbBcCdDeEfFGghHIimMnNoOpPrRsStTwWxXyYzZ",
                         "ȧȦḃḂċĊḋḊėĖḟḞĠġḣḢİİṁṀṅṄȯȮṗṖṙṘṡṠṫṪẇẆẋẊẏẎżŻ");  // dot{i} can only happen if ignoring case, but there is no lowercase of 'İ'
    accents["acute{\\imath}"] = "í";
@@ -1795,8 +1952,8 @@ static void buildAccentsMap()
    accents["textdoublegrave{\\i}"] = "ȉ";
    buildaccent("dgrave|textdoublegrave", "AaEeIiOoRrUu",
                                          "ȀȁȄȅȈȉȌȍȐȑȔȕ"); // double grave
-  accents["rcap{\\imath}"] = "È\89";
-  accents["textroundcap{\\i}"] = "È\89";
+  accents["rcap{\\imath}"] = "È\8b";
+  accents["textroundcap{\\i}"] = "È\8b";
    buildaccent("rcap|textroundcap", "AaEeIiOoRrUu",
                                     "ȂȃȆȇȊȋȎȏȒȓȖȗ"); // inverted breve
    buildaccent("slashed", "oO",
@@ -1813,9 +1970,13 @@ void Intervall::removeAccents()
  {
    if (accents.empty())
      buildAccentsMap();
-  static regex const accre("\\\\(([\\S]|grave|breve|ddot|dot|acute|dacute|mathring|check|hat|bar|tilde|subdot|ogonek|"
-         "cedilla|subring|textsubring|subhat|textsubcircum|subtilde|textsubtilde|dgrave|textdoublegrave|rcap|textroundcap|slashed)\\{[^\\{\\}]+\\}"
-      "|((i|imath|jmath|cdot|[a-z]+space)|((backslash )?([lL]y[xX]|[tT]e[xX]|[lL]a[tT]e[xX]e?|lyxarrow))|(brace|guillemot)(left|right)|textasciicircum|mathcircumflex|sim)(?![a-zA-Z]))");
+  static regex const accre("\\\\("
+      "([\\S]|[A-Za-z]+)\\{[^\\{\\}]+\\}"
+      "|("
+        "(backslash ([lL]y[xX]|[tT]e[xX]|[lL]a[tT]e[xX]e?|lyxarrow))"
+       "|[A-Za-z]+"
+      ")"
+      "(?![a-zA-Z]))");
    smatch sub;
    for (sregex_iterator itacc(par.begin(), par.end(), accre), end; itacc != end; ++itacc) {
      sub = *itacc;
@@ -1920,7 +2081,7 @@ class LatexInfo {
      buildKeys(isPatternString);
      entries_ = vector<KeyInfo>();
      buildEntries(isPatternString);
-  };
+  }
    int getFirstKey() {
      entidx_ = 0;
      if (entries_.empty()) {
@@ -1941,7 +2102,7 @@ class LatexInfo {
          return -1;
      }
      return 0;
-  };
+  }
    int getNextKey() {
      entidx_++;
      if (int(entries_.size()) > entidx_) {
@@ -1950,7 +2111,7 @@ class LatexInfo {
      else {
        return -1;
      }
-  };
+  }
    bool setNextKey(int idx) {
      if ((idx == entidx_) && (entidx_ >= 0)) {
        entidx_--;
@@ -1958,7 +2119,7 @@ class LatexInfo {
      }
      else
        return false;
-  };
+  }
    int find(int start, KeyInfo::KeyType keytype) const {
      if (start < 0)
        return -1;
@@ -1969,20 +2130,20 @@ class LatexInfo {
        tmpIdx++;
      }
      return -1;
-  };
+  }
    int process(ostringstream & os, KeyInfo const & actual);
    int dispatch(ostringstream & os, int previousStart, KeyInfo & actual);
-  // string show(int lastpos) { return interval.show(lastpos);};
-  int nextNotIgnored(int start) { return interval_.nextNotIgnored(start);};
+  // string show(int lastpos) { return interval.show(lastpos);}
+  int nextNotIgnored(int start) { return interval_.nextNotIgnored(start);}
    KeyInfo &getKeyInfo(int keyinfo) {
      static KeyInfo invalidInfo = KeyInfo();
      if ((keyinfo < 0) || ( keyinfo >= int(entries_.size())))
        return invalidInfo;
      else
        return entries_[keyinfo];
-  };
-  void setForDefaultLang(KeyInfo const & defLang) {interval_.setForDefaultLang(defLang);};
-  void addIntervall(int low, int up) { interval_.addIntervall(low, up); };
+  }
+  void setForDefaultLang(KeyInfo const & defLang) {interval_.setForDefaultLang(defLang);}
+  void addIntervall(int low, int up) { interval_.addIntervall(low, up); }
  };
  
  
@@ -2036,7 +2197,7 @@ class MathInfo {
      m.mathSize = m.mathEnd - m.mathStart;
      entries_.push_back(m);
    }
-  bool empty() const { return entries_.empty(); };
+  bool empty() const { return entries_.empty(); }
    size_t getEndPos() const {
      if (entries_.empty() || (actualIdx_ >= entries_.size())) {
        return 0;
@@ -2071,7 +2232,7 @@ class MathInfo {
      }
      return entries_[actualIdx_].mathSize;
    }
-  void incrEntry() { actualIdx_++; };
+  void incrEntry() { actualIdx_++; }
  };
  
  void LatexInfo::buildEntries(bool isPatternString)
@@ -2868,7 +3029,7 @@ int LatexInfo::dispatch(ostringstream &os, int previousStart, KeyInfo &actual)
        // Remove the key with all parameters and following spaces
        size_t pos;
        size_t start;
-      if (interval_.par[actual._dataEnd-1] == ' ')
+      if (interval_.par[actual._dataEnd-1] == ' ' || interval_.par[actual._dataEnd-1] == '}')
          start = actual._dataEnd;
        else
          start = actual._dataEnd+1;
@@ -3304,9 +3465,9 @@ void MatchStringAdv::CreateRegexp(FindAndReplaceOptions const & opt, string rege
                                 balanced--;
                                 if (balanced < 0)
                                         break;
-                               }
-                               skip = 1;
                         }
+                       skip = 1;
+               }
                 if (balanced != 0) {
                         regexIsValid = false;
                         regexError = "Unbalanced curly brackets in regexp \"" + regexp_str + "\"";
@@ -3375,7 +3536,7 @@ MatchStringAdv::MatchStringAdv(lyx::Buffer & buf, FindAndReplaceOptions & opt)
                 previous_single_replace = true;
         }
         // When using regexp, braces are hacked already by escape_for_regex()
-       par_as_string = normalize(ds);
+       par_as_string = normalize(ds, opt.ignoreformat);
         open_braces = 0;
         close_wildcards = 0;
  
@@ -3423,6 +3584,7 @@ MatchStringAdv::MatchStringAdv(lyx::Buffer & buf, FindAndReplaceOptions & opt)
                 string lead_as_regexp;
                 if (lead_size > 0) {
                         lead_as_regexp = string2regex(par_as_string.substr(0, lead_size));
+                       (void)regex_replace(par_as_string_nolead, par_as_string_nolead, "\\$$", "");
                         (void)regex_replace(par_as_string_nolead, par_as_string_nolead, "}$", "");
                         par_as_string = par_as_string_nolead;
                         LYXERR(Debug::FIND, "lead_as_regexp is '" << lead_as_regexp << "'");
@@ -3498,7 +3660,7 @@ MatchResult MatchStringAdv::findAux(DocIterator const & cur, int len, bool at_be
  
         docstring docstr = stringifyFromForSearch(opt, cur, len);
         string str;
-       str = normalize(docstr);
+       str = normalize(docstr, opt.ignoreformat);
         if (!opt.ignoreformat) {
                 str = correctlanguagesetting(str, false, !opt.ignoreformat);
                 // remove closing '}' and '\n' to allow for use of '$' in regex
@@ -3692,16 +3854,22 @@ static bool simple_replace(string &t, string from, string to)
  }
  #endif
  
-string MatchStringAdv::normalize(docstring const & s) const
+string MatchStringAdv::normalize(docstring const & s, bool ignore_format) const
  {
         string t;
         t = lyx::to_utf8(s);
         // Remove \n at begin
         while (!t.empty() && t[0] == '\n')
                 t = t.substr(1);
-       // Remove \n at end
-       while (!t.empty() && t[t.size() - 1] == '\n')
-               t = t.substr(0, t.size() - 1);
+       // Remove [%]*\n at end
+       while (!t.empty() && t[t.size() - 1] == '\n') {
+               int count = 1;
+               if (!ignore_format) {
+                       while ((t.size() > 1 + count) && (t[t.size() - 1 - count] == '%'))
+                               count++;
+               }
+               t = t.substr(0, t.size() - count);
+       }
         size_t pos;
         // Handle all other '\n'
         while ((pos = t.find("\n")) != string::npos) {
@@ -3714,13 +3882,24 @@ string MatchStringAdv::normalize(docstring const & s) const
                                 t.replace(pos-2, 3, "");
                         }
                 }
-               else if (!isAlnumASCII(t[pos+1]) || !isAlnumASCII(t[pos-1])) {
-                       // '\n' adjacent to non-alpha-numerics, discard
-                       t.replace(pos, 1, "");
-               }
                 else {
-                       // Replace all other \n with spaces
-                       t.replace(pos, 1, " ");
+                       if (!isAlnumASCII(t[pos+1]) || !isAlnumASCII(t[pos-1])) {
+                               // '\n' adjacent to non-alpha-numerics, discard
+                               t.replace(pos, 1, "");
+                       }
+                       else {
+                               // Replace all other \n with spaces
+                               t.replace(pos, 1, " ");
+                       }
+                       if (!ignore_format) {
+                               int count = 0;
+                               while ((pos > count + 1) && (t[pos - 1 -count] == '%')) {
+                                       count++;
+                               }
+                               if (count > 0) {
+                                       t.replace(pos - count, count, "");
+                               }
+                       }
                 }
         }
         // Remove stale empty \emph{}, \textbf{} and similar blocks from latexify
@@ -3761,11 +3940,14 @@ docstring stringifyFromCursor(DocIterator const & cur, int len)
                 else {
                         runparams.for_searchAdv = OutputParams::SearchWithDeleted;
                 }
+               if (ignoreFormats.getNonContent()) {
+                       runparams.for_searchAdv |= OutputParams::SearchNonOutput;
+               }
                 LYXERR(Debug::FIND, "Stringifying with cur: "
-                      << cur << ", from pos: " << cur.pos() << ", end: " << end);
-               return par.asString(cur.pos(), end,
-                       option,
-                       &runparams);
+                       << cur << ", from pos: " << cur.pos() << ", end: " << end);
+               return from_utf8(latexNamesToUtf8(par.asString(cur.pos(), end,
+                                                               option,
+                                                               &runparams)));
         } else if (cur.inMathed()) {
                 CursorSlice cs = cur.top();
                 MathData md = cs.cell();
@@ -3774,10 +3956,9 @@ docstring stringifyFromCursor(DocIterator const & cur, int len)
                          ? md.end()
                          : md.begin() + cs.pos() + len );
                 MathData md2;
-               for (MathData::const_iterator it = md.begin() + cs.pos();
-                    it != it_end; ++it)
+               for (MathData::const_iterator it = md.begin() + cs.pos(); it != it_end; ++it)
                         md2.push_back(*it);
-               docstring s = asString(md2);
+               docstring s = from_utf8(latexNamesToUtf8(asString(md2)));
                 LYXERR(Debug::FIND, "Stringified math: '" << s << "'");
                 return s;
         }
@@ -3785,7 +3966,6 @@ docstring stringifyFromCursor(DocIterator const & cur, int len)
         return docstring();
  }
  
-
  /** Computes the LaTeX export of buf starting from cur and ending len positions
   * after cur, if len is positive, or at the paragraph or innermost inset end
   * if len is -1.
@@ -3814,6 +3994,9 @@ docstring latexifyFromCursor(DocIterator const & cur, int len)
         else {
                 runparams.for_searchAdv = OutputParams::SearchWithDeleted;
         }
+       if (ignoreFormats.getNonContent()) {
+               runparams.for_searchAdv |= OutputParams::SearchNonOutput;
+       }
  
         if (cur.inTexted()) {
                 // @TODO what about searching beyond/across paragraph breaks ?
@@ -3990,14 +4173,14 @@ MatchResult findAdvFinalize(DocIterator & cur, MatchStringAdv const & match, Mat
               max_match.match_len = actual_match_len;
                maxl = len;
                if (maxl - minl < 4)
-                len = (int)((maxl + minl)/2);
+                len = (maxl + minl)/2;
                else
-                len = (int)(minl + (maxl - minl + 3)/4);
+                len = minl + (maxl - minl + 3)/4;
              }
              else {
                // (actual_match_len < max_match.match_len)
                minl = len + 1;
-              len = (int)((maxl + minl)/2);
+              len = (maxl + minl)/2;
              }
            }
           len = minl;