From cd4ae51f7787046e8852abc4b339b5191c6adc16 Mon Sep 17 00:00:00 2001
From: Kornel Benko <kornel@lyx.org>
Date: Mon, 4 Mar 2019 14:05:44 +0100
Subject: [PATCH] FindAdv: Amend b21c8b21: Expand the list of handled Latin
 characters

1.) Added handling for 'breve' and 'grave' accents
2.) Corrected handling of 'i'-accents (both \hat{i} _and_ \hat{\imath} are now
	accepted) because of problems when ignoring case
3.) Spaces: Changed some indents in source
---
 src/lyxfind.cpp | 68 ++++++++++++++++++++++++++++---------------------
 1 file changed, 39 insertions(+), 29 deletions(-)

diff --git a/src/lyxfind.cpp b/src/lyxfind.cpp
index f3cbd153a3..eeb4829510 100644
--- a/src/lyxfind.cpp
+++ b/src/lyxfind.cpp
@@ -1262,19 +1262,22 @@ static void buildaccent(string n, string param, string values)
       string key = name + "{" + param[i] + "}";
       // get the corresponding utf8-value
       if ((values[start] & 0xc0) != 0xc0) {
-	// should not happen, utf8 encoding starts at least with 11xxxxxx
-	start++;
-	continue;
+        // should not happen, utf8 encoding starts at least with 11xxxxxx
+        start++;
+        continue;
       }
       for (int j = 1; ;j++) {
-	if (start + j >= values.size())
-	  break;
-	if ((values[start+j] & 0xc0) == 0xc0) {
-	  // This is the first byte of following utf8 char
-	  accents[key] = values.substr(start, j);
-	  start += j;
-	  break;
-	}
+        if (start + j >= values.size()) {
+          accents[key] = values.substr(start, j);
+          start = values.size() - 1;
+          break;
+        }
+        else if ((values[start+j] & 0xc0) == 0xc0) {
+          // This is the first byte of following utf8 char
+          accents[key] = values.substr(start, j);
+          start += j;
+          break;
+        }
       }
     }
   }
@@ -1283,32 +1286,39 @@ static void buildaccent(string n, string param, string values)
 static void buildAccentsMap()
 {
   accents["imath"] = "Ä±";
+  accents["i"] = "Ä±";
   accents["jmath"] = "È·";
   accents["lyxmathsym{Ã}"] = "Ã";
   accents["ddot{\\imath}"] = "Ã¯";
-  buildaccent("ddot", "aAeEIoOuUyY",
-                      "Ã¤ÃÃ«ÃÃÃ¶ÃÃ¼ÃÃ¿Å¸");	// umlaut
-  buildaccent("dot|.", "cCeEgGIzZaAoObBdDfFyY",
-                     "ÄÄÄÄÄ¡Ä Ä°Å¼Å»È§È¦È¯È®á¸á¸á¸á¸á¸á¸áºáº");
+  buildaccent("ddot", "aAeEiIoOuUyY",
+                      "Ã¤ÃÃ«ÃÃ¯ÃÃ¶ÃÃ¼ÃÃ¿Å¸");	// umlaut
+  buildaccent("dot|.", "cCeEgGiIzZaAoObBdDfFyY",
+                       "ÄÄÄÄÄ¡Ä iÄ°Å¼Å»È§È¦È¯È®á¸á¸á¸á¸á¸á¸áºáº");
   accents["acute{\\imath}"] = "Ã­";
-  buildaccent("acute", "aAcCeElLoOnNrRsSuUyYzZI",
-                       "Ã¡ÃÄÄÃ©ÃÄºÄ¹Ã³ÃÅÅÅÅÅÅÃºÃÃ½ÃÅºÅ¹Ã");
+  buildaccent("acute", "aAcCeElLoOnNrRsSuUyYzZiI",
+                       "Ã¡ÃÄÄÃ©ÃÄºÄ¹Ã³ÃÅÅÅÅÅÅÃºÃÃ½ÃÅºÅ¹Ã­Ã");
   buildaccent("dacute|H|h", "oOuU", "ÅÅÅ±Å°");	// double acute
   buildaccent("mathring|r", "uU", "Å¯Å®");
   accents["check{\\imath}"] = "Ç";
   accents["check{\\jmath}"] = "Ç°";
-  buildaccent("check|v", "cCdDaAeEIoOuUgGkKhHlLnNrRsSTzZ",
-                         "ÄÄÄÄÇÇÄÄÇÇÇÇÇÇ§Ç¦Ç©Ç¨ÈÈÄ¾Ä½ÅÅÅÅÅ¡Å Å¤Å¾Å½");	// caron
+  buildaccent("check|v", "cCdDaAeEiIoOuUgGkKhHlLnNrRsSTzZ",
+                         "ÄÄÄÄÇÇÄÄÇÇÇÇÇÇÇ§Ç¦Ç©Ç¨ÈÈÄ¾Ä½ÅÅÅÅÅ¡Å Å¤Å¾Å½");	// caron
   accents["hat{\\imath}"] = "Ã®";
   accents["hat{\\jmath}"] = "Äµ";
-  buildaccent("hat|^", "aAeEiIcCgGhHJsSwWyYzZoOuU",
-                       "Ã¢ÃÃªÃÃ®ÃÄÄÄÄÄ¥Ä¤Ä´ÅÅÅµÅ´Å·Å¶áºáºÃ´ÃÃ»Ã");	// circ
+  buildaccent("hat|^", "aAeEiIcCgGhHjJsSwWyYzZoOuU",
+                       "Ã¢ÃÃªÃÃ®ÃÄÄÄÄÄ¥Ä¤ÄµÄ´ÅÅÅµÅ´Å·Å¶áºáºÃ´ÃÃ»Ã");	// circ
   accents["bar{\\imath}"] = "Ä«";
-  buildaccent("bar|=", "aAeEIoOuUyY",
-                       "ÄÄÄÄÄªÅÅÅ«ÅªÈ³È²");	// macron
+  buildaccent("bar|=", "aAeEiIoOuUyY",
+                       "ÄÄÄÄÄ«ÄªÅÅÅ«ÅªÈ³È²");	// macron
   accents["tilde{\\imath}"] = "Ä©";
-  buildaccent("tilde", "aAnNoOIuU",
-                       "Ã£ÃÃ±ÃÃµÃÄ¨Å©Å¨");	// tilde
+  buildaccent("tilde", "aAnNoOiIuU",
+                       "Ã£ÃÃ±ÃÃµÃÄ©Ä¨Å©Å¨");	// tilde
+  accents["breve{\\imath}"] = "Ä­";
+  buildaccent("breve|u", "aAeEgGiIoOuU",
+                         "ÄÄÄÄÄÄÄ­Ä¬ÅÅÅ­Å¬");    // breve
+  accents["grave{\\imath}"] = "Ã¬";
+  buildaccent("grave|`", "aAeEiIoOuUnNwWyY",
+                         "Ã ÃÃ¨ÃÃ¬ÃÃ²ÃÃ¹ÃÇ¹Ç¸áºáºá»³á»²");                // grave
 }
 
 /*
@@ -1319,7 +1329,7 @@ void Intervall::removeAccents()
 {
   if (accents.empty())
     buildAccentsMap();
-  static regex const accre("\\\\((lyxmathsym|ddot|dot|.|acute|dacute|h|H|mathring|r|check|v|hat|^|bar|=|tilde)\\{[^\\{\\}]+\\}|imath|jmath)");
+  static regex const accre("\\\\((.|grave|breve|u|lyxmathsym|ddot|dot|acute|dacute|mathring|check|hat|bar|tilde)\\{[^\\{\\}]+\\}|i|imath|jmath)");
   smatch sub;
   for (sregex_iterator itacc(par.begin(), par.end(), accre), end; itacc != end; ++itacc) {
     sub = *itacc;
@@ -2569,14 +2579,14 @@ static string correctlanguagesetting(string par, bool isPatternString, bool with
 		missed = 0;
 		if (withformat) {
 			regex_f = identifyFeatures(result);
-                        string features = "";
+			string features = "";
 			for (auto it = regex_f.cbegin(); it != regex_f.cend(); ++it) {
 				string a = it->first;
 				regex_with_format = true;
-                                features += " " + a;
+				features += " " + a;
 				// LYXERR0("Identified regex format:" << a);
 			}
-                        LYXERR(Debug::FIND, "Identified Features" << features);
+			LYXERR(Debug::FIND, "Identified Features" << features);
 
 		}
 	} else if (regex_with_format) {
-- 
2.39.2