Fix build with GNU libstdc++ C++11 ABI

[lyx.git] / src / support / lstrings.cpp
diff --git a/src/support/lstrings.cpp b/src/support/lstrings.cpp
index 7fbe6730f8a1595553b0afaa77f6452b57fed301..ea1ba59984a62ba7e92910d94530a930e3baf0ef 100644
--- a/src/support/lstrings.cpp
+++ b/src/support/lstrings.cpp
@@ -15,17 +15,17 @@
  #include "support/lstrings.h"
  
  #include "support/convert.h"
+#include "support/debug.h"
  #include "support/qstring_helpers.h"
-#include "support/textutils.h"
  
-#include <boost/tokenizer.hpp>
  #include "support/lassert.h"
  
  #include <QString>
-#include <QVector>
  
  #include <cstdio>
+#include <cstring>
  #include <algorithm>
+#include <typeinfo>
  
  using namespace std;
  
@@ -35,7 +35,7 @@ namespace lyx {
  // without #include "support/docstring" there.
  docstring const & empty_docstring()
  {
-       static docstring s;
+       static const docstring s;
         return s;
  }
  
@@ -43,7 +43,7 @@ docstring const & empty_docstring()
  // without #include <string>
  string const & empty_string()
  {
-       static string s;
+       static const string s;
         return s;
  }
  
@@ -57,7 +57,7 @@ namespace {
   */
  inline char_type qchar_to_ucs4(QChar const & qchar)
  {
-       LASSERT(is_utf16(static_cast<char_type>(qchar.unicode())), /**/);
+       LASSERT(is_utf16(static_cast<char_type>(qchar.unicode())), return '?');
         return static_cast<char_type>(qchar.unicode());
  }
  
@@ -70,7 +70,7 @@ inline char_type qchar_to_ucs4(QChar const & qchar)
   */
  inline QChar const ucs4_to_qchar(char_type const ucs4)
  {
-       LASSERT(is_utf16(ucs4), /**/);
+       LASSERT(is_utf16(ucs4), return QChar('?'));
         return QChar(static_cast<unsigned short>(ucs4));
  }
  
@@ -115,6 +115,11 @@ bool isPrintable(char_type c)
                 // assume that all non-utf16 characters are printable
                 return true;
         }
+       // Not yet recognized by QChar::isPrint()
+       // See https://bugreports.qt-project.org/browse/QTBUG-12144
+       // LATIN CAPITAL LETTER SHARP S
+       else if (c == 0x1e9e)
+               return true;
         return ucs4_to_qchar(c).isPrint();
  }
  
@@ -146,13 +151,13 @@ bool isSpace(char_type c)
  }
  
  
-bool isDigit(char_type c)
+bool isNumber(char_type c)
  {
         if (!is_utf16(c))
-               // assume that no non-utf16 character is a digit
+               // assume that no non-utf16 character is a numeral
                 // c outside the UCS4 range is catched as well
                 return false;
-       return ucs4_to_qchar(c).isDigit();
+       return ucs4_to_qchar(c).isNumber();
  }
  
  
@@ -164,8 +169,13 @@ bool isDigitASCII(char_type c)
  
  bool isAlnumASCII(char_type c)
  {
-       return ('0' <= c && c <= '9')
-               || ('a' <= c && c <= 'z') || ('A' <= c && c <= 'Z');
+       return isAlphaASCII(c) || isDigitASCII(c);
+}
+
+
+bool isASCII(char_type c)
+{
+       return c < 0x80;
  }
  
  
@@ -193,6 +203,29 @@ int compare_no_case(docstring const & s, docstring const & s2)
  }
  
  
+int compare_locale(docstring const & s, docstring const & s2)
+{
+       // FIXME: We have a report that this does not work on Windows (bug 9030).
+       try
+       {
+               string const l = to_local8bit(s);
+               string const r = to_local8bit(s2);
+               return strcoll(l.c_str(), r.c_str());
+       }
+       catch (bad_cast & e)
+       {
+               // fall back to builtin sorting
+               LYXERR0("Could not compare using the current locale: "
+                       << e.what() << ", using fallback.");
+               if (s < s2)
+                       return -1;
+               if (s > s2)
+                       return 1;
+               return 0;
+       }
+}
+
+
  namespace {
  
  template<typename Char>
@@ -265,7 +298,7 @@ bool isStrInt(string const & str)
  
         string::const_iterator end = tmpstr.end();
         for (; cit != end; ++cit)
-               if (!isdigit((*cit)))
+               if (!isDigitASCII(*cit))
                         return false;
  
         return true;
@@ -285,7 +318,7 @@ bool isStrUnsignedInt(string const & str)
         string::const_iterator cit = tmpstr.begin();
         string::const_iterator end = tmpstr.end();
         for (; cit != end; ++cit)
-               if (!isdigit((*cit)))
+               if (!isDigitASCII(*cit))
                         return false;
  
         return true;
@@ -309,7 +342,7 @@ bool isStrDbl(string const & str)
                 ++cit;
         string::const_iterator end = tmpstr.end();
         for (; cit != end; ++cit) {
-               if (!isdigit(*cit) && *cit != '.')
+               if (!isDigitASCII(*cit) && *cit != '.')
                         return false;
                 if ('.' == (*cit)) {
                         if (found_dot)
@@ -321,24 +354,18 @@ bool isStrDbl(string const & str)
  }
  
  
-bool hasDigit(docstring const & str)
+bool hasDigitASCII(docstring const & str)
  {
-       if (str.empty())
-               return false;
-
         docstring::const_iterator cit = str.begin();
         docstring::const_iterator const end = str.end();
-       for (; cit != end; ++cit) {
-               if (*cit == ' ')
-                       continue;
-               if (isdigit((*cit)))
+       for (; cit != end; ++cit)
+               if (isDigitASCII(*cit))
                         return true;
-       }
         return false;
  }
  
  
-static bool isHexChar(char_type c)
+bool isHexChar(char_type c)
  {
         return c == '0' ||
                 c == '1' ||
@@ -408,14 +435,14 @@ bool isAscii(string const & str)
  
  char lowercase(char c)
  {
-       LASSERT(static_cast<unsigned char>(c) < 0x80, /**/);
+       LASSERT(isASCII(c), return '?');
         return char(tolower(c));
  }
  
  
  char uppercase(char c)
  {
-       LASSERT(static_cast<unsigned char>(c) < 0x80, /**/);
+       LASSERT(isASCII(c), return '?');
         return char(toupper(c));
  }
  
@@ -480,6 +507,16 @@ docstring const lowercase(docstring const & a)
  }
  
  
+/* Uncomment here and in lstrings.h if you should need this.
+string const lowercase(string const & a)
+{
+       string tmp(a);
+       transform(tmp.begin(), tmp.end(), tmp.begin(), local_lowercase());
+       return tmp;
+}
+*/
+
+
  docstring const uppercase(docstring const & a)
  {
         docstring tmp(a);
@@ -823,7 +860,7 @@ template<typename String> inline
  String const subst_string(String const & a,
                 String const & oldstr, String const & newstr)
  {
-       LASSERT(!oldstr.empty(), /**/);
+       LASSERT(!oldstr.empty(), return a);
         String lstr = a;
         size_t i = 0;
         size_t const olen = oldstr.length();
@@ -839,7 +876,7 @@ String const subst_string(String const & a,
  docstring const subst_string(docstring const & a,
                 docstring const & oldstr, docstring const & newstr)
  {
-       LASSERT(!oldstr.empty(), /**/);
+       LASSERT(!oldstr.empty(), return a);
         docstring lstr = a;
         size_t i = 0;
         size_t const olen = oldstr.length();
@@ -881,6 +918,18 @@ docstring const subst(docstring const & a,
  }
  
  
+int count_char(string const & str, char chr)
+{
+       int count = 0;
+       string::const_iterator lit = str.begin();
+       string::const_iterator end = str.end();
+       for (; lit != end; ++lit)
+               if ((*lit) == chr)
+                       count++;
+       return count;
+}
+
+
  /// Count all occurences of char \a chr inside \a str
  int count_char(docstring const & str, docstring::value_type chr)
  {
@@ -894,9 +943,34 @@ int count_char(docstring const & str, docstring::value_type chr)
  }
  
  
+int count_bin_chars(string const & str)
+{
+       QString const qstr = toqstr(str).simplified();
+       int count = 0;
+       QString::const_iterator cit = qstr.begin();
+       QString::const_iterator end = qstr.end();
+       for (; cit != end; ++cit)  {
+               switch (cit->category()) {
+               case QChar::Separator_Line:
+               case QChar::Separator_Paragraph:
+               case QChar::Other_Control:
+               case QChar::Other_Format:
+               case QChar::Other_Surrogate:
+               case QChar::Other_PrivateUse:
+               case QChar::Other_NotAssigned:
+                       ++count;
+                       break;
+               default:
+                       break;
+               }
+       }
+       return count;
+}
+
+
  docstring const trim(docstring const & a, char const * p)
  {
-       LASSERT(p, /**/);
+       LASSERT(p, return a);
  
         if (a.empty() || !*p)
                 return a;
@@ -915,7 +989,7 @@ docstring const trim(docstring const & a, char const * p)
  
  string const trim(string const & a, char const * p)
  {
-       LASSERT(p, /**/);
+       LASSERT(p, return a);
  
         if (a.empty() || !*p)
                 return a;
@@ -933,7 +1007,7 @@ string const trim(string const & a, char const * p)
  
  string const rtrim(string const & a, char const * p)
  {
-       LASSERT(p, /**/);
+       LASSERT(p, return a);
  
         if (a.empty() || !*p)
                 return a;
@@ -950,7 +1024,7 @@ string const rtrim(string const & a, char const * p)
  
  docstring const rtrim(docstring const & a, char const * p)
  {
-       LASSERT(p, /**/);
+       LASSERT(p, return a);
  
         if (a.empty() || !*p)
                 return a;
@@ -967,7 +1041,7 @@ docstring const rtrim(docstring const & a, char const * p)
  
  string const ltrim(string const & a, char const * p)
  {
-       LASSERT(p, /**/);
+       LASSERT(p, return a);
         if (a.empty() || !*p)
                 return a;
         size_t l = a.find_first_not_of(p);
@@ -979,7 +1053,7 @@ string const ltrim(string const & a, char const * p)
  
  docstring const ltrim(docstring const & a, char const * p)
  {
-       LASSERT(p, /**/);
+       LASSERT(p, return a);
         if (a.empty() || !*p)
                 return a;
         size_t l = a.find_first_not_of(from_ascii(p));
@@ -1068,6 +1142,20 @@ string const rsplit(string const & a, string & piece, char delim)
  }
  
  
+docstring const rsplit(docstring const & a, docstring & piece, char_type delim)
+{
+       docstring tmp;
+       size_t i = a.rfind(delim);
+       if (i != string::npos) { // delimiter was found
+               piece = a.substr(0, i);
+               tmp = a.substr(i + 1);
+       } else { // delimiter was not found
+               piece.erase();
+       }
+       return tmp;
+}
+
+
  docstring const rsplit(docstring const & a, char_type delim)
  {
         docstring tmp;
@@ -1085,13 +1173,14 @@ docstring const escape(docstring const & lab)
         docstring enc;
         for (size_t i = 0; i < lab.length(); ++i) {
                 char_type c = lab[i];
-               if (c >= 128 || c == '=' || c == '%') {
+               if (c >= 128 || c == '=' || c == '%' || c == '#' || c == '$'
+                   || c == '}' || c == '{' || c == ']' || c == '[' || c == '&') {
                         // Although char_type is a 32 bit type we know that
                         // UCS4 occupies only 21 bits, so we don't need to
                         // encode bigger values. Test for 2^24 because we
                         // can encode that with the 6 hex digits that are
                         // needed for 21 bits anyway.
-                       LASSERT(c < (1 << 24), /**/);
+                       LASSERT(c < (1 << 24), continue);
                         enc += '=';
                         enc += hexdigit[(c>>20) & 15];
                         enc += hexdigit[(c>>16) & 15];
@@ -1159,6 +1248,7 @@ docstring wrap(docstring const & str, int const ind, size_t const width)
  docstring wrapParas(docstring const & str, int const indent,
                     size_t const width, size_t const maxlines)
  {
+       docstring const dots = from_ascii("...");
         if (str.empty())
                 return docstring();
  
@@ -1173,9 +1263,21 @@ docstring wrapParas(docstring const & str, int const indent,
                 if (nlines == 0)
                         continue;
                 size_t const curlines = retval.size();
-               if (maxlines > 0 && curlines + nlines >= maxlines) {
-                       tmp.resize(maxlines - curlines - 1);
-                       tmp.push_back(from_ascii("..."));
+               if (maxlines > 0 && curlines + nlines > maxlines) {
+                       tmp.resize(maxlines - curlines);
+                       docstring last = tmp.back();
+                       size_t const lsize = last.size();
+                       if (lsize > width - 3) {
+                               size_t const i = last.find_last_of(' ', width - 3);
+                               if (i == docstring::npos || i <= size_t(indent))
+                                       // no space found
+                                       last = last.substr(0, lsize - 3) + dots;
+                               else
+                                       last = last.substr(0, i) + dots;
+                       } else
+                               last += dots;
+                       tmp.pop_back();
+                       tmp.push_back(last);
                 }
                 retval.insert(retval.end(), tmp.begin(), tmp.end());
                 if (maxlines > 0 && retval.size() >= maxlines)
@@ -1286,7 +1388,7 @@ int findToken(char const * const str[], string const & search_token)
  template<>
  docstring bformat(docstring const & fmt, int arg1)
  {
-       LASSERT(contains(fmt, from_ascii("%1$d")), /**/);
+       LATTEST(contains(fmt, from_ascii("%1$d")));
         docstring const str = subst(fmt, from_ascii("%1$d"), convert<docstring>(arg1));
         return subst(str, from_ascii("%%"), from_ascii("%"));
  }
@@ -1295,7 +1397,7 @@ docstring bformat(docstring const & fmt, int arg1)
  template<>
  docstring bformat(docstring const & fmt, long arg1)
  {
-       LASSERT(contains(fmt, from_ascii("%1$d")), /**/);
+       LATTEST(contains(fmt, from_ascii("%1$d")));
         docstring const str = subst(fmt, from_ascii("%1$d"), convert<docstring>(arg1));
         return subst(str, from_ascii("%%"), from_ascii("%"));
  }
@@ -1304,7 +1406,7 @@ docstring bformat(docstring const & fmt, long arg1)
  template<>
  docstring bformat(docstring const & fmt, unsigned int arg1)
  {
-       LASSERT(contains(fmt, from_ascii("%1$d")), /**/);
+       LATTEST(contains(fmt, from_ascii("%1$d")));
         docstring const str = subst(fmt, from_ascii("%1$d"), convert<docstring>(arg1));
         return subst(str, from_ascii("%%"), from_ascii("%"));
  }
@@ -1313,7 +1415,7 @@ docstring bformat(docstring const & fmt, unsigned int arg1)
  template<>
  docstring bformat(docstring const & fmt, docstring arg1)
  {
-       LASSERT(contains(fmt, from_ascii("%1$s")), /**/);
+       LATTEST(contains(fmt, from_ascii("%1$s")));
         docstring const str = subst(fmt, from_ascii("%1$s"), arg1);
         return subst(str, from_ascii("%%"), from_ascii("%"));
  }
@@ -1322,7 +1424,7 @@ docstring bformat(docstring const & fmt, docstring arg1)
  template<>
  docstring bformat(docstring const & fmt, char * arg1)
  {
-       LASSERT(contains(fmt, from_ascii("%1$s")), /**/);
+       LATTEST(contains(fmt, from_ascii("%1$s")));
         docstring const str = subst(fmt, from_ascii("%1$s"), from_ascii(arg1));
         return subst(str, from_ascii("%%"), from_ascii("%"));
  }
@@ -1331,8 +1433,8 @@ docstring bformat(docstring const & fmt, char * arg1)
  template<>
  docstring bformat(docstring const & fmt, docstring arg1, docstring arg2)
  {
-       LASSERT(contains(fmt, from_ascii("%1$s")), /**/);
-       LASSERT(contains(fmt, from_ascii("%2$s")), /**/);
+       LATTEST(contains(fmt, from_ascii("%1$s")));
+       LATTEST(contains(fmt, from_ascii("%2$s")));
         docstring str = subst(fmt, from_ascii("%1$s"), arg1);
         str = subst(str, from_ascii("%2$s"), arg2);
         return subst(str, from_ascii("%%"), from_ascii("%"));
@@ -1342,8 +1444,8 @@ docstring bformat(docstring const & fmt, docstring arg1, docstring arg2)
  template<>
  docstring bformat(docstring const & fmt, docstring arg1, int arg2)
  {
-       LASSERT(contains(fmt, from_ascii("%1$s")), /**/);
-       LASSERT(contains(fmt, from_ascii("%2$d")), /**/);
+       LATTEST(contains(fmt, from_ascii("%1$s")));
+       LATTEST(contains(fmt, from_ascii("%2$d")));
         docstring str = subst(fmt, from_ascii("%1$s"), arg1);
         str = subst(str, from_ascii("%2$d"), convert<docstring>(arg2));
         return subst(str, from_ascii("%%"), from_ascii("%"));
@@ -1353,10 +1455,10 @@ docstring bformat(docstring const & fmt, docstring arg1, int arg2)
  template<>
  docstring bformat(docstring const & fmt, char const * arg1, docstring arg2)
  {
-       LASSERT(contains(fmt, from_ascii("%1$s")), /**/);
-       LASSERT(contains(fmt, from_ascii("%2$s")), /**/);
+       LATTEST(contains(fmt, from_ascii("%1$s")));
+       LATTEST(contains(fmt, from_ascii("%2$s")));
         docstring str = subst(fmt, from_ascii("%1$s"), from_ascii(arg1));
-       str = subst(fmt, from_ascii("%2$s"), arg2);
+       str = subst(str, from_ascii("%2$s"), arg2);
         return subst(str, from_ascii("%%"), from_ascii("%"));
  }
  
@@ -1364,8 +1466,8 @@ docstring bformat(docstring const & fmt, char const * arg1, docstring arg2)
  template<>
  docstring bformat(docstring const & fmt, int arg1, int arg2)
  {
-       LASSERT(contains(fmt, from_ascii("%1$d")), /**/);
-       LASSERT(contains(fmt, from_ascii("%2$d")), /**/);
+       LATTEST(contains(fmt, from_ascii("%1$d")));
+       LATTEST(contains(fmt, from_ascii("%2$d")));
         docstring str = subst(fmt, from_ascii("%1$d"), convert<docstring>(arg1));
         str = subst(str, from_ascii("%2$d"), convert<docstring>(arg2));
         return subst(str, from_ascii("%%"), from_ascii("%"));
@@ -1375,9 +1477,9 @@ docstring bformat(docstring const & fmt, int arg1, int arg2)
  template<>
  docstring bformat(docstring const & fmt, docstring arg1, docstring arg2, docstring arg3)
  {
-       LASSERT(contains(fmt, from_ascii("%1$s")), /**/);
-       LASSERT(contains(fmt, from_ascii("%2$s")), /**/);
-       LASSERT(contains(fmt, from_ascii("%3$s")), /**/);
+       LATTEST(contains(fmt, from_ascii("%1$s")));
+       LATTEST(contains(fmt, from_ascii("%2$s")));
+       LATTEST(contains(fmt, from_ascii("%3$s")));
         docstring str = subst(fmt, from_ascii("%1$s"), arg1);
         str = subst(str, from_ascii("%2$s"), arg2);
         str = subst(str, from_ascii("%3$s"), arg3);
@@ -1389,10 +1491,10 @@ template<>
  docstring bformat(docstring const & fmt,
                docstring arg1, docstring arg2, docstring arg3, docstring arg4)
  {
-       LASSERT(contains(fmt, from_ascii("%1$s")), /**/);
-       LASSERT(contains(fmt, from_ascii("%2$s")), /**/);
-       LASSERT(contains(fmt, from_ascii("%3$s")), /**/);
-       LASSERT(contains(fmt, from_ascii("%4$s")), /**/);
+       LATTEST(contains(fmt, from_ascii("%1$s")));
+       LATTEST(contains(fmt, from_ascii("%2$s")));
+       LATTEST(contains(fmt, from_ascii("%3$s")));
+       LATTEST(contains(fmt, from_ascii("%4$s")));
         docstring str = subst(fmt, from_ascii("%1$s"), arg1);
         str = subst(str, from_ascii("%2$s"), arg2);
         str = subst(str, from_ascii("%3$s"), arg3);