Improve LaTeX format detection

[features.git] / src / support / lstrings.h
diff --git a/src/support/lstrings.h b/src/support/lstrings.h

index 7a0cbd5b5f16df85954765b7bde4250cc0f6619b..2606546fa05ce3c29cdb5c0c47341e83e1fd814c 100644 (file)
--- a/src/support/lstrings.h
+++ b/src/support/lstrings.h
@@ -4,7 +4,7 @@
   * This file is part of LyX, the document processor.
   * Licence details can be found in the file COPYING.
   *
- * \author Lars Gullik Bjønnes
+ * \author Lars Gullik Bjønnes
   * \author Jean-Marc Lasgouttes
   *
   * Full author contact details are available in file CREDITS.
@@ -34,28 +34,6 @@ int compare_ascii_no_case(std::string const & s, std::string const & s2);
  /// Compare \p s and \p s2, ignoring the case of ASCII characters only.
  int compare_ascii_no_case(docstring const & s, docstring const & s2);
  
-///
-inline
-int compare(char const * a, char const * b)
-{
-#ifndef CXX_GLOBAL_CSTD
-       return std::strcmp(a, b);
-#else
-       return strcmp(a, b);
-#endif
-}
-
-///
-inline
-int compare(char const * a, char const * b, unsigned int len)
-{
-#ifndef CXX_GLOBAL_CSTD
-       return std::strncmp(a, b, len);
-#else
-       return strncmp(a, b, len);
-#endif
-}
-
  ///
  bool isStrInt(std::string const & str);
  
@@ -65,13 +43,21 @@ bool isStrUnsignedInt(std::string const & str);
  ///
  bool isStrDbl(std::string const & str);
  
-bool isHex(lyx::docstring const & str);
+/// does the string contain a digit?
+bool hasDigitASCII(docstring const & str);
  
-int hexToInt(lyx::docstring const & str);
+bool isHexChar(char_type);
+
+bool isHex(docstring const & str);
+
+int hexToInt(docstring const & str);
  
  /// is \p str pure ascii?
  bool isAscii(docstring const & str);
  
+/// is \p str pure ascii?
+bool isAscii(std::string const & str);
+
  /**
   * Changes the case of \p c to lowercase.
   * Don't use this for non-ASCII characters, since it depends on the locale.
@@ -98,6 +84,12 @@ char_type lowercase(char_type c);
  /// Does not depend on the locale.
  char_type uppercase(char_type c);
  
+/// Checks if the supplied character is lower-case
+bool isLowerCase(char_type ch);
+
+/// Checks if the supplied character is upper-case
+bool isUpperCase(char_type ch);
+
  /// same as lowercase(), but ignores locale
  std::string const ascii_lowercase(std::string const &);
  docstring const ascii_lowercase(docstring const &);
@@ -110,21 +102,30 @@ docstring const lowercase(docstring const & s);
  /// Does not depend on the locale.
  docstring const uppercase(docstring const & s);
  
-/// Does the string start with this prefix?
-bool prefixIs(docstring const &, char_type);
+/// Returns the superscript of \p c or \p c if no superscript exists.
+/// Does not depend on the locale.
+char_type superscript(char_type c);
+
+/// Returns the subscript of \p c or \p c if no subscript exists.
+/// Does not depend on the locale.
+char_type subscript(char_type c);
+
+/// Does str start with c?
+bool prefixIs(docstring const & str, char_type c);
  
-/// Does the std::string start with this prefix?
-bool prefixIs(std::string const &, std::string const &);
-bool prefixIs(docstring const &, docstring const &);
+/// Does str start with pre?
+bool prefixIs(std::string const & str, std::string const & pre);
+bool prefixIs(docstring const & str, docstring const & pre);
  
  /// Does the string end with this char?
  bool suffixIs(std::string const &, char);
  bool suffixIs(docstring const &, char_type);
  
-/// Does the std::string end with this suffix?
+/// Does the string end with this suffix?
  bool suffixIs(std::string const &, std::string const &);
+bool suffixIs(docstring const &, docstring const &);
  
-///
+/// Is b contained in a?
  inline bool contains(std::string const & a, std::string const & b)
  {
         return a.find(b) != std::string::npos;
@@ -170,6 +171,7 @@ docstring const token(docstring const & a, char_type delim, int n);
      \endcode
  */
  int tokenPos(std::string const & a, char delim, std::string const & tok);
+int tokenPos(docstring const & a, char_type delim, docstring const & tok);
  
  
  /// Substitute all \a oldchar with \a newchar
@@ -186,6 +188,12 @@ std::string const subst(std::string const & a,
  docstring const subst(docstring const & a,
                 docstring const & oldstr, docstring const & newstr);
  
+/// Count all occurrences of char \a chr inside \a str
+int count_char(std::string const & str, char chr);
+
+/// Count all occurrences of char \a chr inside \a str
+int count_char(docstring const & str, docstring::value_type chr);
+
  /** Trims characters off the end and beginning of a string.
      \code
      trim("ccabccc", "c") == "ab".
@@ -200,9 +208,10 @@ docstring const trim(docstring const & a, char const * p = " ");
  */
  std::string const trim(std::string const & a, char const * p = " ");
  
-/** Trims characters off the end of a string.
+/** Trims characters off the end of a string, removing any character
+    in p.
      \code
-    rtrim("abccc", "c") == "ab".
+    rtrim("abcde", "dec") == "ab".
      \endcode
  */
  std::string const rtrim(std::string const & a, char const * p = " ");
@@ -210,21 +219,25 @@ docstring const rtrim(docstring const & a, char const * p = " ");
  
  /** Trims characters off the beginning of a string.
      \code
-   ("ababcdef", "ab") = "cdef"
+    ltrim("abbabcdef", "ab") == "cdef"
      \endcode
  */
  std::string const ltrim(std::string const & a, char const * p = " ");
  docstring const ltrim(docstring const & a, char const * p = " ");
  
-/** Splits the string by the first delim.
-    Splits the string by the first appearance of delim.
-    The leading string up to delim is returned in piece (not including
-    delim), while the original string is cut from after the delimiter.
-    Example:
+/** Splits the string given in the first argument at the first occurrence
+    of the third argument, delim.
+    What precedes delim is returned in the second argument, piece; this
+    will be the whole of the string if no delimiter is found.
+    The return value is what follows delim, if anything. So the return
+    value is the null string if no delimiter is found.
+    'a' and 'piece' must be different variables.
+    Examples:
      \code
-    s1= ""; s2= "a;bc".split(s1, ';') -> s1 == "a"; s2 == "bc";
+    s1 = "a;bc"; s2 = "";
+    ret = split(s1, s2, ';') -> ret == "bc", s2 == "a"
      \endcode
-*/
+ */
  std::string const split(std::string const & a, std::string & piece, char delim);
  docstring const split(docstring const & a, docstring & piece, char_type delim);
  
@@ -233,65 +246,49 @@ std::string const split(std::string const & a, char delim);
  
  /// Same as split but uses the last delim.
  std::string const rsplit(std::string const & a, std::string & piece, char delim);
+docstring const rsplit(docstring const & a, docstring & piece, char_type delim);
+docstring const rsplit(docstring const & a, char_type delim);
  
  /// Escapes non ASCII chars and other problematic characters that cause
  /// problems in latex labels.
  docstring const escape(docstring const & lab);
  
+/// Word-wraps the provided docstring, returning a line-broken string
+/// no wider than \p width, with the string broken at spaces.
+/// If the string cannot be broken appropriately, it returns something
+/// with "..." at the end, again no wider than \p width.
+/// We assume here that str does not contain newlines.
+/// If indent is positive, then the first line is indented that many 
+/// spaces. If it is negative, then successive lines are indented, as
+/// if the first line were "outdented".
+docstring wrap(docstring const & str, int const indent = 0,
+               size_t const width = 80);
+
+/// Like the preceding, except it is intended to operate on strings
+/// that may contain embedded newlines.
+/// \param maxlines Don't return more than maxlines lines. If maxlines
+///    is 0, we return everything.
+docstring wrapParas(docstring const & str, int const indent = 0,
+                    size_t const width = 80, size_t const maxlines = 10);
+
  /// gives a vector of stringparts which have the delimiter delim
+/// If \p keepempty is true, empty strings will be pushed to the vector as well
  std::vector<std::string> const getVectorFromString(std::string const & str,
-                                             std::string const & delim = std::string(","));
+                                             std::string const & delim = std::string(","),
+                                             bool keepempty = false);
  std::vector<docstring> const getVectorFromString(docstring const & str,
-               docstring const & delim = from_ascii(","));
+               docstring const & delim = from_ascii(","), bool keepempty = false);
  
-// the same vice versa
+/// The reverse operation: joins the elements of \p vec into one string,
+/// separated by \p delim.
  std::string const getStringFromVector(std::vector<std::string> const & vec,
                                  std::string const & delim = std::string(","));
+docstring const getStringFromVector(std::vector<docstring> const & vec,
+                                docstring const & delim = from_ascii(","));
  
  /// Search \p search_token in \p str and return the position if it is
  /// found, else -1. The last item in \p str must be "".
  int findToken(char const * const str[], std::string const & search_token);
  
-/// Convert internal line endings to line endings as expected by the OS
-docstring const externalLineEnding(docstring const & str);
-
-/// Convert line endings in any formnat to internal line endings
-docstring const internalLineEnding(docstring const & str);
-
-
-#ifdef I_AM_NOT_AFRAID_OF_HEADER_LIBRARIES
-
-#include <boost/format.hpp>
-
-template<class Arg1>
-docstring bformat(docstring const & fmt, Arg1 arg1)
-{
-       return (boost::basic_format<char_type>(fmt) % arg1).str();
-}
-
-
-template<class Arg1, class Arg2>
-docstring bformat(docstring const & fmt, Arg1 arg1, Arg2 arg2)
-{
-       return (boost::basic_format<char_type>(fmt) % arg1 % arg2).str();
-}
-
-
-template<class Arg1, class Arg2, class Arg3>
-docstring bformat(docstring const & fmt, Arg1 arg1, Arg2 arg2, Arg3 arg3)
-{
-       return (boost::basic_format<char_type>(fmt) % arg1 % arg2 % arg3).str();
-}
-
-
-template<class Arg1, class Arg2, class Arg3, class Arg4>
-docstring bformat(docstring const & fmt, Arg1 arg1, Arg2 arg2, Arg3 arg3, Arg4 arg4)
-{
-       return (boost::basic_format<char_type>(fmt) % arg1 % arg2 % arg3 % arg4).str();
-}
-
-#else
-
  template <class Arg1>
  docstring bformat(docstring const & fmt, Arg1);
  
@@ -304,7 +301,19 @@ docstring bformat(docstring const & fmt, Arg1, Arg2, Arg3);
  template <class Arg1, class Arg2, class Arg3, class Arg4>
  docstring bformat(docstring const & fmt, Arg1, Arg2, Arg3, Arg4);
  
-#endif
+
+template<> docstring bformat(docstring const & fmt, int arg1);
+template<> docstring bformat(docstring const & fmt, long arg1);
+template<> docstring bformat(docstring const & fmt, unsigned int arg1);
+template<> docstring bformat(docstring const & fmt, docstring arg1);
+template<> docstring bformat(docstring const & fmt, char * arg1);
+template<> docstring bformat(docstring const & fmt, docstring arg1, docstring arg2);
+template<> docstring bformat(docstring const & fmt, docstring arg1, int arg2);
+template<> docstring bformat(docstring const & fmt, char const * arg1, docstring arg2);
+template<> docstring bformat(docstring const & fmt, int arg1, int arg2);
+template<> docstring bformat(docstring const & fmt, docstring arg1, docstring arg2, docstring arg3);
+template<> docstring bformat(docstring const & fmt, docstring arg1, docstring arg2, docstring arg3, docstring arg4);
+
  
  } // namespace support
  } // namespace lyx