Convert most of the bibtex machinery to docstring.

[lyx.git] / src / support / lstrings.h
diff --git a/src/support/lstrings.h b/src/support/lstrings.h

index 13251b189b4d67b31ffc3bb41bcbb08181808203..87e7f242fd7691785e12966ba4f5ad98f444537b 100644 (file)
--- a/src/support/lstrings.h
+++ b/src/support/lstrings.h
@@ -1,214 +1,296 @@
  // -*- C++ -*-
-
-/** This is a collection of string helper functions that works
-    together with string (and later also with STL String. Some of these
-    would certainly benefit from a rewrite/optimization.
-*/
+/**
+ * \file lstrings.h
+ * This file is part of LyX, the document processor.
+ * Licence details can be found in the file COPYING.
+ *
+ * \author Lars Gullik Bjønnes
+ * \author Jean-Marc Lasgouttes
+ *
+ * Full author contact details are available in file CREDITS.
+ *
+ * A collection of string helper functions that works with string.
+ * Some of these would certainly benefit from a rewrite/optimization.
+ */
  
  #ifndef LSTRINGS_H
  #define LSTRINGS_H
  
-#include <cstring>
+#include "support/docstring.h"
  
-#include "LAssert.h"
+#include <vector>
  
-//#warning verify this please. Lgb
-///
-template<class T>
-size_t lstrlen(T const * t)
-{
-       Assert(t); // we don't want null pointers
-       size_t count = 0;
-       T const * r = t;
-       while(*r != 0) ++r, ++count;
-       return count;
-}
  
+namespace lyx {
+namespace support {
  
-//#warning verify this please. Lgb
  ///
-template<class T>
-T * lstrchr(T const * t, int c)
-{
-  Assert(t); // we don't want null pointers
-  T * r = const_cast<T*>(t);
-  while(*r != 0) 
-    if (*r == c) return r; else ++r;
-  return 0;
-}
-
-#include <cctype>
-#include "LString.h"
-
+int compare_no_case(std::string const & s, std::string const & s2);
+int compare_no_case(docstring const & s, docstring const & s2);
  
  ///
-inline int compare_no_case(string const & s, string const & s2)
-{
-       // ANSI C
-       string::const_iterator p = s.begin();
-       string::const_iterator p2 = s2.begin();
-
-       while (p != s.end() && p2 != s2.end()) {
-               if (tolower(*p) != tolower(*p2))
-                       return (tolower(*p) < tolower(*p2)) ? -1 : 1;
-               ++p;
-               ++p2;
-       }
-
-       return s.size() - s2.size();
-}
-
+int compare_ascii_no_case(std::string const & s, std::string const & s2);
  
  ///
-inline int compare_no_case(string const & s, string const & s2,
-                          unsigned int len)
-{
-//#warning verify this func please
-       string::const_iterator p = s.begin();
-       string::const_iterator p2 = s2.begin();
-       unsigned int i = 0;
-       while (i < len && p != s.end() && p2 != s2.end()) {
-               if (tolower(*p) != tolower(*p2))
-                       return (tolower(*p) < tolower(*p2)) ? -1 : 1;
-               ++i;
-               ++p;
-               ++p2;
-       }
-       return s.size() - s2.size();
-}
+int compare_ascii_no_case(docstring const & s, docstring const & s2);
  
+///
+int compare_no_case(std::string const & s, std::string const & s2, unsigned int len);
  
  ///
-inline int compare(char const * a, char const * b)
+inline
+int compare(char const * a, char const * b)
  {
+#ifndef CXX_GLOBAL_CSTD
+       return std::strcmp(a, b);
+#else
         return strcmp(a, b);
+#endif
  }
  
-
  ///
-inline int compare(char const * a, char const * b, unsigned int len)
+inline
+int compare(char const * a, char const * b, unsigned int len)
  {
+#ifndef CXX_GLOBAL_CSTD
+       return std::strncmp(a, b, len);
+#else
         return strncmp(a, b, len);
+#endif
  }
  
-
  ///
-bool isStrInt(string const & str);
+bool isStrInt(std::string const & str);
  
-///
-int strToInt(string const & str);
+/// does the std::string represent an unsigned integer value ?
+bool isStrUnsignedInt(std::string const & str);
  
  ///
-string lowercase(string const &);
+bool isStrDbl(std::string const & str);
  
-///
-string uppercase(string const &);
-
-/// int to string
-string tostr(int i);
+bool isHex(lyx::docstring const & str);
  
-///
-string tostr(unsigned int);
+int hexToInt(lyx::docstring const & str);
  
-/// long to string
-string tostr(long l);
+/// is \p str pure ascii?
+bool isAscii(docstring const & str);
  
  ///
-string tostr(unsigned long l); 
+char lowercase(char c);
  
  ///
-string tostr(char c);
+char uppercase(char c);
+
+/// changes the case only if c is a one-byte char
+char_type lowercase(char_type c);
+
+/// changes the case only if c is a one-byte char
+char_type uppercase(char_type c);
  
-/// void * to string
-string tostr(void * v);
+/// same as lowercase(), but ignores locale
+std::string const ascii_lowercase(std::string const &);
+docstring const ascii_lowercase(docstring const &);
  
-/// bool to string
-string tostr(bool b);
+///
+std::string const lowercase(std::string const &);
+docstring const lowercase(docstring const &);
  
  ///
-string tostr(double d);
+std::string const uppercase(std::string const &);
  
-/// Does the string start with this prefix?
-bool prefixIs(string const &, char const *);
+/// Does the std::string start with this prefix?
+bool prefixIs(std::string const &, std::string const &);
+bool prefixIs(lyx::docstring const &, lyx::docstring const &);
  
  /// Does the string end with this char?
-bool suffixIs(string const &, char);
+bool suffixIs(std::string const &, char);
  
-/// Does the string end with this suffix?
-bool suffixIs(string const &, char const *);
+/// Does the std::string end with this suffix?
+bool suffixIs(std::string const &, std::string const &);
  
  ///
-bool contains(char const * a, string const & b);
+inline bool contains(std::string const & a, std::string const & b)
+{
+       return a.find(b) != std::string::npos;
+}
  
-///
-bool contains(string const & a, char const * b);
+inline bool contains(docstring const & a, docstring const & b)
+{
+       return a.find(b) != docstring::npos;
+}
  
-///
-bool contains(string const & a, string const & b);
+inline bool contains(std::string const & a, char b)
+{
+       return a.find(b) != std::string::npos;
+}
  
-///
-bool contains(char const * a, char const * b);
+inline bool contains(docstring const & a, char_type b)
+{
+       return a.find(b) != docstring::npos;
+}
  
-/// Counts how many of character c there is in a
-int countChar(string const & a, char const c);
+///
+bool containsOnly(std::string const &, std::string const &);
  
  /** Extracts a token from this string at the nth delim.
-  Doesn't modify the original string. Similar to strtok.
-  Example:
-  #"a;bc;d".token(';', 1) == "bc";#
-  #"a;bc;d".token(';', 2) == "d";#
+    Doesn't modify the original string. Similar to strtok.
+    Example:
+    \code
+    token("a;bc;d", ';', 1) == "bc";
+    token("a;bc;d", ';', 2) == "d";
+    \endcode
  */
-string token(string const & a, char delim, int n);
+std::string const token(std::string const & a, char delim, int n);
  
+docstring const token(docstring const & a, char_type delim, int n);
  
  /** Search a token in this string using the delim.
-  Doesn't modify the original string. Returns -1 in case of
-  failure. 
-  Example:
-  #"a;bc;d".tokenPos(';', "bc") == 1;#
-  #"a;bc;d".token(';', "d") == 2;#
+    Doesn't modify the original string. Returns -1 in case of
+    failure.
+    Example:
+    \code
+    tokenPos("a;bc;d", ';', "bc") == 1;
+    tokenPos("a;bc;d", ';', "d") == 2;
+    \endcode
  */
-int tokenPos(string const & a, char delim, string const & tok);
+int tokenPos(std::string const & a, char delim, std::string const & tok);
  
  
-/** Compares a string and a (simple) regular expression
-  The only element allowed is "*" for any string of characters
-  */
-bool regexMatch(string const & a, string const & pattern);
+/// Substitute all \a oldchar with \a newchar
+std::string const subst(std::string const & a, char oldchar, char newchar);
  
-/// Substitute all "oldchar"s with "newchar"
-string subst(string const & a, char oldchar, char newchar);
+/// Substitute all \a oldchar with \a newchar
+docstring const subst(docstring const & a, char_type oldchar, char_type newchar);
  
-/// Substitutes all instances of oldstr with newstr
-string subst(string const & a,
-            char const * oldstr, string const & newstr);
+/// substitutes all instances of \a oldstr with \a newstr
+std::string const subst(std::string const & a,
+                  std::string const & oldstr, std::string const & newstr);
  
-/** Strips characters off the end of a string.
-  #"abccc".strip('c') = "ab".#
-  */
-string strip(string const & a, char const c = ' ');
+/// substitutes all instances of \a oldstr with \a newstr
+docstring const subst(docstring const & a,
+               docstring const & oldstr, docstring const & newstr);
  
-/** Strips characters of the beginning of a string.
-  #"cccba".frontstrip('c') = "ba"#. */
-string frontStrip(string const & a, char const c = ' ');
+/** Trims characters off the end and beginning of a string.
+    \code
+    trim("ccabccc", "c") == "ab".
+    \endcode
+*/
+docstring const trim(docstring const & a, char const * p = " ");
  
-/** Strips characters off the beginning of a string.
-    #"ababcdef".frontstrip("ab") = "cdef"# .*/
-string frontStrip(string const & a, char const * p);
+/** Trims characters off the end and beginning of a string.
+    \code
+    trim("ccabccc", "c") == "ab".
+    \endcode
+*/
+std::string const trim(std::string const & a, char const * p = " ");
+
+/** Trims characters off the end of a string.
+    \code
+    rtrim("abccc", "c") == "ab".
+    \endcode
+*/
+std::string const rtrim(std::string const & a, char const * p = " ");
+docstring const rtrim(docstring const & a, char const * p = " ");
+
+/** Trims characters off the beginning of a string.
+    \code
+    ltrim("ababcdef", "ab") == "cdef"
+    \endcode
+*/
+std::string const ltrim(std::string const & a, char const * p = " ");
+docstring const ltrim(docstring const & a, char const * p = " ");
  
  /** Splits the string by the first delim.
-  Splits the string by the first appearance of delim.
-  The leading string up to delim is returned in piece (not including
-  delim), while the original string is cut from after the delimiter.
-  Example:
-  #s1= ""; s2= "a;bc".split(s1, ';') -> s1 == "a"; s2 == "bc";#
-  */
-string split(string const & a, string & piece, char delim);
+    Splits the string by the first appearance of delim.
+    The leading string up to delim is returned in piece (not including
+    delim), while the original string is cut from after the delimiter.
+    Example:
+    \code
+    s1 = ""; s2 = split("a;bc", s1, ';') -> s1 == "a"; s2 == "bc";
+    \endcode
+*/
+std::string const split(std::string const & a, std::string & piece, char delim);
+docstring const split(docstring const & a, docstring & piece, char_type delim);
  
  /// Same as split but does not return a piece
-string split(string const & a, char delim);
+std::string const split(std::string const & a, char delim);
  
  /// Same as split but uses the last delim.
-string rsplit(string const & a, string & piece, char delim);
+std::string const rsplit(std::string const & a, std::string & piece, char delim);
+
+/// Escapes non ASCII chars and other problematic characters that cause
+/// problems in latex labels.
+docstring const escape(docstring const & lab);
+
+/// Returns a vector of the parts of \p str that are separated by the delimiter \p delim
+std::vector<std::string> const getVectorFromString(std::string const & str,
+                                             std::string const & delim = std::string(","));
+std::vector<docstring> const getVectorFromString(docstring const & str,
+               docstring const & delim = from_ascii(","));
+
+/// The reverse of getVectorFromString: joins the elements of \p vec, separated by \p delim
+std::string const getStringFromVector(std::vector<std::string> const & vec,
+                                std::string const & delim = std::string(","));
+
+/// Search \p search_token in \p str and return the position if it is
+/// found, else -1. The last item in \p str must be "".
+int findToken(char const * const str[], std::string const & search_token);
+
+/// Convert internal line endings to line endings as expected by the OS
+docstring const externalLineEnding(docstring const & str);
+
+/// Convert line endings in any format to internal line endings
+docstring const internalLineEnding(docstring const & str);
+
+
+#ifdef I_AM_NOT_AFRAID_OF_HEADER_LIBRARIES
+
+#include <boost/format.hpp>
+
+template<class Arg1>
+docstring bformat(docstring const & fmt, Arg1 arg1)
+{
+       return (boost::basic_format<char_type>(fmt) % arg1).str();
+}
+
+
+template<class Arg1, class Arg2>
+docstring bformat(docstring const & fmt, Arg1 arg1, Arg2 arg2)
+{
+       return (boost::basic_format<char_type>(fmt) % arg1 % arg2).str();
+}
+
+
+template<class Arg1, class Arg2, class Arg3>
+docstring bformat(docstring const & fmt, Arg1 arg1, Arg2 arg2, Arg3 arg3)
+{
+       return (boost::basic_format<char_type>(fmt) % arg1 % arg2 % arg3).str();
+}
+
+
+template<class Arg1, class Arg2, class Arg3, class Arg4>
+docstring bformat(docstring const & fmt, Arg1 arg1, Arg2 arg2, Arg3 arg3, Arg4 arg4)
+{
+       return (boost::basic_format<char_type>(fmt) % arg1 % arg2 % arg3 % arg4).str();
+}
+
+#else
+
+template <class Arg1>
+docstring bformat(docstring const & fmt, Arg1);
+
+template <class Arg1, class Arg2>
+docstring bformat(docstring const & fmt, Arg1, Arg2);
+
+template <class Arg1, class Arg2, class Arg3>
+docstring bformat(docstring const & fmt, Arg1, Arg2, Arg3);
+
+template <class Arg1, class Arg2, class Arg3, class Arg4>
+docstring bformat(docstring const & fmt, Arg1, Arg2, Arg3, Arg4);
+
+#endif
+
+} // namespace support
+} // namespace lyx
  
  #endif