1999-10-02 16:21:10 +00:00
|
|
|
|
// -*- C++ -*-
|
2002-09-25 10:03:41 +00:00
|
|
|
|
/**
|
|
|
|
|
* \file lstrings.h
|
|
|
|
|
* This file is part of LyX, the document processor.
|
|
|
|
|
* Licence details can be found in the file COPYING.
|
|
|
|
|
*
|
|
|
|
|
* \author Lars Gullik Bjønnes
|
|
|
|
|
* \author Jean-Marc Lasgouttes
|
|
|
|
|
*
|
2003-08-23 00:17:00 +00:00
|
|
|
|
* Full author contact details are available in file CREDITS.
|
2002-09-25 10:03:41 +00:00
|
|
|
|
*
|
|
|
|
|
* A collection of string helper functions that work with std::string and docstring.
|
|
|
|
|
* Some of these would certainly benefit from a rewrite/optimization.
|
|
|
|
|
*/
|
1999-10-02 16:21:10 +00:00
|
|
|
|
|
|
|
|
|
#ifndef LSTRINGS_H
|
|
|
|
|
#define LSTRINGS_H
|
|
|
|
|
|
2006-09-13 21:13:49 +00:00
|
|
|
|
#include "support/docstring.h"
|
2006-08-13 22:54:59 +00:00
|
|
|
|
|
2002-04-15 12:05:07 +00:00
|
|
|
|
#include <vector>
|
1999-10-02 16:21:10 +00:00
|
|
|
|
|
|
|
|
|
|
2003-06-30 23:56:22 +00:00
|
|
|
|
namespace lyx {
|
|
|
|
|
namespace support {
|
|
|
|
|
|
2007-02-26 09:03:21 +00:00
|
|
|
|
/// Compare \p s and \p s2, ignoring the case.
|
|
|
|
|
/// Caution: Depends on the locale
|
2003-10-06 15:43:21 +00:00
|
|
|
|
int compare_no_case(std::string const & s, std::string const & s2);
|
2007-02-26 09:03:21 +00:00
|
|
|
|
|
|
|
|
|
/// Compare \p s and \p s2, ignoring the case.
|
|
|
|
|
/// Does not depend on the locale.
|
2006-10-21 00:16:43 +00:00
|
|
|
|
int compare_no_case(docstring const & s, docstring const & s2);
|
1999-11-26 06:57:35 +00:00
|
|
|
|
|
2007-02-26 09:03:21 +00:00
|
|
|
|
/// Compare \p s and \p s2, ignoring the case of ASCII characters only.
|
2003-10-06 15:43:21 +00:00
|
|
|
|
int compare_ascii_no_case(std::string const & s, std::string const & s2);
|
2001-06-25 00:06:33 +00:00
|
|
|
|
|
2007-02-26 09:03:21 +00:00
|
|
|
|
/// Compare \p s and \p s2, ignoring the case of ASCII characters only.
|
2006-10-11 19:40:50 +00:00
|
|
|
|
int compare_ascii_no_case(docstring const & s, docstring const & s2);
|
|
|
|
|
|
2007-02-26 09:03:21 +00:00
|
|
|
|
/// Compare the first \p len characters of \p s and \p s2, ignoring the case.
|
|
|
|
|
/// Caution: Depends on the locale
|
2003-10-06 15:43:21 +00:00
|
|
|
|
int compare_no_case(std::string const & s, std::string const & s2, unsigned int len);
|
1999-11-26 06:57:35 +00:00
|
|
|
|
|
2000-08-07 20:58:24 +00:00
|
|
|
|
///
|
2000-03-07 01:14:37 +00:00
|
|
|
|
/// Lexicographically compare the NUL-terminated C strings \p a and \p b.
/// Thin wrapper around strcmp(): the result is negative, zero or positive
/// when \p a sorts before, equal to or after \p b respectively.
inline
int compare(char const * a, char const * b)
{
	// CXX_GLOBAL_CSTD selects the unqualified strcmp spelling instead of
	// the std:: one (presumably for toolchains whose C library functions
	// are not declared in namespace std -- confirm against the build setup).
#ifndef CXX_GLOBAL_CSTD
	return std::strcmp(a, b);
#else
	return strcmp(a, b);
#endif
}
|
|
|
|
|
|
2000-08-07 20:58:24 +00:00
|
|
|
|
///
|
2000-03-07 01:14:37 +00:00
|
|
|
|
/// Lexicographically compare at most the first \p len characters of the
/// C strings \p a and \p b.
/// Thin wrapper around strncmp(): the result is negative, zero or positive
/// when the compared prefix of \p a sorts before, equal to or after that
/// of \p b respectively.
inline
int compare(char const * a, char const * b, unsigned int len)
{
	// CXX_GLOBAL_CSTD selects the unqualified strncmp spelling instead of
	// the std:: one (presumably for toolchains whose C library functions
	// are not declared in namespace std -- confirm against the build setup).
#ifndef CXX_GLOBAL_CSTD
	return std::strncmp(a, b, len);
#else
	return strncmp(a, b, len);
#endif
}
|
|
|
|
|
|
|
|
|
|
///
|
2003-10-06 15:43:21 +00:00
|
|
|
|
bool isStrInt(std::string const & str);
|
1999-10-02 16:21:10 +00:00
|
|
|
|
|
2003-10-06 15:43:21 +00:00
|
|
|
|
/// does the std::string represent an unsigned integer value ?
|
|
|
|
|
bool isStrUnsignedInt(std::string const & str);
|
2000-12-04 17:18:01 +00:00
|
|
|
|
|
2000-06-12 11:27:15 +00:00
|
|
|
|
///
|
2003-10-06 15:43:21 +00:00
|
|
|
|
bool isStrDbl(std::string const & str);
|
2000-06-12 11:27:15 +00:00
|
|
|
|
|
2006-10-22 18:47:19 +00:00
|
|
|
|
bool isHex(lyx::docstring const & str);
|
|
|
|
|
|
|
|
|
|
int hexToInt(lyx::docstring const & str);
|
|
|
|
|
|
2006-11-11 12:00:34 +00:00
|
|
|
|
/// is \p str pure ascii?
|
|
|
|
|
bool isAscii(docstring const & str);
|
|
|
|
|
|
2007-02-26 09:03:21 +00:00
|
|
|
|
/// Changes the case of \p c to lowercase.
|
|
|
|
|
/// Caution: Depends on the locale
|
2000-07-24 13:53:19 +00:00
|
|
|
|
char lowercase(char c);
|
|
|
|
|
|
2007-02-26 09:03:21 +00:00
|
|
|
|
/// Changes the case of \p c to uppercase.
|
|
|
|
|
/// Caution: Depends on the locale
|
2000-07-24 13:53:19 +00:00
|
|
|
|
char uppercase(char c);
|
|
|
|
|
|
2007-02-26 09:03:21 +00:00
|
|
|
|
/// Changes the case of \p c to lowercase.
|
|
|
|
|
/// Does not depend on the locale.
|
2006-09-03 14:09:24 +00:00
|
|
|
|
char_type lowercase(char_type c);
|
|
|
|
|
|
2007-02-26 09:03:21 +00:00
|
|
|
|
/// Changes the case of \p c to uppercase.
|
|
|
|
|
/// Does not depend on the locale.
|
2006-09-03 14:09:24 +00:00
|
|
|
|
char_type uppercase(char_type c);
|
|
|
|
|
|
2002-07-16 21:17:10 +00:00
|
|
|
|
/// same as lowercase(), but ignores locale
|
2003-10-06 15:43:21 +00:00
|
|
|
|
std::string const ascii_lowercase(std::string const &);
|
2006-12-15 16:09:05 +00:00
|
|
|
|
docstring const ascii_lowercase(docstring const &);
|
2002-07-16 21:17:10 +00:00
|
|
|
|
|
2007-02-26 09:03:21 +00:00
|
|
|
|
/// Changes the case of \p s to lowercase.
|
|
|
|
|
/// Caution: Depends on the locale
|
|
|
|
|
std::string const lowercase(std::string const & s);
|
1999-10-02 16:21:10 +00:00
|
|
|
|
|
2007-02-26 09:03:21 +00:00
|
|
|
|
/// Changes the case of \p s to lowercase.
|
|
|
|
|
/// Does not depend on the locale.
|
|
|
|
|
docstring const lowercase(docstring const & s);
|
|
|
|
|
|
|
|
|
|
/// Changes the case of \p s to uppercase.
|
|
|
|
|
/// Caution: Depends on the locale
|
|
|
|
|
std::string const uppercase(std::string const & s);
|
1999-12-15 06:12:28 +00:00
|
|
|
|
|
2007-01-05 17:11:32 +00:00
|
|
|
|
/// Does the string start with this prefix?
|
|
|
|
|
bool prefixIs(docstring const &, char_type);
|
|
|
|
|
|
2003-10-06 15:43:21 +00:00
|
|
|
|
/// Does the std::string start with this prefix?
|
|
|
|
|
bool prefixIs(std::string const &, std::string const &);
|
2007-01-05 17:11:32 +00:00
|
|
|
|
bool prefixIs(docstring const &, docstring const &);
|
2000-09-26 13:54:57 +00:00
|
|
|
|
|
1999-10-02 16:21:10 +00:00
|
|
|
|
/// Does the string end with this char?
|
2003-10-06 15:43:21 +00:00
|
|
|
|
bool suffixIs(std::string const &, char);
|
2007-01-05 17:11:32 +00:00
|
|
|
|
bool suffixIs(docstring const &, char_type);
|
1999-10-02 16:21:10 +00:00
|
|
|
|
|
2003-10-06 15:43:21 +00:00
|
|
|
|
/// Does the std::string end with this suffix?
|
|
|
|
|
bool suffixIs(std::string const &, std::string const &);
|
2000-09-26 13:54:57 +00:00
|
|
|
|
|
1999-10-02 16:21:10 +00:00
|
|
|
|
///
|
2006-10-22 10:15:23 +00:00
|
|
|
|
/// Does \p a contain \p b as a substring?
/// An empty \p b is found in every string, so the result is then true.
inline bool contains(std::string const & a, std::string const & b)
{
	return a.find(b) != std::string::npos;
}
|
2002-02-16 15:59:55 +00:00
|
|
|
|
|
2006-10-22 10:15:23 +00:00
|
|
|
|
/// Does \p a contain \p b as a substring?
/// docstring counterpart of the std::string overload; the answer is
/// whether docstring::find() locates \p b anywhere in \p a.
inline bool contains(docstring const & a, docstring const & b)
{
	return a.find(b) != docstring::npos;
}
|
|
|
|
|
|
|
|
|
|
/// Does the character \p b occur anywhere in \p a?
inline bool contains(std::string const & a, char b)
{
	return a.find(b) != std::string::npos;
}
|
|
|
|
|
|
|
|
|
|
/// Does the character \p b occur anywhere in \p a?
/// docstring counterpart of the (std::string, char) overload.
inline bool contains(docstring const & a, char_type b)
{
	return a.find(b) != docstring::npos;
}
|
|
|
|
|
|
2000-06-12 11:27:15 +00:00
|
|
|
|
///
|
2003-10-06 15:43:21 +00:00
|
|
|
|
bool containsOnly(std::string const &, std::string const &);
|
2000-06-12 11:27:15 +00:00
|
|
|
|
|
1999-10-02 16:21:10 +00:00
|
|
|
|
/** Extracts a token from this string at the nth delim.
|
2001-02-16 09:25:43 +00:00
|
|
|
|
Doesn't modify the original string. Similar to strtok.
|
|
|
|
|
Example:
|
|
|
|
|
\code
|
2002-07-21 15:51:07 +00:00
|
|
|
|
token("a;bc;d", ';', 1) == "bc";
|
|
|
|
|
token("a;bc;d", ';', 2) == "d";
|
2001-02-16 09:25:43 +00:00
|
|
|
|
\endcode
|
1999-10-02 16:21:10 +00:00
|
|
|
|
*/
|
2003-10-06 15:43:21 +00:00
|
|
|
|
std::string const token(std::string const & a, char delim, int n);
|
1999-10-02 16:21:10 +00:00
|
|
|
|
|
2006-10-21 00:16:43 +00:00
|
|
|
|
docstring const token(docstring const & a, char_type delim, int n);
|
1999-10-02 16:21:10 +00:00
|
|
|
|
|
|
|
|
|
/** Search a token in this string using the delim.
|
2001-02-16 09:25:43 +00:00
|
|
|
|
Doesn't modify the original string. Returns -1 in case of
|
2002-03-21 17:09:55 +00:00
|
|
|
|
failure.
|
2001-02-16 09:25:43 +00:00
|
|
|
|
Example:
|
|
|
|
|
\code
|
2002-07-21 15:51:07 +00:00
|
|
|
|
tokenPos("a;bc;d", ';', "bc") == 1;
|
|
|
|
|
tokenPos("a;bc;d", ';', "d") == 2;
|
2001-02-16 09:25:43 +00:00
|
|
|
|
\endcode
|
1999-10-02 16:21:10 +00:00
|
|
|
|
*/
|
2003-10-06 15:43:21 +00:00
|
|
|
|
int tokenPos(std::string const & a, char delim, std::string const & tok);
|
1999-10-02 16:21:10 +00:00
|
|
|
|
|
|
|
|
|
|
2001-02-16 09:25:43 +00:00
|
|
|
|
/// Substitute all \a oldchar with \a newchar
|
2003-10-06 15:43:21 +00:00
|
|
|
|
std::string const subst(std::string const & a, char oldchar, char newchar);
|
1999-10-02 16:21:10 +00:00
|
|
|
|
|
2006-09-03 07:02:38 +00:00
|
|
|
|
/// Substitute all \a oldchar with \a newchar
|
2006-10-21 00:16:43 +00:00
|
|
|
|
docstring const subst(docstring const & a, char_type oldchar, char_type newchar);
|
2006-09-03 07:02:38 +00:00
|
|
|
|
|
2001-02-16 09:25:43 +00:00
|
|
|
|
/// substitutes all instances of \a oldstr with \a newstr
|
2003-10-06 15:43:21 +00:00
|
|
|
|
std::string const subst(std::string const & a,
|
|
|
|
|
std::string const & oldstr, std::string const & newstr);
|
2000-09-26 13:54:57 +00:00
|
|
|
|
|
2006-09-03 07:02:38 +00:00
|
|
|
|
/// substitutes all instances of \a oldstr with \a newstr
|
2006-10-21 00:16:43 +00:00
|
|
|
|
docstring const subst(docstring const & a,
|
|
|
|
|
docstring const & oldstr, docstring const & newstr);
|
2006-09-03 07:02:38 +00:00
|
|
|
|
|
2006-10-09 09:15:37 +00:00
|
|
|
|
/** Trims characters off the end and beginning of a string.
|
|
|
|
|
\code
|
|
|
|
|
trim("ccabccc", "c") == "ab".
|
|
|
|
|
\endcode
|
|
|
|
|
*/
|
2006-10-21 00:16:43 +00:00
|
|
|
|
docstring const trim(docstring const & a, char const * p = " ");
|
2006-10-09 09:15:37 +00:00
|
|
|
|
|
2002-07-28 22:50:13 +00:00
|
|
|
|
/** Trims characters off the end and beginning of a string.
|
2001-02-16 09:25:43 +00:00
|
|
|
|
\code
|
2002-07-28 22:50:13 +00:00
|
|
|
|
trim("ccabccc", "c") == "ab".
|
2001-02-16 09:25:43 +00:00
|
|
|
|
\endcode
|
|
|
|
|
*/
|
2003-10-06 15:43:21 +00:00
|
|
|
|
std::string const trim(std::string const & a, char const * p = " ");
|
1999-10-02 16:21:10 +00:00
|
|
|
|
|
2002-07-28 22:50:13 +00:00
|
|
|
|
/** Trims characters off the end of a string.
|
2001-02-16 09:25:43 +00:00
|
|
|
|
\code
|
2002-07-28 22:50:13 +00:00
|
|
|
|
rtrim("abccc", "c") == "ab".
|
2001-02-16 09:25:43 +00:00
|
|
|
|
\endcode
|
|
|
|
|
*/
|
2003-10-06 15:43:21 +00:00
|
|
|
|
std::string const rtrim(std::string const & a, char const * p = " ");
|
2006-10-22 10:15:23 +00:00
|
|
|
|
docstring const rtrim(docstring const & a, char const * p = " ");
|
2002-07-28 22:50:13 +00:00
|
|
|
|
|
|
|
|
|
/** Trims characters off the beginning of a string.
|
|
|
|
|
\code
|
2006-10-22 10:15:23 +00:00
|
|
|
|
ltrim("ababcdef", "ab") == "cdef".
|
2002-07-28 22:50:13 +00:00
|
|
|
|
\endcode
|
|
|
|
|
*/
|
2003-10-06 15:43:21 +00:00
|
|
|
|
std::string const ltrim(std::string const & a, char const * p = " ");
|
2006-10-22 10:15:23 +00:00
|
|
|
|
docstring const ltrim(docstring const & a, char const * p = " ");
|
1999-10-02 16:21:10 +00:00
|
|
|
|
|
|
|
|
|
/** Splits the string by the first delim.
|
2001-02-16 09:25:43 +00:00
|
|
|
|
Splits the string by the first appearance of delim.
|
|
|
|
|
The leading string up to delim is returned in piece (not including
|
|
|
|
|
delim), while the original string is cut from after the delimiter.
|
|
|
|
|
Example:
|
|
|
|
|
\code
|
|
|
|
|
s1 = ""; s2 = split("a;bc", s1, ';') -> s1 == "a"; s2 == "bc";
|
|
|
|
|
\endcode
|
|
|
|
|
*/
|
2003-10-06 15:43:21 +00:00
|
|
|
|
std::string const split(std::string const & a, std::string & piece, char delim);
|
2006-10-11 18:32:32 +00:00
|
|
|
|
docstring const split(docstring const & a, docstring & piece, char_type delim);
|
1999-10-02 16:21:10 +00:00
|
|
|
|
|
|
|
|
|
/// Same as split but does not return a piece
|
2003-10-06 15:43:21 +00:00
|
|
|
|
std::string const split(std::string const & a, char delim);
|
1999-10-02 16:21:10 +00:00
|
|
|
|
|
|
|
|
|
/// Same as split but uses the last delim.
|
2003-10-06 15:43:21 +00:00
|
|
|
|
std::string const rsplit(std::string const & a, std::string & piece, char delim);
|
1999-10-02 16:21:10 +00:00
|
|
|
|
|
2006-11-12 13:42:20 +00:00
|
|
|
|
/// Escapes non ASCII chars and other problematic characters that cause
|
|
|
|
|
/// problems in latex labels.
|
2006-10-21 00:16:43 +00:00
|
|
|
|
docstring const escape(docstring const & lab);
|
2001-06-27 14:10:35 +00:00
|
|
|
|
|
2002-04-15 12:05:07 +00:00
|
|
|
|
/// gives a vector of stringparts which have the delimiter delim
|
2003-10-06 15:43:21 +00:00
|
|
|
|
std::vector<std::string> const getVectorFromString(std::string const & str,
|
|
|
|
|
std::string const & delim = std::string(","));
|
2006-12-17 10:52:04 +00:00
|
|
|
|
std::vector<docstring> const getVectorFromString(docstring const & str,
|
|
|
|
|
docstring const & delim = from_ascii(","));
|
2002-04-15 12:05:07 +00:00
|
|
|
|
|
|
|
|
|
// the same vice versa
|
2003-10-06 15:43:21 +00:00
|
|
|
|
std::string const getStringFromVector(std::vector<std::string> const & vec,
|
|
|
|
|
std::string const & delim = std::string(","));
|
2002-04-15 12:05:07 +00:00
|
|
|
|
|
2006-04-20 09:55:45 +00:00
|
|
|
|
/// Search \p search_token in \p str and return the position if it is
|
|
|
|
|
/// found, else -1. The last item in \p str must be "".
|
|
|
|
|
int findToken(char const * const str[], std::string const & search_token);
|
|
|
|
|
|
2006-06-20 08:39:16 +00:00
|
|
|
|
/// Convert internal line endings to line endings as expected by the OS
|
2006-10-21 00:16:43 +00:00
|
|
|
|
docstring const externalLineEnding(docstring const & str);
|
2006-06-20 08:39:16 +00:00
|
|
|
|
|
|
|
|
|
/// Convert line endings in any format to internal line endings
|
2006-10-21 00:16:43 +00:00
|
|
|
|
docstring const internalLineEnding(docstring const & str);
|
2006-06-20 08:39:16 +00:00
|
|
|
|
|
2005-01-06 15:40:49 +00:00
|
|
|
|
|
|
|
|
|
#ifdef I_AM_NOT_AFRAID_OF_HEADER_LIBRARIES
|
|
|
|
|
|
|
|
|
|
#include <boost/format.hpp>
|
|
|
|
|
|
|
|
|
|
template<class Arg1>
|
2006-10-21 00:16:43 +00:00
|
|
|
|
docstring bformat(docstring const & fmt, Arg1 arg1)
|
2005-01-06 15:40:49 +00:00
|
|
|
|
{
|
2006-09-11 08:54:10 +00:00
|
|
|
|
return (boost::basic_format<char_type>(fmt) % arg1).str();
|
2005-01-06 15:40:49 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
template<class Arg1, class Arg2>
|
2006-10-21 00:16:43 +00:00
|
|
|
|
docstring bformat(docstring const & fmt, Arg1 arg1, Arg2 arg2)
|
2005-01-06 15:40:49 +00:00
|
|
|
|
{
|
2006-09-11 08:54:10 +00:00
|
|
|
|
return (boost::basic_format<char_type>(fmt) % arg1 % arg2).str();
|
2005-01-06 15:40:49 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
template<class Arg1, class Arg2, class Arg3>
|
2006-10-21 00:16:43 +00:00
|
|
|
|
docstring bformat(docstring const & fmt, Arg1 arg1, Arg2 arg2, Arg3 arg3)
|
2005-01-06 15:40:49 +00:00
|
|
|
|
{
|
2006-09-11 08:54:10 +00:00
|
|
|
|
return (boost::basic_format<char_type>(fmt) % arg1 % arg2 % arg3).str();
|
2005-01-06 15:40:49 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
template<class Arg1, class Arg2, class Arg3, class Arg4>
|
2006-10-21 00:16:43 +00:00
|
|
|
|
docstring bformat(docstring const & fmt, Arg1 arg1, Arg2 arg2, Arg3 arg3, Arg4 arg4)
|
2005-01-06 15:40:49 +00:00
|
|
|
|
{
|
2006-09-11 08:54:10 +00:00
|
|
|
|
return (boost::basic_format<char_type>(fmt) % arg1 % arg2 % arg3 % arg4).str();
|
2005-01-06 15:40:49 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#else
|
|
|
|
|
|
|
|
|
|
template <class Arg1>
|
2006-10-21 00:16:43 +00:00
|
|
|
|
docstring bformat(docstring const & fmt, Arg1);
|
2005-01-06 15:40:49 +00:00
|
|
|
|
|
|
|
|
|
template <class Arg1, class Arg2>
|
2006-10-21 00:16:43 +00:00
|
|
|
|
docstring bformat(docstring const & fmt, Arg1, Arg2);
|
2005-01-06 15:40:49 +00:00
|
|
|
|
|
|
|
|
|
template <class Arg1, class Arg2, class Arg3>
|
2006-10-21 00:16:43 +00:00
|
|
|
|
docstring bformat(docstring const & fmt, Arg1, Arg2, Arg3);
|
2005-01-06 15:40:49 +00:00
|
|
|
|
|
|
|
|
|
template <class Arg1, class Arg2, class Arg3, class Arg4>
|
2006-10-21 00:16:43 +00:00
|
|
|
|
docstring bformat(docstring const & fmt, Arg1, Arg2, Arg3, Arg4);
|
2005-01-06 15:40:49 +00:00
|
|
|
|
|
|
|
|
|
#endif
|
2003-05-13 09:48:57 +00:00
|
|
|
|
|
2003-06-30 23:56:22 +00:00
|
|
|
|
} // namespace support
|
|
|
|
|
} // namespace lyx
|
|
|
|
|
|
1999-10-02 16:21:10 +00:00
|
|
|
|
#endif
|