2002-05-24 12:53:12 +00:00
|
|
|
/*
 *
 * Copyright (c) 1998-2002
 * John Maddock
 *
 * Use, modification and distribution are subject to the
 * Boost Software License, Version 1.0. (See accompanying file
 * LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
 *
 */
|
|
|
|
|
|
|
|
/*
 *   LOCATION:    see http://www.boost.org for most recent version.
 *   FILE:        wide_posix_api.cpp
 *   VERSION:     see <boost/version.hpp>
 *   DESCRIPTION: Implements the wide character POSIX API wrappers.
 */
|
|
|
|
|
|
|
|
#define BOOST_REGEX_SOURCE
|
|
|
|
|
|
|
|
#include <boost/regex/config.hpp>
|
|
|
|
|
|
|
|
#ifndef BOOST_NO_WREGEX
|
|
|
|
|
|
|
|
#include <boost/regex.hpp>
|
2008-09-30 18:01:03 +00:00
|
|
|
#include <boost/cregex.hpp>
|
2002-05-24 12:53:12 +00:00
|
|
|
|
|
|
|
#include <cwchar>
|
|
|
|
#include <cstring>
|
|
|
|
#include <cstdio>
|
|
|
|
|
2011-06-05 12:59:35 +00:00
|
|
|
#ifdef BOOST_INTEL
|
|
|
|
#pragma warning(disable:981)
|
|
|
|
#endif
|
|
|
|
|
2009-11-07 11:55:44 +00:00
|
|
|
#if defined(BOOST_NO_STDC_NAMESPACE) || defined(__NetBSD__)
|
2006-03-05 18:22:35 +00:00
|
|
|
namespace std{
|
|
|
|
# ifndef BOOST_NO_SWPRINTF
|
|
|
|
using ::swprintf;
|
|
|
|
# endif
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
2002-05-24 12:53:12 +00:00
|
|
|
namespace boost{
|
|
|
|
|
|
|
|
namespace {

// Sentinel written to regex_tW::re_magic by regcompW; the other functions in
// this file compare re_magic against it before treating regex_tW::guts as a
// compiled expression.  Never modified, hence const.
const unsigned int wmagic_value = 28631;

// Symbolic names of the POSIX-API error codes, indexed by the numeric code
// (0 .. REG_E_UNKNOWN).  regerrorW uses this table for both the REG_ITOA
// (code -> name) and REG_ATOI (name -> code) conversions, so the order of
// the entries must not change.
const wchar_t* const wnames[] = {
   L"REG_NOERROR",
   L"REG_NOMATCH",
   L"REG_BADPAT",
   L"REG_ECOLLATE",
   L"REG_ECTYPE",
   L"REG_EESCAPE",
   L"REG_ESUBREG",
   L"REG_EBRACK",
   L"REG_EPAREN",
   L"REG_EBRACE",
   L"REG_BADBR",
   L"REG_ERANGE",
   L"REG_ESPACE",
   L"REG_BADRPT",
   L"REG_EEND",
   L"REG_ESIZE",
   L"REG_ERPAREN",
   L"REG_EMPTY",
   L"REG_ECOMPLEXITY",
   L"REG_ESTACK",
   L"REG_E_PERL",
   L"REG_E_UNKNOWN",
};

}
|
|
|
|
|
2011-11-20 18:58:15 +00:00
|
|
|
// The concrete expression type used by the wide-character POSIX wrappers:
// a basic_regex over wchar_t using c_regex_traits<wchar_t>.  regex_tW::guts
// is allocated as, and cast back to, a pointer to this type throughout
// this file.
typedef boost::basic_regex<wchar_t, c_regex_traits<wchar_t> > wc_regex_type;
|
2008-09-30 18:01:03 +00:00
|
|
|
|
2002-05-24 12:53:12 +00:00
|
|
|
//
// regcompW: compile the wide-character pattern starting at ptr into
// *expression.
//
//   expression  receives the compiled expression (guts), the match flags to
//               apply at search time (eflags), the sub-expression count
//               (re_nsub) and the magic value marking it as compiled.  When
//               REG_PEND is set in f, expression->re_endp is read as the end
//               of the pattern.
//   ptr         start of the pattern; treated as null-terminated unless
//               REG_PEND is set.
//   f           bitmask of REG_* compile flags.
//
// Returns 0 on success, otherwise a non-zero error code; on failure the
// expression is released via regfreeW before returning.
//
BOOST_REGEX_DECL int BOOST_REGEX_CCALL regcompW(regex_tW* expression, const wchar_t* ptr, int f)
{
   // Allocate a fresh expression object unless *expression already holds one.
   if(expression->re_magic != wmagic_value)
   {
      expression->guts = 0;
#ifndef BOOST_NO_EXCEPTIONS
      try
      {
#endif
         expression->guts = new wc_regex_type();
#ifndef BOOST_NO_EXCEPTIONS
      }
      catch(...)
      {
         return REG_ESPACE;
      }
#else
      if(0 == expression->guts)
         return REG_E_MEMORY;
#endif
   }

   // Choose the base syntax: REG_PERLEX starts from 0, otherwise
   // REG_EXTENDED selects extended syntax and the fallback is basic.
   boost::uint_fast32_t syntax_flags;
   if(f & REG_PERLEX)
      syntax_flags = 0;
   else if(f & REG_EXTENDED)
      syntax_flags = wregex::extended;
   else
      syntax_flags = wregex::basic;

   // Search-time flags remembered for regexecW.
   if(f & REG_NEWLINE)
      expression->eflags = match_not_dot_newline;
   else
      expression->eflags = match_default;

   // Translate the remaining REG_* options into syntax flags.
   if(f & REG_NOCOLLATE)
   {
      syntax_flags |= wregex::nocollate;
#ifndef BOOST_REGEX_V3
      syntax_flags &= ~wregex::collate;
#endif
   }
   if(f & REG_NOSUB)
      syntax_flags |= wregex::nosubs;
   if(f & REG_NOSPEC)
      syntax_flags |= wregex::literal;
   if(f & REG_ICASE)
      syntax_flags |= wregex::icase;
   if(f & REG_ESCAPE_IN_LISTS)
      syntax_flags &= ~wregex::no_escape_in_lists;
   if(f & REG_NEWLINE_ALT)
      syntax_flags |= wregex::newline_alt;

   // End of the pattern: caller-supplied with REG_PEND, otherwise the
   // terminating null of ptr.
   const wchar_t* const pattern_end =
      (f & REG_PEND) ? expression->re_endp : ptr + std::wcslen(ptr);

   int status;

#ifndef BOOST_NO_EXCEPTIONS
   try
   {
#endif
      // Mark the structure as owning guts before compiling, so that the
      // regfreeW call below releases it if compilation fails.
      expression->re_magic = wmagic_value;
      wc_regex_type* const re = static_cast<wc_regex_type*>(expression->guts);
      re->set_expression(ptr, pattern_end, syntax_flags);
      expression->re_nsub = re->mark_count() - 1;
      status = re->error_code();
#ifndef BOOST_NO_EXCEPTIONS
   }
   catch(const boost::regex_error& be)
   {
      status = be.code();
   }
   catch(...)
   {
      status = REG_E_UNKNOWN;
   }
#endif

   if(status)
      regfreeW(expression);
   return status;
}
|
|
|
|
|
|
|
|
//
// regerrorW: convert between POSIX-API error codes and wide-character text.
//
//   code      an error code, optionally OR-ed with REG_ITOA, or REG_ATOI:
//               - with REG_ITOA the symbolic name of the code (e.g.
//                 L"REG_BADPAT") is produced;
//               - REG_ATOI looks up the name stored in e->re_endp and
//                 produces its numeric code as decimal text (L"0" when the
//                 name is not found); only when swprintf is available;
//               - otherwise the error message for the code is produced,
//                 taken from the traits of *e when e is a compiled
//                 expression and from the default messages otherwise.
//   e         the expression the error relates to; may be null except that
//             REG_ATOI then returns 0.
//   buf       destination buffer; only written when the text, including its
//             terminating null, fits in buf_size characters.
//   buf_size  capacity of buf in wide characters.
//
// Returns the number of wide characters (including the terminator) needed
// to hold the text, or 0 when the code is out of range.
//
BOOST_REGEX_DECL regsize_t BOOST_REGEX_CCALL regerrorW(int code, const regex_tW* e, wchar_t* buf, regsize_t buf_size)
{
   std::size_t result = 0;
   if(code & REG_ITOA)
   {
      code &= ~REG_ITOA;
      if((code <= (int)REG_E_UNKNOWN) && (code >= 0))
      {
         result = std::wcslen(wnames[code]) + 1;
         if(buf_size >= result)
#if BOOST_WORKAROUND(BOOST_MSVC, >= 1400) && !defined(_WIN32_WCE) && !defined(UNDER_CE)
            ::wcscpy_s(buf, buf_size, wnames[code]);
#else
            std::wcscpy(buf, wnames[code]);
#endif
      }
      // result is still 0 here when the code was out of range.
      return result;
   }
#if !defined(BOOST_NO_SWPRINTF)
   if(code == REG_ATOI)
   {
      wchar_t localbuf[5];
      if(e == 0)
         return 0;
      // Find the code whose symbolic name matches e->re_endp; an unknown
      // name is reported as 0.
      int index = 0;
      for(int i = 0; i <= (int)REG_E_UNKNOWN; ++i)
      {
         if(std::wcscmp(e->re_endp, wnames[i]) == 0)
         {
            index = i;
            break;
         }
      }
#if defined(_WIN32_WCE) && !defined(UNDER_CE)
      (std::swprintf)(localbuf, L"%d", index);
#else
      (std::swprintf)(localbuf, 5, L"%d", index);
#endif
      if(std::wcslen(localbuf) < buf_size)
#if BOOST_WORKAROUND(BOOST_MSVC, >= 1400) && !defined(_WIN32_WCE) && !defined(UNDER_CE)
         ::wcscpy_s(buf, buf_size, localbuf);
#else
         std::wcscpy(buf, localbuf);
#endif
      return std::wcslen(localbuf) + 1;
   }
#endif
   // Only codes in [0, REG_E_UNKNOWN] have a message.  The lower bound
   // matches the REG_ITOA branch above and keeps negative codes away from
   // the error-string lookup.
   if((code <= (int)REG_E_UNKNOWN) && (code >= 0))
   {
      std::string p;
      if((e) && (e->re_magic == wmagic_value))
         p = static_cast<wc_regex_type*>(e->guts)->get_traits().error_string(static_cast< ::boost::regex_constants::error_type>(code));
      else
      {
         p = re_detail::get_default_error_string(static_cast< ::boost::regex_constants::error_type>(code));
      }
      std::size_t len = p.size();
      if(len < buf_size)
      {
         // Copies the terminating null as well, widening each char.
         re_detail::copy(p.c_str(), p.c_str() + p.size() + 1, buf);
      }
      return len + 1;
   }
   // Out-of-range code: hand back an empty string if there is room for it.
   if(buf_size)
      *buf = 0;
   return 0;
}
|
|
|
|
|
|
|
|
//
// regexecW: search the wide-character string buf for the expression held
// in *expression.
//
//   expression  an expression previously compiled by regcompW.
//   buf         the text to search; null-terminated unless REG_STARTEND is
//               set.
//   n           number of elements available in array.
//   array       receives the match offsets (relative to buf): element 0 is
//               the whole match, the following elements are the marked
//               sub-expressions; entries that did not take part in the
//               match, or that lie beyond re_nsub, are set to -1.  With
//               REG_STARTEND, array[0].rm_so / rm_eo are read on entry as
//               the range of buf to search.
//   eflags      bitmask of REG_NOTBOL, REG_NOTEOL and REG_STARTEND.
//
// Returns 0 when a match was found, REG_NOMATCH when not, REG_BADPAT when
// *expression does not hold a compiled expression, and REG_E_UNKNOWN when
// the search threw an exception.
//
BOOST_REGEX_DECL int BOOST_REGEX_CCALL regexecW(const regex_tW* expression, const wchar_t* buf, regsize_t n, regmatch_t* array, int eflags)
{
#ifdef BOOST_MSVC
#pragma warning(push)
#pragma warning(disable:4267)
#endif
   // Refuse to search with something regcompW did not (successfully)
   // compile.  This used to fall out of the function with the value 0,
   // which callers read as "match found" even though array was never
   // filled in.
   if(expression->re_magic != wmagic_value)
      return REG_BADPAT;

   bool result = false;
   match_flag_type flags = match_default | expression->eflags;
   const wchar_t* end;
   const wchar_t* start;
   wcmatch m;

   if(eflags & REG_NOTBOL)
      flags |= match_not_bol;
   if(eflags & REG_NOTEOL)
      flags |= match_not_eol;
   if(eflags & REG_STARTEND)
   {
      // The caller passes the sub-range to search in array[0].
      start = buf + array[0].rm_so;
      end = buf + array[0].rm_eo;
   }
   else
   {
      start = buf;
      end = buf + std::wcslen(buf);
   }

#ifndef BOOST_NO_EXCEPTIONS
   try{
#endif
   result = regex_search(start, end, m, *static_cast<wc_regex_type*>(expression->guts), flags);
#ifndef BOOST_NO_EXCEPTIONS
   } catch(...)
   {
      return REG_E_UNKNOWN;
   }
#endif
   if(result)
   {
      // extract what matched:
      std::size_t i;
      for(i = 0; (i < n) && (i < expression->re_nsub + 1); ++i)
      {
         array[i].rm_so = (m[i].matched == false) ? -1 : (m[i].first - buf);
         array[i].rm_eo = (m[i].matched == false) ? -1 : (m[i].second - buf);
      }
      // and set anything else to -1:
      for(i = expression->re_nsub + 1; i < n; ++i)
      {
         array[i].rm_so = -1;
         array[i].rm_eo = -1;
      }
      return 0;
   }
   return REG_NOMATCH;
#ifdef BOOST_MSVC
#pragma warning(pop)
#endif
}
|
|
|
|
|
|
|
|
//
// regfreeW: release the expression held in *expression.
//
// The compiled expression behind guts is deleted only when re_magic shows
// that regcompW set it up; re_magic is cleared in every case, so calling
// this again on the same structure does not delete twice.
//
BOOST_REGEX_DECL void BOOST_REGEX_CCALL regfreeW(regex_tW* expression)
{
   const bool holds_compiled_regex = (expression->re_magic == wmagic_value);
   if(holds_compiled_regex)
      delete static_cast<wc_regex_type*>(expression->guts);

   expression->re_magic = 0;
}
|
|
|
|
|
|
|
|
} // namespace boost;
|
|
|
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
|
|
|
2004-02-05 09:14:22 +00:00
|
|
|
|