//
// UTFString.h
//
// Library: Foundation
// Package: Text
// Module: UTFString
//
// Definitions of strings for UTF encodings.
//
// Copyright (c) 2004-2006, Applied Informatics Software Engineering GmbH.
// and Contributors.
//
// SPDX-License-Identifier: BSL-1.0
//
#ifndef Foundation_UTFString_INCLUDED
#define Foundation_UTFString_INCLUDED
#include "Poco/Foundation.h"
#include "Poco/Types.h"
#include <string>
namespace Poco {
struct UTF16CharTraits
{
2017-09-01 20:22:27 +02:00
typedef std::fpos<std::mbstate_t> u16streampos;
typedef UInt16 char_type;
typedef int int_type;
typedef std::streamoff off_type;
typedef u16streampos pos_type;
typedef std::mbstate_t state_type;
static void assign(char_type& c1, const char_type& c2)
{
c1 = c2;
}
2022-07-07 11:18:20 +02:00
static bool eq(char_type c1, char_type c2)
{
return c1 == c2;
}
2022-07-07 11:18:20 +02:00
static bool lt(char_type c1, char_type c2)
{
return c1 < c2;
}
2017-10-18 23:15:20 +02:00
static int compare(const char_type* s1, const char_type* s2, std::size_t n)
{
for (; n; --n, ++s1, ++s2)
{
if (lt(*s1, *s2))
return -1;
if (lt(*s2, *s1))
return 1;
}
return 0;
}
2017-10-18 23:15:20 +02:00
static std::size_t length(const char_type* s)
{
2017-10-18 23:15:20 +02:00
std::size_t len = 0;
for (; !eq(*s, char_type(0)); ++s)
++len;
return len;
}
2017-10-18 23:15:20 +02:00
static const char_type* find(const char_type* s, std::size_t n, const char_type& a)
{
for (; n; --n)
{
if (eq(*s, a))
return s;
++s;
}
return 0;
}
2017-10-18 23:15:20 +02:00
static char_type* move(char_type* s1, const char_type* s2, std::size_t n)
{
char_type* r = s1;
if (s1 < s2)
{
for (; n; --n, ++s1, ++s2)
assign(*s1, *s2);
}
else if (s2 < s1)
{
s1 += n;
s2 += n;
for (; n; --n)
assign(*--s1, *--s2);
}
return r;
}
2017-10-18 23:15:20 +02:00
static char_type* copy(char_type* s1, const char_type* s2, std::size_t n)
{
poco_assert(s2 < s1 || s2 >= s1 + n);
char_type* r = s1;
for (; n; --n, ++s1, ++s2)
assign(*s1, *s2);
return r;
}
2017-10-18 23:15:20 +02:00
static char_type* assign(char_type* s, std::size_t n, char_type a)
{
char_type* r = s;
for (; n; --n, ++s)
assign(*s, a);
return r;
}
static int_type not_eof(int_type c)
{
return eq_int_type(c, eof()) ? ~eof() : c;
}
2022-07-07 11:18:20 +02:00
static char_type to_char_type(int_type c)
{
return char_type(c);
}
2022-07-07 11:18:20 +02:00
static int_type to_int_type(char_type c)
{
return int_type(c);
}
2022-07-07 11:18:20 +02:00
static bool eq_int_type(int_type c1, int_type c2)
{
return c1 == c2;
}
2022-07-07 11:18:20 +02:00
static int_type eof()
{
return int_type(0xDFFF);
}
};
struct UTF32CharTraits
{
2017-09-01 20:22:27 +02:00
typedef std::fpos<std::mbstate_t> u32streampos;
typedef UInt32 char_type;
typedef int int_type;
typedef std::streamoff off_type;
typedef u32streampos pos_type;
typedef std::mbstate_t state_type;
static void assign(char_type& c1, const char_type& c2)
{
c1 = c2;
}
2022-07-07 11:18:20 +02:00
static bool eq(char_type c1, char_type c2)
{
return c1 == c2;
}
2022-07-07 11:18:20 +02:00
static bool lt(char_type c1, char_type c2)
{
return c1 < c2;
}
2017-10-18 23:15:20 +02:00
static int compare(const char_type* s1, const char_type* s2, std::size_t n)
{
for (; n; --n, ++s1, ++s2)
{
if (lt(*s1, *s2))
return -1;
if (lt(*s2, *s1))
return 1;
}
return 0;
}
2017-10-18 23:15:20 +02:00
static std::size_t length(const char_type* s)
{
2017-10-18 23:15:20 +02:00
std::size_t len = 0;
for (; !eq(*s, char_type(0)); ++s)
++len;
return len;
}
2017-10-18 23:15:20 +02:00
static const char_type* find(const char_type* s, std::size_t n, const char_type& a)
{
for (; n; --n)
{
if (eq(*s, a))
return s;
++s;
}
return 0;
}
2017-10-18 23:15:20 +02:00
static char_type* move(char_type* s1, const char_type* s2, std::size_t n)
{
char_type* r = s1;
if (s1 < s2)
{
for (; n; --n, ++s1, ++s2)
assign(*s1, *s2);
}
else if (s2 < s1)
{
s1 += n;
s2 += n;
for (; n; --n)
assign(*--s1, *--s2);
}
return r;
}
2017-10-18 23:15:20 +02:00
static char_type* copy(char_type* s1, const char_type* s2, std::size_t n)
{
poco_assert(s2 < s1 || s2 >= s1 + n);
char_type* r = s1;
for (; n; --n, ++s1, ++s2)
assign(*s1, *s2);
return r;
}
2017-10-18 23:15:20 +02:00
static char_type* assign(char_type* s, std::size_t n, char_type a)
{
char_type* r = s;
for (; n; --n, ++s)
assign(*s, a);
return r;
}
static int_type not_eof(int_type c)
{
return eq_int_type(c, eof()) ? ~eof() : c;
}
2022-07-07 11:18:20 +02:00
static char_type to_char_type(int_type c)
{
return char_type(c);
}
2022-07-07 11:18:20 +02:00
static int_type to_int_type(char_type c)
{
return int_type(c);
}
2022-07-07 11:18:20 +02:00
static bool eq_int_type(int_type c1, int_type c2)
{
return c1 == c2;
}
2022-07-07 11:18:20 +02:00
static int_type eof()
{
return int_type(0xDFFF);
}
};
//#if defined(POCO_ENABLE_CPP11) //TODO
// typedef char16_t UTF16Char;
// typedef std::u16string UTF16String;
// typedef char32_t UTF32Char;
// typedef std::u32string UTF32String;
//#else
// Select the character and string types used for UTF-16 and UTF-32 text.
// wchar_t/std::wstring is used for the encoding whose code unit size matches
// sizeof(wchar_t); the other encoding (or both, if POCO_NO_WSTRING is
// defined) uses a fixed-width integer type with the custom traits class.
#ifdef POCO_NO_WSTRING
	typedef Poco::UInt16                                  UTF16Char;
	typedef std::basic_string<UTF16Char, UTF16CharTraits> UTF16String;
	typedef UInt32                                        UTF32Char;
	typedef std::basic_string<UTF32Char, UTF32CharTraits> UTF32String;
#else // POCO_NO_WSTRING
	#if defined(POCO_OS_FAMILY_WINDOWS)
		typedef wchar_t                                       UTF16Char;
		typedef std::wstring                                  UTF16String;
		typedef UInt32                                        UTF32Char;
		typedef std::basic_string<UTF32Char, UTF32CharTraits> UTF32String;
	#elif defined(__SIZEOF_WCHAR_T__) //gcc
		#if (__SIZEOF_WCHAR_T__ == 2)
			typedef wchar_t                                       UTF16Char;
			typedef std::wstring                                  UTF16String;
			typedef UInt32                                        UTF32Char;
			typedef std::basic_string<UTF32Char, UTF32CharTraits> UTF32String;
		#elif (__SIZEOF_WCHAR_T__ == 4)
			typedef Poco::UInt16                                  UTF16Char;
			typedef std::basic_string<UTF16Char, UTF16CharTraits> UTF16String;
			typedef wchar_t                                       UTF32Char;
			typedef std::wstring                                  UTF32String;
		#else // wchar_t matches neither encoding: do not use it at all
			typedef Poco::UInt16                                  UTF16Char;
			typedef std::basic_string<UTF16Char, UTF16CharTraits> UTF16String;
			typedef UInt32                                        UTF32Char;
			typedef std::basic_string<UTF32Char, UTF32CharTraits> UTF32String;
		#endif
	#else // default to 32-bit wchar_t
		typedef Poco::UInt16                                  UTF16Char;
		typedef std::basic_string<UTF16Char, UTF16CharTraits> UTF16String;
		typedef wchar_t                                       UTF32Char;
		typedef std::wstring                                  UTF32String;
	#endif //POCO_OS_FAMILY_WINDOWS
#endif //POCO_NO_WSTRING
//#endif // POCO_ENABLE_CPP11
} // namespace Poco
#endif // Foundation_UTFString_INCLUDED