2008-11-08 23:07:23 +01:00
|
|
|
// Copyright (c) 2008, Rodrigo Braz Monteiro
|
|
|
|
// All rights reserved.
|
|
|
|
//
|
|
|
|
// Redistribution and use in source and binary forms, with or without
|
|
|
|
// modification, are permitted provided that the following conditions are met:
|
|
|
|
//
|
|
|
|
// * Redistributions of source code must retain the above copyright notice,
|
|
|
|
// this list of conditions and the following disclaimer.
|
|
|
|
// * Redistributions in binary form must reproduce the above copyright notice,
|
|
|
|
// this list of conditions and the following disclaimer in the documentation
|
|
|
|
// and/or other materials provided with the distribution.
|
|
|
|
// * Neither the name of the Aegisub Group nor the names of its contributors
|
|
|
|
// may be used to endorse or promote products derived from this software
|
|
|
|
// without specific prior written permission.
|
|
|
|
//
|
|
|
|
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
|
|
|
// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
|
|
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
|
|
// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
|
|
|
// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
|
|
// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
|
|
// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
|
|
// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
|
|
// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
|
|
// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
|
|
|
// POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
//
|
|
|
|
// -----------------------------------------------------------------------------
|
|
|
|
//
|
|
|
|
// AEGISUB/ATHENASUB
|
|
|
|
//
|
|
|
|
// Website: http://www.aegisub.net
|
|
|
|
// Contact: mailto:amz@aegisub.net
|
|
|
|
//
|
|
|
|
|
|
|
|
#include "athenastring.h"
|
2008-11-09 19:48:37 +01:00
|
|
|
#include "exception.h"
|
|
|
|
#include <wx/string.h>
|
2008-11-08 23:07:23 +01:00
|
|
|
|
|
|
|
using namespace Athenasub;
|
|
|
|
|
|
|
|
|
|
|
|
String::String()
|
|
|
|
{
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
String::String(const char* utf8)
|
|
|
|
: std::basic_string<Character>(utf8)
|
|
|
|
{
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
String::String(const char* utf8,size_t bytes)
|
|
|
|
{
|
|
|
|
resize(bytes);
|
|
|
|
memcpy(GetCharPointer(0),utf8,bytes);
|
|
|
|
*GetCharPointer(bytes) = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
String::String(const basic_string<Character>& str)
|
|
|
|
: std::basic_string<Character>(str)
|
|
|
|
{
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
String::String(const wchar_t* utf16)
|
|
|
|
{
|
|
|
|
size_t len = GetUTF8Len(utf16);
|
|
|
|
resize(len);
|
|
|
|
UTF16toUTF8(utf16,GetCharPointer(0));
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
String::String(const wxString& wxstring)
|
|
|
|
{
|
|
|
|
const wchar_t* utf16 = wxstring.c_str();
|
|
|
|
size_t len = GetUTF8Len(utf16);
|
|
|
|
resize(len);
|
|
|
|
UTF16toUTF8(utf16,GetCharPointer(0));
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2008-11-16 01:58:08 +01:00
|
|
|
String::String(char character)
|
|
|
|
{
|
|
|
|
*this = std::string(character,1);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
String::String(wchar_t character)
|
|
|
|
{
|
|
|
|
wchar_t tmp[2];
|
|
|
|
tmp[0] = character;
|
|
|
|
tmp[1] = 0;
|
|
|
|
*this = String(tmp);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
String::String(int integer)
|
|
|
|
{
|
|
|
|
*this = IntegerToString(integer);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
String::String(float number)
|
|
|
|
{
|
|
|
|
*this = FloatToString(number);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
String::String(double number)
|
|
|
|
{
|
|
|
|
*this = FloatToString(number);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2008-11-08 23:07:23 +01:00
|
|
|
Character* String::GetCharPointer(size_t pos)
|
|
|
|
{
|
|
|
|
return &operator[](pos);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
wxString String::GetWxString() const
|
|
|
|
{
|
2008-11-13 03:13:48 +01:00
|
|
|
// TODO: optimize this to use UTF8ToUTF16()
|
2008-11-08 23:07:23 +01:00
|
|
|
return wxString(c_str(),wxConvUTF8);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool String::IsEmpty() const
|
|
|
|
{
|
|
|
|
return size()==0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
void String::SetSize(size_t size)
|
|
|
|
{
|
|
|
|
_Mysize = size;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
void String::Truncate(size_t size)
|
|
|
|
{
|
|
|
|
operator[](size) = 0;
|
|
|
|
SetSize(size);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool IsSpace(char chr)
|
|
|
|
{
|
|
|
|
return (chr == ' ' || chr == '\t' || chr == '\n' || chr == '\r');
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
String& String::Trim(bool fromRight)
|
|
|
|
{
|
|
|
|
int len = Length();
|
|
|
|
size_t start = 0;
|
|
|
|
size_t n = len;
|
|
|
|
|
|
|
|
if (fromRight) {
|
|
|
|
for (int i=len;--i>=0;) {
|
|
|
|
if (IsSpace(operator[](i))) n = i;
|
|
|
|
else break;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
for (int i=0;i<len;i++) {
|
|
|
|
if (IsSpace(operator[](i))) start = i+1;
|
|
|
|
else break;
|
|
|
|
}
|
|
|
|
n = len - start;
|
|
|
|
}
|
|
|
|
|
2008-11-15 04:55:58 +01:00
|
|
|
*this = String(substr(start,n));
|
2008-11-08 23:07:23 +01:00
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
String& String::TrimBoth()
|
|
|
|
{
|
|
|
|
return Trim(true).Trim(false);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
size_t String::Length() const
|
|
|
|
{
|
|
|
|
return size();
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
size_t String::UTF8Length() const
|
|
|
|
{
|
2008-11-09 19:48:37 +01:00
|
|
|
THROW_ATHENA_EXCEPTION(Exception::TODO);
|
2008-11-08 23:07:23 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool String::Contains(const String& string) const
|
|
|
|
{
|
|
|
|
return find(string) != npos;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
size_t String::Find(Character c) const
|
|
|
|
{
|
|
|
|
return find(c,0);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
String String::Left(size_t n) const
|
|
|
|
{
|
2008-11-15 04:55:58 +01:00
|
|
|
return String(substr(0,n));
|
2008-11-08 23:07:23 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
String String::Right(size_t n) const
|
|
|
|
{
|
|
|
|
size_t len = size();
|
2008-11-15 04:55:58 +01:00
|
|
|
return String(substr(len-n,n));
|
2008-11-08 23:07:23 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
String String::Mid(size_t start,size_t count) const
|
|
|
|
{
|
2008-11-15 04:55:58 +01:00
|
|
|
return String(substr(start,count));
|
2008-11-08 23:07:23 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool String::StartsWith(const String& string,bool caseSensitive) const
|
|
|
|
{
|
|
|
|
if (caseSensitive) {
|
2008-11-15 04:55:58 +01:00
|
|
|
String tmp = String(substr(0,string.size()));
|
2008-11-08 23:07:23 +01:00
|
|
|
return compare(0,string.size(),string) == 0;
|
|
|
|
} else {
|
2008-11-09 19:48:37 +01:00
|
|
|
return AsciiLower().StartsWith(string.AsciiLower(),true);
|
2008-11-08 23:07:23 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool String::EndsWith(const String& string,bool caseSensitive) const
|
|
|
|
{
|
|
|
|
if (caseSensitive) {
|
|
|
|
size_t strSize = string.size();
|
|
|
|
return compare(size() - strSize,strSize,string) == 0;
|
|
|
|
} else {
|
2008-11-09 19:48:37 +01:00
|
|
|
return AsciiLower().EndsWith(string.AsciiLower(),true);
|
2008-11-08 23:07:23 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
void String::WriteText(const Character* src,size_t len,size_t &pos)
|
|
|
|
{
|
|
|
|
char *dst = GetCharPointer(pos);
|
|
|
|
memcpy(dst,src,len*sizeof(Character));
|
|
|
|
pos += len;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
void String::WriteChar(const Character &src,size_t &pos)
|
|
|
|
{
|
|
|
|
char *dst = GetCharPointer(pos);
|
|
|
|
*dst = src;
|
|
|
|
pos++;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
void String::WriteNumber(Character *temp,int number,int pad,size_t &pos)
|
|
|
|
{
|
|
|
|
char *dst = GetCharPointer(pos);
|
|
|
|
|
|
|
|
// Write number backwards first
|
|
|
|
int div, value;
|
|
|
|
size_t len;
|
|
|
|
for (len=0;true;len++) {
|
|
|
|
div = number / 10;
|
|
|
|
value = number - (div*10);
|
|
|
|
temp[len] = (value + '0');
|
|
|
|
if (!div) break;
|
|
|
|
number = div;
|
|
|
|
}
|
|
|
|
len++;
|
|
|
|
|
|
|
|
// Pad with zeroes
|
|
|
|
pad -= (int)len;
|
|
|
|
for (int i=0;i<pad;i++) {
|
|
|
|
*dst++ = '0';
|
|
|
|
pos++;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Write number
|
|
|
|
for (size_t i=0;i<len;i++) {
|
|
|
|
*dst++ = temp[len-i-1];
|
|
|
|
pos++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool String::AsciiCompareNoCase(const Character *src) const
|
|
|
|
{
|
2008-11-15 05:33:22 +01:00
|
|
|
unsigned char mask = 0xDF; // 0xDF
|
|
|
|
unsigned char c1,c2;
|
2008-11-08 23:07:23 +01:00
|
|
|
size_t len = size();
|
|
|
|
for (size_t i=0;i<len;i++) {
|
|
|
|
// Abort on end of string 2
|
2008-11-15 05:33:22 +01:00
|
|
|
c2 = (unsigned char) operator[](i);
|
2008-11-08 23:07:23 +01:00
|
|
|
if (!c2) return false;
|
|
|
|
|
|
|
|
// Upper case both, this ONLY WORKS FOR ASCII
|
2008-11-15 05:33:22 +01:00
|
|
|
c1 = ((unsigned char)src[i]) & mask;
|
2008-11-08 23:07:23 +01:00
|
|
|
c2 = c2 & mask;
|
|
|
|
|
|
|
|
// Check them
|
|
|
|
if (c1 != c2) return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Equal strings
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool String::IsNumber() const
|
|
|
|
{
|
2008-11-09 19:48:37 +01:00
|
|
|
for (const char *chr = c_str();*chr;chr++) {
|
|
|
|
char cur = *chr;
|
|
|
|
if (cur < '0' || cur > '9') {
|
|
|
|
if (cur != '.' && cur != ',' && cur != '+' && cur != '-') {
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return true;
|
2008-11-08 23:07:23 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
//
|
|
|
|
|
|
|
|
const Character* String::StringPtrTrim(Character *chr,size_t len,size_t startPos)
|
|
|
|
{
|
|
|
|
// String metrics
|
|
|
|
Character *read = chr;
|
|
|
|
size_t start = startPos;
|
|
|
|
size_t end = len;
|
|
|
|
bool isStart = true;
|
|
|
|
bool isEnd = false;
|
|
|
|
Character cur;
|
|
|
|
|
|
|
|
// Search for spaces
|
|
|
|
for (size_t i=start;i<len;i++) {
|
|
|
|
cur = read[i];
|
|
|
|
bool isSpace = (cur == ' ');
|
|
|
|
if (isStart) {
|
|
|
|
if (isSpace) start++;
|
|
|
|
else isStart = false;
|
|
|
|
}
|
|
|
|
if (isEnd) {
|
|
|
|
if (!isSpace) isEnd = false;
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
if (isSpace) {
|
|
|
|
isEnd = true;
|
|
|
|
end = i;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Apply changes to pointer
|
|
|
|
if (isEnd) chr[end] = 0;
|
|
|
|
return chr + start;
|
|
|
|
}
|
|
|
|
|
|
|
|
const Character* String::StringTrim(String &str,size_t startPos)
|
|
|
|
{
|
|
|
|
// Get a pointer to the string data
|
|
|
|
Character *chr = const_cast<Character*> (str.c_str());
|
|
|
|
return StringPtrTrim(chr,str.Length(),startPos);
|
|
|
|
}
|
|
|
|
|
2008-11-09 19:48:37 +01:00
|
|
|
/*
|
2008-11-08 23:07:23 +01:00
|
|
|
String String::Lower() const
|
|
|
|
{
|
|
|
|
String tmp(*this);
|
|
|
|
tmp.MakeLower();
|
|
|
|
return tmp;
|
|
|
|
}
|
|
|
|
|
|
|
|
String String::Upper() const {
|
|
|
|
String tmp(*this);
|
|
|
|
tmp.MakeUpper();
|
|
|
|
return tmp;
|
|
|
|
}
|
|
|
|
|
|
|
|
void String::MakeUpper()
|
|
|
|
{
|
2008-11-09 19:48:37 +01:00
|
|
|
THROW_ATHENA_EXCEPTION(Exception::TODO);
|
2008-11-08 23:07:23 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
void String::MakeLower()
|
|
|
|
{
|
2008-11-09 19:48:37 +01:00
|
|
|
THROW_ATHENA_EXCEPTION(Exception::TODO);
|
|
|
|
}
|
|
|
|
*/
|
|
|
|
|
|
|
|
String String::AsciiLower() const
|
|
|
|
{
|
|
|
|
String tmp(*this);
|
|
|
|
tmp.AsciiMakeLower();
|
|
|
|
return tmp;
|
|
|
|
}
|
|
|
|
|
|
|
|
String String::AsciiUpper() const {
|
|
|
|
String tmp(*this);
|
|
|
|
tmp.AsciiMakeUpper();
|
|
|
|
return tmp;
|
|
|
|
}
|
|
|
|
|
|
|
|
void String::AsciiMakeUpper()
|
|
|
|
{
|
|
|
|
char* str = GetCharPointer(0);
|
|
|
|
for (int i=0; str[i]; str++) {
|
|
|
|
char cur = str[i];
|
|
|
|
if (cur >= 'a' && cur <= 'z') str[i] -= 32;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void String::AsciiMakeLower()
|
|
|
|
{
|
|
|
|
char* str = GetCharPointer(0);
|
|
|
|
for (int i=0; str[i]; str++) {
|
|
|
|
char cur = str[i];
|
|
|
|
if (cur >= 'A' && cur <= 'Z') str[i] += 32;
|
|
|
|
}
|
2008-11-08 23:07:23 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
///////////////
|
|
|
|
|
|
|
|
String String::operator += (const String &p)
|
|
|
|
{
|
|
|
|
append(p);
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
String String::operator += (const wxString &p)
|
|
|
|
{
|
|
|
|
append(String(p));
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
String String::operator += (const char* p)
|
|
|
|
{
|
|
|
|
append(p);
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
String String::operator += (const wchar_t* p)
|
|
|
|
{
|
|
|
|
append(String(p));
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
String String::operator += (const double &p)
|
|
|
|
{
|
|
|
|
append(FloatToString(p));
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
String String::operator += (const int &p)
|
|
|
|
{
|
|
|
|
append(IntegerToString(p));
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
String String::operator += (const Character &p)
|
|
|
|
{
|
|
|
|
append(1,p);
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
void Athenasub::operator <<(double &p1,String &p2)
|
|
|
|
{
|
|
|
|
p1 = atof(p2.c_str());
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
//////////////////////////////////
|
|
|
|
// Convert a string to an integer
|
|
|
|
int String::ToInteger() const
|
|
|
|
{
|
|
|
|
size_t len = Length();
|
|
|
|
int value = 0;
|
2008-11-10 04:37:15 +01:00
|
|
|
int mult = 1;
|
2008-11-08 23:07:23 +01:00
|
|
|
int chr;
|
2008-11-10 04:37:15 +01:00
|
|
|
bool firstChar = true;
|
2008-11-08 23:07:23 +01:00
|
|
|
const char *data = c_str();
|
|
|
|
for (size_t i=0;i<len;i++) {
|
2008-11-10 04:37:15 +01:00
|
|
|
if (data[i] == ' ') continue;
|
2008-11-08 23:07:23 +01:00
|
|
|
chr = (int)(data[i])-(int)'0';
|
|
|
|
if (chr >= 0 && chr <= 9) value = 10*value+chr;
|
2008-11-10 04:37:15 +01:00
|
|
|
else if (firstChar && data[i] == '-') mult = -1;
|
|
|
|
else if (firstChar && data[i] == '+') {
|
|
|
|
firstChar = false;
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
else THROW_ATHENA_EXCEPTION(Exception::Out_Of_Range);
|
|
|
|
firstChar = false;
|
2008-11-08 23:07:23 +01:00
|
|
|
}
|
2008-11-10 04:37:15 +01:00
|
|
|
return value * mult;
|
2008-11-08 23:07:23 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
//////////////////////////////////////
|
|
|
|
// Converts a substring to an integer
|
|
|
|
int String::SubToInteger(size_t start,size_t end) const
|
|
|
|
{
|
|
|
|
int value = 0;
|
|
|
|
int chr;
|
|
|
|
const char *data = c_str();
|
|
|
|
for (size_t i=start;i<end;i++) {
|
|
|
|
chr = (int)(data[i])-(int)'0';
|
|
|
|
if (chr >= 0 && chr <= 9) value = 10*value+chr;
|
|
|
|
}
|
|
|
|
return value;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
////////////////
|
|
|
|
// Pretty float
|
|
|
|
String String::PrettyFloat(String src)
|
|
|
|
{
|
|
|
|
if (src.Contains(".")) {
|
|
|
|
size_t len = src.Length();
|
|
|
|
while (src.EndsWith("0")) {
|
|
|
|
len--;
|
|
|
|
src.Truncate(len);
|
|
|
|
}
|
|
|
|
if (src.EndsWith(".")) {
|
|
|
|
len--;
|
|
|
|
src.Truncate(len);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return src;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
///////////////////
|
|
|
|
// Float to string
|
|
|
|
String String::FloatToString(float src)
|
|
|
|
{
|
2008-11-15 04:55:58 +01:00
|
|
|
return PrettyFloat(String(wxString::Format(_T("%f"),src)));
|
2008-11-08 23:07:23 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
String String::FloatToString(double src)
|
|
|
|
{
|
2008-11-15 04:55:58 +01:00
|
|
|
return PrettyFloat(String(wxString::Format(_T("%f"),src)));
|
2008-11-08 23:07:23 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/////////////////
|
|
|
|
// Int to string
|
|
|
|
String String::IntegerToString(int value)
|
|
|
|
{
|
2008-11-15 04:55:58 +01:00
|
|
|
return String(wxString::Format(_T("%i"),value));
|
2008-11-08 23:07:23 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
///////////////////////////////////////////////
|
|
|
|
// Get the UTF-8 length out of a UTF-16 string
|
|
|
|
size_t String::GetUTF8Len(const wchar_t *utf16)
|
|
|
|
{
|
|
|
|
size_t len = 0;
|
|
|
|
wchar_t curChar = utf16[0];
|
|
|
|
for (size_t i=0;curChar;) {
|
|
|
|
// 1 byte
|
|
|
|
if ((curChar & 0xFF80) == 0) len++;
|
|
|
|
|
|
|
|
// Surrogate pair UTF-16, 4 bytes
|
|
|
|
else if ((curChar & 0xFC00) == 0xD800) {
|
|
|
|
len += 4;
|
|
|
|
i++;
|
|
|
|
}
|
|
|
|
|
|
|
|
// 3 bytes
|
|
|
|
else if (curChar & 0xF800) len += 3;
|
|
|
|
|
|
|
|
// 2 bytes
|
|
|
|
else if (curChar & 0xFF80) len += 2;
|
|
|
|
|
|
|
|
// Get next
|
|
|
|
curChar = utf16[++i];
|
|
|
|
}
|
|
|
|
|
|
|
|
return len;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
///////////////////////////
|
|
|
|
// Convert UTF-16 to UTF-8
|
|
|
|
size_t String::UTF16toUTF8(const wchar_t *utf16,char *utf8)
|
|
|
|
{
|
|
|
|
wchar_t curChar = utf16[0];
|
|
|
|
size_t value;
|
|
|
|
size_t written = 0;
|
|
|
|
for (size_t i=0;;i++) {
|
|
|
|
// 1 byte
|
|
|
|
if ((curChar & 0xFF80) == 0) {
|
|
|
|
utf8[written] = char(curChar);
|
|
|
|
if (curChar == 0) break;
|
|
|
|
written++;
|
|
|
|
}
|
|
|
|
|
|
|
|
// 2 bytes
|
|
|
|
else if ((curChar & 0xF800) == 0) {
|
|
|
|
utf8[written] = char(((curChar & 0x07C0) >> 6) | 0xC0);
|
|
|
|
utf8[written+1] = char((curChar & 0x003F) | 0x80);
|
|
|
|
written += 2;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Surrogate pair UTF-16
|
|
|
|
else if ((curChar & 0xFC00) == 0xD800) {
|
|
|
|
// Read
|
|
|
|
value = (curChar - 0xD800) << 10;
|
|
|
|
value |= utf16[i+1] & 0x3FF;
|
|
|
|
i++;
|
|
|
|
|
|
|
|
// Write
|
|
|
|
utf8[written] = char(((value & 0x1C0000) >> 18) | 0xF0);
|
|
|
|
utf8[written+1] = char(((value & 0x03F000) >> 12) | 0x80);
|
|
|
|
utf8[written+2] = char(((value & 0x000FC0) >> 6) | 0x80);
|
|
|
|
utf8[written+3] = char((value & 0x00003F) | 0x80);
|
|
|
|
written += 4;
|
|
|
|
}
|
|
|
|
|
|
|
|
// 3 bytes
|
|
|
|
else if (curChar & 0xF800) {
|
|
|
|
utf8[written] = char(((curChar & 0xF000) >> 12) | 0xE0);
|
|
|
|
utf8[written+1] = char(((curChar & 0x0FC0) >> 6) | 0x80);
|
|
|
|
utf8[written+2] = char((curChar & 0x003F) | 0x80);
|
|
|
|
written += 3;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Get next
|
|
|
|
curChar = utf16[i+1];
|
|
|
|
}
|
|
|
|
return written;
|
|
|
|
}
|
|
|
|
|
2008-11-13 03:13:48 +01:00
|
|
|
size_t String::UTF8toUTF16(const char *utf8,wchar_t *utf16)
|
|
|
|
{
|
|
|
|
(void) utf8;
|
|
|
|
(void) utf16;
|
|
|
|
THROW_ATHENA_EXCEPTION(Exception::TODO);
|
|
|
|
}
|