623 lines
15 KiB
C++
623 lines
15 KiB
C++
/*
|
|
* Copyright (C) 2005 The Android Open Source Project
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
#include <utils/String16.h>
|
|
|
|
#include <utils/Debug.h>
|
|
#include <utils/Log.h>
|
|
#include <utils/String8.h>
|
|
#include <utils/TextOutput.h>
|
|
#include <utils/threads.h>
|
|
|
|
#include <private/utils/Static.h>
|
|
|
|
#ifdef HAVE_WINSOCK
|
|
# undef nhtol
|
|
# undef htonl
|
|
# undef nhtos
|
|
# undef htons
|
|
|
|
# ifdef HAVE_LITTLE_ENDIAN
|
|
# define ntohl(x) ( ((x) << 24) | (((x) >> 24) & 255) | (((x) << 8) & 0xff0000) | (((x) >> 8) & 0xff00) )
|
|
# define htonl(x) ntohl(x)
|
|
# define ntohs(x) ( (((x) << 8) & 0xff00) | (((x) >> 8) & 255) )
|
|
# define htons(x) ntohs(x)
|
|
# else
|
|
# define ntohl(x) (x)
|
|
# define htonl(x) (x)
|
|
# define ntohs(x) (x)
|
|
# define htons(x) (x)
|
|
# endif
|
|
#else
|
|
# include <netinet/in.h>
|
|
#endif
|
|
|
|
#include <memory.h>
|
|
#include <stdio.h>
|
|
#include <ctype.h>
|
|
|
|
// ---------------------------------------------------------------------------
|
|
|
|
int strcmp16(const char16_t *s1, const char16_t *s2)
|
|
{
|
|
char16_t ch;
|
|
int d = 0;
|
|
|
|
while ( 1 ) {
|
|
d = (int)(ch = *s1++) - (int)*s2++;
|
|
if ( d || !ch )
|
|
break;
|
|
}
|
|
|
|
return d;
|
|
}
|
|
|
|
int strncmp16(const char16_t *s1, const char16_t *s2, size_t n)
|
|
{
|
|
char16_t ch;
|
|
int d = 0;
|
|
|
|
while ( n-- ) {
|
|
d = (int)(ch = *s1++) - (int)*s2++;
|
|
if ( d || !ch )
|
|
break;
|
|
}
|
|
|
|
return d;
|
|
}
|
|
|
|
char16_t *strcpy16(char16_t *dst, const char16_t *src)
|
|
{
|
|
char16_t *q = dst;
|
|
const char16_t *p = src;
|
|
char16_t ch;
|
|
|
|
do {
|
|
*q++ = ch = *p++;
|
|
} while ( ch );
|
|
|
|
return dst;
|
|
}
|
|
|
|
size_t strlen16(const char16_t *s)
|
|
{
|
|
const char16_t *ss = s;
|
|
while ( *ss )
|
|
ss++;
|
|
return ss-s;
|
|
}
|
|
|
|
|
|
char16_t *strncpy16(char16_t *dst, const char16_t *src, size_t n)
|
|
{
|
|
char16_t *q = dst;
|
|
const char16_t *p = src;
|
|
char ch;
|
|
|
|
while (n) {
|
|
n--;
|
|
*q++ = ch = *p++;
|
|
if ( !ch )
|
|
break;
|
|
}
|
|
|
|
*q = 0;
|
|
|
|
return dst;
|
|
}
|
|
|
|
size_t strnlen16(const char16_t *s, size_t maxlen)
|
|
{
|
|
const char16_t *ss = s;
|
|
|
|
/* Important: the maxlen test must precede the reference through ss;
|
|
since the byte beyond the maximum may segfault */
|
|
while ((maxlen > 0) && *ss) {
|
|
ss++;
|
|
maxlen--;
|
|
}
|
|
return ss-s;
|
|
}
|
|
|
|
int strzcmp16(const char16_t *s1, size_t n1, const char16_t *s2, size_t n2)
|
|
{
|
|
const char16_t* e1 = s1+n1;
|
|
const char16_t* e2 = s2+n2;
|
|
|
|
while (s1 < e1 && s2 < e2) {
|
|
const int d = (int)*s1++ - (int)*s2++;
|
|
if (d) {
|
|
return d;
|
|
}
|
|
}
|
|
|
|
return n1 < n2
|
|
? (0 - (int)*s2)
|
|
: (n1 > n2
|
|
? ((int)*s1 - 0)
|
|
: 0);
|
|
}
|
|
|
|
int strzcmp16_h_n(const char16_t *s1H, size_t n1, const char16_t *s2N, size_t n2)
|
|
{
|
|
const char16_t* e1 = s1H+n1;
|
|
const char16_t* e2 = s2N+n2;
|
|
|
|
while (s1H < e1 && s2N < e2) {
|
|
const char16_t c2 = ntohs(*s2N);
|
|
const int d = (int)*s1H++ - (int)c2;
|
|
s2N++;
|
|
if (d) {
|
|
return d;
|
|
}
|
|
}
|
|
|
|
return n1 < n2
|
|
? (0 - (int)ntohs(*s2N))
|
|
: (n1 > n2
|
|
? ((int)*s1H - 0)
|
|
: 0);
|
|
}
|
|
|
|
// ---------------------------------------------------------------------------
|
|
|
|
namespace android {
|
|
|
|
static inline size_t
|
|
utf8_char_len(uint8_t ch)
|
|
{
|
|
return ((0xe5000000 >> ((ch >> 3) & 0x1e)) & 3) + 1;
|
|
}
|
|
|
|
#define UTF8_SHIFT_AND_MASK(unicode, byte) (unicode)<<=6; (unicode) |= (0x3f & (byte));
|
|
|
|
static inline uint32_t
|
|
utf8_to_utf32(const uint8_t *src, size_t length)
|
|
{
|
|
uint32_t unicode;
|
|
|
|
switch (length)
|
|
{
|
|
case 1:
|
|
return src[0];
|
|
case 2:
|
|
unicode = src[0] & 0x1f;
|
|
UTF8_SHIFT_AND_MASK(unicode, src[1])
|
|
return unicode;
|
|
case 3:
|
|
unicode = src[0] & 0x0f;
|
|
UTF8_SHIFT_AND_MASK(unicode, src[1])
|
|
UTF8_SHIFT_AND_MASK(unicode, src[2])
|
|
return unicode;
|
|
case 4:
|
|
unicode = src[0] & 0x07;
|
|
UTF8_SHIFT_AND_MASK(unicode, src[1])
|
|
UTF8_SHIFT_AND_MASK(unicode, src[2])
|
|
UTF8_SHIFT_AND_MASK(unicode, src[3])
|
|
return unicode;
|
|
default:
|
|
return 0xffff;
|
|
}
|
|
|
|
//printf("Char at %p: len=%d, utf-16=%p\n", src, length, (void*)result);
|
|
}
|
|
|
|
// ---------------------------------------------------------------------------
|
|
|
|
static SharedBuffer* gEmptyStringBuf = NULL;
|
|
static char16_t* gEmptyString = NULL;
|
|
|
|
static inline char16_t* getEmptyString()
|
|
{
|
|
gEmptyStringBuf->acquire();
|
|
return gEmptyString;
|
|
}
|
|
|
|
void initialize_string16()
|
|
{
|
|
SharedBuffer* buf = SharedBuffer::alloc(sizeof(char16_t));
|
|
char16_t* str = (char16_t*)buf->data();
|
|
*str = 0;
|
|
gEmptyStringBuf = buf;
|
|
gEmptyString = str;
|
|
}
|
|
|
|
void terminate_string16()
|
|
{
|
|
SharedBuffer::bufferFromData(gEmptyString)->release();
|
|
gEmptyStringBuf = NULL;
|
|
gEmptyString = NULL;
|
|
}
|
|
|
|
// ---------------------------------------------------------------------------
|
|
|
|
static char16_t* allocFromUTF8(const char* in, size_t len)
|
|
{
|
|
if (len == 0) return getEmptyString();
|
|
|
|
size_t chars = 0;
|
|
const char* end = in+len;
|
|
const char* p = in;
|
|
|
|
while (p < end) {
|
|
chars++;
|
|
int utf8len = utf8_char_len(*p);
|
|
uint32_t codepoint = utf8_to_utf32((const uint8_t*)p, utf8len);
|
|
if (codepoint > 0xFFFF) chars++; // this will be a surrogate pair in utf16
|
|
p += utf8len;
|
|
}
|
|
|
|
SharedBuffer* buf = SharedBuffer::alloc((chars+1)*sizeof(char16_t));
|
|
if (buf) {
|
|
p = in;
|
|
char16_t* str = (char16_t*)buf->data();
|
|
char16_t* d = str;
|
|
while (p < end) {
|
|
size_t len = utf8_char_len(*p);
|
|
uint32_t codepoint = utf8_to_utf32((const uint8_t*)p, len);
|
|
|
|
// Convert the UTF32 codepoint to one or more UTF16 codepoints
|
|
if (codepoint <= 0xFFFF) {
|
|
// Single UTF16 character
|
|
*d++ = (char16_t) codepoint;
|
|
} else {
|
|
// Multiple UTF16 characters with surrogates
|
|
codepoint = codepoint - 0x10000;
|
|
*d++ = (char16_t) ((codepoint >> 10) + 0xD800);
|
|
*d++ = (char16_t) ((codepoint & 0x3FF) + 0xDC00);
|
|
}
|
|
|
|
p += len;
|
|
}
|
|
*d = 0;
|
|
|
|
//printf("Created UTF-16 string from UTF-8 \"%s\":", in);
|
|
//printHexData(1, str, buf->size(), 16, 1);
|
|
//printf("\n");
|
|
|
|
return str;
|
|
}
|
|
|
|
return getEmptyString();
|
|
}
|
|
|
|
// ---------------------------------------------------------------------------
|
|
|
|
String16::String16()
|
|
: mString(getEmptyString())
|
|
{
|
|
}
|
|
|
|
String16::String16(const String16& o)
|
|
: mString(o.mString)
|
|
{
|
|
SharedBuffer::bufferFromData(mString)->acquire();
|
|
}
|
|
|
|
String16::String16(const String16& o, size_t len, size_t begin)
|
|
: mString(getEmptyString())
|
|
{
|
|
setTo(o, len, begin);
|
|
}
|
|
|
|
String16::String16(const char16_t* o)
|
|
{
|
|
size_t len = strlen16(o);
|
|
SharedBuffer* buf = SharedBuffer::alloc((len+1)*sizeof(char16_t));
|
|
LOG_ASSERT(buf, "Unable to allocate shared buffer");
|
|
if (buf) {
|
|
char16_t* str = (char16_t*)buf->data();
|
|
strcpy16(str, o);
|
|
mString = str;
|
|
return;
|
|
}
|
|
|
|
mString = getEmptyString();
|
|
}
|
|
|
|
String16::String16(const char16_t* o, size_t len)
|
|
{
|
|
SharedBuffer* buf = SharedBuffer::alloc((len+1)*sizeof(char16_t));
|
|
LOG_ASSERT(buf, "Unable to allocate shared buffer");
|
|
if (buf) {
|
|
char16_t* str = (char16_t*)buf->data();
|
|
memcpy(str, o, len*sizeof(char16_t));
|
|
str[len] = 0;
|
|
mString = str;
|
|
return;
|
|
}
|
|
|
|
mString = getEmptyString();
|
|
}
|
|
|
|
String16::String16(const String8& o)
|
|
: mString(allocFromUTF8(o.string(), o.size()))
|
|
{
|
|
}
|
|
|
|
String16::String16(const char* o)
|
|
: mString(allocFromUTF8(o, strlen(o)))
|
|
{
|
|
}
|
|
|
|
String16::String16(const char* o, size_t len)
|
|
: mString(allocFromUTF8(o, len))
|
|
{
|
|
}
|
|
|
|
String16::~String16()
|
|
{
|
|
SharedBuffer::bufferFromData(mString)->release();
|
|
}
|
|
|
|
void String16::setTo(const String16& other)
|
|
{
|
|
SharedBuffer::bufferFromData(other.mString)->acquire();
|
|
SharedBuffer::bufferFromData(mString)->release();
|
|
mString = other.mString;
|
|
}
|
|
|
|
status_t String16::setTo(const String16& other, size_t len, size_t begin)
|
|
{
|
|
const size_t N = other.size();
|
|
if (begin >= N) {
|
|
SharedBuffer::bufferFromData(mString)->release();
|
|
mString = getEmptyString();
|
|
return NO_ERROR;
|
|
}
|
|
if ((begin+len) > N) len = N-begin;
|
|
if (begin == 0 && len == N) {
|
|
setTo(other);
|
|
return NO_ERROR;
|
|
}
|
|
|
|
if (&other == this) {
|
|
LOG_ALWAYS_FATAL("Not implemented");
|
|
}
|
|
|
|
return setTo(other.string()+begin, len);
|
|
}
|
|
|
|
status_t String16::setTo(const char16_t* other)
|
|
{
|
|
return setTo(other, strlen16(other));
|
|
}
|
|
|
|
status_t String16::setTo(const char16_t* other, size_t len)
|
|
{
|
|
SharedBuffer* buf = SharedBuffer::bufferFromData(mString)
|
|
->editResize((len+1)*sizeof(char16_t));
|
|
if (buf) {
|
|
char16_t* str = (char16_t*)buf->data();
|
|
memmove(str, other, len*sizeof(char16_t));
|
|
str[len] = 0;
|
|
mString = str;
|
|
return NO_ERROR;
|
|
}
|
|
return NO_MEMORY;
|
|
}
|
|
|
|
status_t String16::append(const String16& other)
|
|
{
|
|
const size_t myLen = size();
|
|
const size_t otherLen = other.size();
|
|
if (myLen == 0) {
|
|
setTo(other);
|
|
return NO_ERROR;
|
|
} else if (otherLen == 0) {
|
|
return NO_ERROR;
|
|
}
|
|
|
|
SharedBuffer* buf = SharedBuffer::bufferFromData(mString)
|
|
->editResize((myLen+otherLen+1)*sizeof(char16_t));
|
|
if (buf) {
|
|
char16_t* str = (char16_t*)buf->data();
|
|
memcpy(str+myLen, other, (otherLen+1)*sizeof(char16_t));
|
|
mString = str;
|
|
return NO_ERROR;
|
|
}
|
|
return NO_MEMORY;
|
|
}
|
|
|
|
status_t String16::append(const char16_t* chrs, size_t otherLen)
|
|
{
|
|
const size_t myLen = size();
|
|
if (myLen == 0) {
|
|
setTo(chrs, otherLen);
|
|
return NO_ERROR;
|
|
} else if (otherLen == 0) {
|
|
return NO_ERROR;
|
|
}
|
|
|
|
SharedBuffer* buf = SharedBuffer::bufferFromData(mString)
|
|
->editResize((myLen+otherLen+1)*sizeof(char16_t));
|
|
if (buf) {
|
|
char16_t* str = (char16_t*)buf->data();
|
|
memcpy(str+myLen, chrs, otherLen*sizeof(char16_t));
|
|
str[myLen+otherLen] = 0;
|
|
mString = str;
|
|
return NO_ERROR;
|
|
}
|
|
return NO_MEMORY;
|
|
}
|
|
|
|
status_t String16::insert(size_t pos, const char16_t* chrs)
|
|
{
|
|
return insert(pos, chrs, strlen16(chrs));
|
|
}
|
|
|
|
status_t String16::insert(size_t pos, const char16_t* chrs, size_t len)
|
|
{
|
|
const size_t myLen = size();
|
|
if (myLen == 0) {
|
|
return setTo(chrs, len);
|
|
return NO_ERROR;
|
|
} else if (len == 0) {
|
|
return NO_ERROR;
|
|
}
|
|
|
|
if (pos > myLen) pos = myLen;
|
|
|
|
#if 0
|
|
printf("Insert in to %s: pos=%d, len=%d, myLen=%d, chrs=%s\n",
|
|
String8(*this).string(), pos,
|
|
len, myLen, String8(chrs, len).string());
|
|
#endif
|
|
|
|
SharedBuffer* buf = SharedBuffer::bufferFromData(mString)
|
|
->editResize((myLen+len+1)*sizeof(char16_t));
|
|
if (buf) {
|
|
char16_t* str = (char16_t*)buf->data();
|
|
if (pos < myLen) {
|
|
memmove(str+pos+len, str+pos, (myLen-pos)*sizeof(char16_t));
|
|
}
|
|
memcpy(str+pos, chrs, len*sizeof(char16_t));
|
|
str[myLen+len] = 0;
|
|
mString = str;
|
|
#if 0
|
|
printf("Result (%d chrs): %s\n", size(), String8(*this).string());
|
|
#endif
|
|
return NO_ERROR;
|
|
}
|
|
return NO_MEMORY;
|
|
}
|
|
|
|
ssize_t String16::findFirst(char16_t c) const
|
|
{
|
|
const char16_t* str = string();
|
|
const char16_t* p = str;
|
|
const char16_t* e = p + size();
|
|
while (p < e) {
|
|
if (*p == c) {
|
|
return p-str;
|
|
}
|
|
p++;
|
|
}
|
|
return -1;
|
|
}
|
|
|
|
ssize_t String16::findLast(char16_t c) const
|
|
{
|
|
const char16_t* str = string();
|
|
const char16_t* p = str;
|
|
const char16_t* e = p + size();
|
|
while (p < e) {
|
|
e--;
|
|
if (*e == c) {
|
|
return e-str;
|
|
}
|
|
}
|
|
return -1;
|
|
}
|
|
|
|
bool String16::startsWith(const String16& prefix) const
|
|
{
|
|
const size_t ps = prefix.size();
|
|
if (ps > size()) return false;
|
|
return strzcmp16(mString, ps, prefix.string(), ps) == 0;
|
|
}
|
|
|
|
bool String16::startsWith(const char16_t* prefix) const
|
|
{
|
|
const size_t ps = strlen16(prefix);
|
|
if (ps > size()) return false;
|
|
return strncmp16(mString, prefix, ps) == 0;
|
|
}
|
|
|
|
status_t String16::makeLower()
|
|
{
|
|
const size_t N = size();
|
|
const char16_t* str = string();
|
|
char16_t* edit = NULL;
|
|
for (size_t i=0; i<N; i++) {
|
|
const char16_t v = str[i];
|
|
if (v >= 'A' && v <= 'Z') {
|
|
if (!edit) {
|
|
SharedBuffer* buf = SharedBuffer::bufferFromData(mString)->edit();
|
|
if (!buf) {
|
|
return NO_MEMORY;
|
|
}
|
|
edit = (char16_t*)buf->data();
|
|
mString = str = edit;
|
|
}
|
|
edit[i] = tolower((char)v);
|
|
}
|
|
}
|
|
return NO_ERROR;
|
|
}
|
|
|
|
status_t String16::replaceAll(char16_t replaceThis, char16_t withThis)
|
|
{
|
|
const size_t N = size();
|
|
const char16_t* str = string();
|
|
char16_t* edit = NULL;
|
|
for (size_t i=0; i<N; i++) {
|
|
if (str[i] == replaceThis) {
|
|
if (!edit) {
|
|
SharedBuffer* buf = SharedBuffer::bufferFromData(mString)->edit();
|
|
if (!buf) {
|
|
return NO_MEMORY;
|
|
}
|
|
edit = (char16_t*)buf->data();
|
|
mString = str = edit;
|
|
}
|
|
edit[i] = withThis;
|
|
}
|
|
}
|
|
return NO_ERROR;
|
|
}
|
|
|
|
status_t String16::remove(size_t len, size_t begin)
|
|
{
|
|
const size_t N = size();
|
|
if (begin >= N) {
|
|
SharedBuffer::bufferFromData(mString)->release();
|
|
mString = getEmptyString();
|
|
return NO_ERROR;
|
|
}
|
|
if ((begin+len) > N) len = N-begin;
|
|
if (begin == 0 && len == N) {
|
|
return NO_ERROR;
|
|
}
|
|
|
|
if (begin > 0) {
|
|
SharedBuffer* buf = SharedBuffer::bufferFromData(mString)
|
|
->editResize((N+1)*sizeof(char16_t));
|
|
if (!buf) {
|
|
return NO_MEMORY;
|
|
}
|
|
char16_t* str = (char16_t*)buf->data();
|
|
memmove(str, str+begin, (N-begin+1)*sizeof(char16_t));
|
|
mString = str;
|
|
}
|
|
SharedBuffer* buf = SharedBuffer::bufferFromData(mString)
|
|
->editResize((len+1)*sizeof(char16_t));
|
|
if (buf) {
|
|
char16_t* str = (char16_t*)buf->data();
|
|
str[len] = 0;
|
|
mString = str;
|
|
return NO_ERROR;
|
|
}
|
|
return NO_MEMORY;
|
|
}
|
|
|
|
TextOutput& operator<<(TextOutput& to, const String16& val)
|
|
{
|
|
to << String8(val).string();
|
|
return to;
|
|
}
|
|
|
|
}; // namespace android
|