|  | /* | 
|  | * Copyright (C) 2005 The Android Open Source Project | 
|  | * | 
|  | * Licensed under the Apache License, Version 2.0 (the "License"); | 
|  | * you may not use this file except in compliance with the License. | 
|  | * You may obtain a copy of the License at | 
|  | * | 
|  | *      http://www.apache.org/licenses/LICENSE-2.0 | 
|  | * | 
|  | * Unless required by applicable law or agreed to in writing, software | 
|  | * distributed under the License is distributed on an "AS IS" BASIS, | 
|  | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | 
|  | * See the License for the specific language governing permissions and | 
|  | * limitations under the License. | 
|  | */ | 
|  |  | 
|  | #include <utils/String16.h> | 
|  |  | 
|  | #include <utils/Debug.h> | 
|  | #include <utils/Log.h> | 
|  | #include <utils/String8.h> | 
|  | #include <utils/TextOutput.h> | 
|  | #include <utils/threads.h> | 
|  |  | 
|  | #include <private/utils/Static.h> | 
|  |  | 
// Byte-order helpers. On the HAVE_WINSOCK path <netinet/in.h> is not included,
// so any pre-existing ntohl/htonl/ntohs/htons macros are dropped and local
// replacements are defined; otherwise the system header supplies them.
#ifdef HAVE_WINSOCK
# undef  ntohl
# undef  htonl
# undef  ntohs
# undef  htons

# ifdef HAVE_LITTLE_ENDIAN
// Little-endian host: converting to/from network order is a byte swap.
// These macros evaluate their argument more than once, so the argument
// must not have side effects.
#  define ntohl(x)    ( ((x) << 24) | (((x) >> 24) & 255) | (((x) << 8) & 0xff0000) | (((x) >> 8) & 0xff00) )
#  define htonl(x)    ntohl(x)
#  define ntohs(x)    ( (((x) << 8) & 0xff00) | (((x) >> 8) & 255) )
#  define htons(x)    ntohs(x)
# else
// Otherwise the value is passed through unchanged.
#  define ntohl(x)    (x)
#  define htonl(x)    (x)
#  define ntohs(x)    (x)
#  define htons(x)    (x)
# endif
#else
# include <netinet/in.h>
#endif
|  |  | 
|  | #include <memory.h> | 
|  | #include <stdio.h> | 
|  | #include <ctype.h> | 
|  |  | 
|  | // --------------------------------------------------------------------------- | 
|  |  | 
/*
 * Compares two NUL-terminated UTF-16 strings one code unit at a time.
 *
 * Returns 0 when both strings are identical; otherwise returns the
 * difference (s1 unit minus s2 unit) at the first position where they differ.
 */
int strcmp16(const char16_t *s1, const char16_t *s2)
{
    for (;; s1++, s2++) {
        const int diff = (int)*s1 - (int)*s2;
        // Stop on the first mismatch, or once the terminator of s1 was compared.
        if (diff != 0 || *s1 == 0) {
            return diff;
        }
    }
}
|  |  | 
/*
 * Compares at most n code units of two NUL-terminated UTF-16 strings.
 *
 * Returns 0 when the compared prefixes are identical (or n is 0); otherwise
 * returns the difference (s1 unit minus s2 unit) at the first mismatch.
 */
int strncmp16(const char16_t *s1, const char16_t *s2, size_t n)
{
    int diff = 0;

    for (size_t i = 0; i < n; i++) {
        diff = (int)s1[i] - (int)s2[i];
        // A mismatch or the end of s1 finishes the comparison early.
        if (diff != 0 || s1[i] == 0) {
            break;
        }
    }

    return diff;
}
|  |  | 
/*
 * Copies the NUL-terminated UTF-16 string src, terminator included, into dst.
 * The caller must provide a destination large enough for the whole string.
 *
 * Returns dst.
 */
char16_t *strcpy16(char16_t *dst, const char16_t *src)
{
    size_t i = 0;

    // The assignment copies the unit; the loop ends right after the NUL is copied.
    while ((dst[i] = src[i]) != 0) {
        i++;
    }

    return dst;
}
|  |  | 
/*
 * Returns the number of UTF-16 code units that precede the terminating NUL in s.
 */
size_t strlen16(const char16_t *s)
{
    size_t count = 0;
    while (s[count] != 0) {
        count++;
    }
    return count;
}
|  |  | 
|  |  | 
/*
 * Copies at most n UTF-16 code units from src to dst, stopping after a NUL
 * has been copied.
 *
 * A terminating NUL is always written directly after the last copied unit,
 * so dst must have room for n + 1 code units.
 *
 * Returns dst.
 */
char16_t *strncpy16(char16_t *dst, const char16_t *src, size_t n)
{
    char16_t *q = dst;
    const char16_t *p = src;

    while (n) {
        n--;
        // Keep the full 16-bit unit: an 8-bit temporary would truncate
        // non-ASCII units and mistake units with a zero low byte for NUL.
        const char16_t ch = *p++;
        *q++ = ch;
        if ( !ch )
            break;
    }

    *q = 0;

    return dst;
}
|  |  | 
/*
 * Returns the length of s in UTF-16 code units, looking at no more than
 * maxlen units. If no NUL is found within maxlen units, maxlen is returned.
 */
size_t strnlen16(const char16_t *s, size_t maxlen)
{
    size_t count = 0;

    /* Important: the bound is tested before s[count] is read, because the
       memory past the maximum may not be readable. */
    while (count < maxlen && s[count] != 0) {
        count++;
    }
    return count;
}
|  |  | 
/*
 * Compares two UTF-16 buffers given with explicit lengths n1 and n2.
 *
 * The first min(n1, n2) units are compared; the first mismatch yields the
 * difference (s1 unit minus s2 unit). If that common prefix is identical:
 *   - n1 < n2: returns the negated value of the next unit of s2,
 *   - n1 > n2: returns the value of the next unit of s1,
 *   - n1 == n2: returns 0.
 */
int strzcmp16(const char16_t *s1, size_t n1, const char16_t *s2, size_t n2)
{
    const size_t common = (n1 < n2) ? n1 : n2;

    for (size_t i = 0; i < common; i++) {
        const int diff = (int)s1[i] - (int)s2[i];
        if (diff != 0) {
            return diff;
        }
    }

    if (n1 < n2) {
        return 0 - (int)s2[common];
    }
    if (n1 > n2) {
        return (int)s1[common] - 0;
    }
    return 0;
}
|  |  | 
/*
 * Same comparison as strzcmp16(), except that every unit read from s2N is
 * passed through ntohs() before being compared; units of s1H are used as-is.
 *
 * Returns the difference at the first mismatch within the common prefix;
 * if the prefix matches, the result depends on the lengths: negated next
 * unit of s2N when n1 < n2, next unit of s1H when n1 > n2, and 0 otherwise.
 */
int strzcmp16_h_n(const char16_t *s1H, size_t n1, const char16_t *s2N, size_t n2)
{
    const size_t common = (n1 < n2) ? n1 : n2;

    for (size_t i = 0; i < common; i++) {
        const char16_t converted = ntohs(s2N[i]);
        const int diff = (int)s1H[i] - (int)converted;
        if (diff != 0) {
            return diff;
        }
    }

    if (n1 < n2) {
        return 0 - (int)ntohs(s2N[common]);
    }
    if (n1 > n2) {
        return (int)s1H[common] - 0;
    }
    return 0;
}
|  |  | 
|  | // --------------------------------------------------------------------------- | 
|  |  | 
|  | namespace android { | 
|  |  | 
// Returns the UTF-8 sequence length implied by the lead byte ch.
//
// The constant below is a packed table of 2-bit entries indexed by the high
// nibble of ch; each entry holds (length - 1). High nibbles 0x0-0xB give 1,
// 0xC-0xD give 2, 0xE gives 3 and 0xF gives 4.
static inline size_t
utf8_char_len(uint8_t ch)
{
    const uint32_t kLengthTable = 0xe5000000;
    const unsigned int bitOffset = (unsigned int)(ch >> 4) << 1;  // two bits per nibble value
    const uint32_t extraBytes = (kLengthTable >> bitOffset) & 3;
    return extraBytes + 1;
}
|  |  | 
// Appends the low six payload bits of a UTF-8 continuation byte to `unicode`.
// Expands to two statements, so it must only be used where a statement list is valid.
#define UTF8_SHIFT_AND_MASK(unicode, byte)  (unicode)<<=6; (unicode) |= (0x3f & (byte));

// Decodes one UTF-8 sequence of `length` bytes starting at src.
//
// length 1 returns src[0] unchanged; lengths 2-4 combine the payload bits of
// the lead byte with six bits from each following byte. Any other length
// returns 0xffff. The bytes are not validated.
static inline uint32_t
utf8_to_utf32(const uint8_t *src, size_t length)
{
    // Payload masks for the lead byte of 2-, 3- and 4-byte sequences.
    static const uint8_t kLeadMask[3] = { 0x1f, 0x0f, 0x07 };

    if (length == 1) {
        return src[0];
    }
    if (length < 2 || length > 4) {
        return 0xffff;
    }

    uint32_t unicode = src[0] & kLeadMask[length - 2];
    for (size_t i = 1; i < length; i++) {
        UTF8_SHIFT_AND_MASK(unicode, src[i])
    }
    return unicode;
}
|  |  | 
|  | // --------------------------------------------------------------------------- | 
|  |  | 
|  | static SharedBuffer* gEmptyStringBuf = NULL; | 
|  | static char16_t* gEmptyString = NULL; | 
|  |  | 
|  | static inline char16_t* getEmptyString() | 
|  | { | 
|  | gEmptyStringBuf->acquire(); | 
|  | return gEmptyString; | 
|  | } | 
|  |  | 
|  | void initialize_string16() | 
|  | { | 
|  | SharedBuffer* buf = SharedBuffer::alloc(sizeof(char16_t)); | 
|  | char16_t* str = (char16_t*)buf->data(); | 
|  | *str = 0; | 
|  | gEmptyStringBuf = buf; | 
|  | gEmptyString = str; | 
|  | } | 
|  |  | 
|  | void terminate_string16() | 
|  | { | 
|  | SharedBuffer::bufferFromData(gEmptyString)->release(); | 
|  | gEmptyStringBuf = NULL; | 
|  | gEmptyString = NULL; | 
|  | } | 
|  |  | 
|  | // --------------------------------------------------------------------------- | 
|  |  | 
|  | // Note: not dealing with generating surrogate pairs. | 
|  | static char16_t* allocFromUTF8(const char* in, size_t len) | 
|  | { | 
|  | if (len == 0) return getEmptyString(); | 
|  |  | 
|  | size_t chars = 0; | 
|  | const char* end = in+len; | 
|  | const char* p = in; | 
|  |  | 
|  | while (p < end) { | 
|  | chars++; | 
|  | p += utf8_char_len(*p); | 
|  | } | 
|  |  | 
|  | SharedBuffer* buf = SharedBuffer::alloc((chars+1)*sizeof(char16_t)); | 
|  | if (buf) { | 
|  | p = in; | 
|  | char16_t* str = (char16_t*)buf->data(); | 
|  | char16_t* d = str; | 
|  | while (p < end) { | 
|  | size_t len = utf8_char_len(*p); | 
|  | *d++ = (char16_t)utf8_to_utf32((const uint8_t*)p, len); | 
|  | p += len; | 
|  | } | 
|  | *d = 0; | 
|  |  | 
|  | //printf("Created UTF-16 string from UTF-8 \"%s\":", in); | 
|  | //printHexData(1, str, buf->size(), 16, 1); | 
|  | //printf("\n"); | 
|  |  | 
|  | return str; | 
|  | } | 
|  |  | 
|  | return getEmptyString(); | 
|  | } | 
|  |  | 
|  | // --------------------------------------------------------------------------- | 
|  |  | 
|  | String16::String16() | 
|  | : mString(getEmptyString()) | 
|  | { | 
|  | } | 
|  |  | 
|  | String16::String16(const String16& o) | 
|  | : mString(o.mString) | 
|  | { | 
|  | SharedBuffer::bufferFromData(mString)->acquire(); | 
|  | } | 
|  |  | 
|  | String16::String16(const String16& o, size_t len, size_t begin) | 
|  | : mString(getEmptyString()) | 
|  | { | 
|  | setTo(o, len, begin); | 
|  | } | 
|  |  | 
|  | String16::String16(const char16_t* o) | 
|  | { | 
|  | size_t len = strlen16(o); | 
|  | SharedBuffer* buf = SharedBuffer::alloc((len+1)*sizeof(char16_t)); | 
|  | LOG_ASSERT(buf, "Unable to allocate shared buffer"); | 
|  | if (buf) { | 
|  | char16_t* str = (char16_t*)buf->data(); | 
|  | strcpy16(str, o); | 
|  | mString = str; | 
|  | return; | 
|  | } | 
|  |  | 
|  | mString = getEmptyString(); | 
|  | } | 
|  |  | 
|  | String16::String16(const char16_t* o, size_t len) | 
|  | { | 
|  | SharedBuffer* buf = SharedBuffer::alloc((len+1)*sizeof(char16_t)); | 
|  | LOG_ASSERT(buf, "Unable to allocate shared buffer"); | 
|  | if (buf) { | 
|  | char16_t* str = (char16_t*)buf->data(); | 
|  | memcpy(str, o, len*sizeof(char16_t)); | 
|  | str[len] = 0; | 
|  | mString = str; | 
|  | return; | 
|  | } | 
|  |  | 
|  | mString = getEmptyString(); | 
|  | } | 
|  |  | 
|  | String16::String16(const String8& o) | 
|  | : mString(allocFromUTF8(o.string(), o.size())) | 
|  | { | 
|  | } | 
|  |  | 
|  | String16::String16(const char* o) | 
|  | : mString(allocFromUTF8(o, strlen(o))) | 
|  | { | 
|  | } | 
|  |  | 
|  | String16::String16(const char* o, size_t len) | 
|  | : mString(allocFromUTF8(o, len)) | 
|  | { | 
|  | } | 
|  |  | 
|  | String16::~String16() | 
|  | { | 
|  | SharedBuffer::bufferFromData(mString)->release(); | 
|  | } | 
|  |  | 
|  | void String16::setTo(const String16& other) | 
|  | { | 
|  | SharedBuffer::bufferFromData(other.mString)->acquire(); | 
|  | SharedBuffer::bufferFromData(mString)->release(); | 
|  | mString = other.mString; | 
|  | } | 
|  |  | 
|  | status_t String16::setTo(const String16& other, size_t len, size_t begin) | 
|  | { | 
|  | const size_t N = other.size(); | 
|  | if (begin >= N) { | 
|  | SharedBuffer::bufferFromData(mString)->release(); | 
|  | mString = getEmptyString(); | 
|  | return NO_ERROR; | 
|  | } | 
|  | if ((begin+len) > N) len = N-begin; | 
|  | if (begin == 0 && len == N) { | 
|  | setTo(other); | 
|  | return NO_ERROR; | 
|  | } | 
|  |  | 
|  | if (&other == this) { | 
|  | LOG_ALWAYS_FATAL("Not implemented"); | 
|  | } | 
|  |  | 
|  | return setTo(other.string()+begin, len); | 
|  | } | 
|  |  | 
|  | status_t String16::setTo(const char16_t* other) | 
|  | { | 
|  | return setTo(other, strlen16(other)); | 
|  | } | 
|  |  | 
|  | status_t String16::setTo(const char16_t* other, size_t len) | 
|  | { | 
|  | SharedBuffer* buf = SharedBuffer::bufferFromData(mString) | 
|  | ->editResize((len+1)*sizeof(char16_t)); | 
|  | if (buf) { | 
|  | char16_t* str = (char16_t*)buf->data(); | 
|  | memcpy(str, other, len*sizeof(char16_t)); | 
|  | str[len] = 0; | 
|  | mString = str; | 
|  | return NO_ERROR; | 
|  | } | 
|  | return NO_MEMORY; | 
|  | } | 
|  |  | 
|  | status_t String16::append(const String16& other) | 
|  | { | 
|  | const size_t myLen = size(); | 
|  | const size_t otherLen = other.size(); | 
|  | if (myLen == 0) { | 
|  | setTo(other); | 
|  | return NO_ERROR; | 
|  | } else if (otherLen == 0) { | 
|  | return NO_ERROR; | 
|  | } | 
|  |  | 
|  | SharedBuffer* buf = SharedBuffer::bufferFromData(mString) | 
|  | ->editResize((myLen+otherLen+1)*sizeof(char16_t)); | 
|  | if (buf) { | 
|  | char16_t* str = (char16_t*)buf->data(); | 
|  | memcpy(str+myLen, other, (otherLen+1)*sizeof(char16_t)); | 
|  | mString = str; | 
|  | return NO_ERROR; | 
|  | } | 
|  | return NO_MEMORY; | 
|  | } | 
|  |  | 
|  | status_t String16::append(const char16_t* chrs, size_t otherLen) | 
|  | { | 
|  | const size_t myLen = size(); | 
|  | if (myLen == 0) { | 
|  | setTo(chrs, otherLen); | 
|  | return NO_ERROR; | 
|  | } else if (otherLen == 0) { | 
|  | return NO_ERROR; | 
|  | } | 
|  |  | 
|  | SharedBuffer* buf = SharedBuffer::bufferFromData(mString) | 
|  | ->editResize((myLen+otherLen+1)*sizeof(char16_t)); | 
|  | if (buf) { | 
|  | char16_t* str = (char16_t*)buf->data(); | 
|  | memcpy(str+myLen, chrs, otherLen*sizeof(char16_t)); | 
|  | str[myLen+otherLen] = 0; | 
|  | mString = str; | 
|  | return NO_ERROR; | 
|  | } | 
|  | return NO_MEMORY; | 
|  | } | 
|  |  | 
|  | status_t String16::insert(size_t pos, const char16_t* chrs) | 
|  | { | 
|  | return insert(pos, chrs, strlen16(chrs)); | 
|  | } | 
|  |  | 
|  | status_t String16::insert(size_t pos, const char16_t* chrs, size_t len) | 
|  | { | 
|  | const size_t myLen = size(); | 
|  | if (myLen == 0) { | 
|  | return setTo(chrs, len); | 
|  | return NO_ERROR; | 
|  | } else if (len == 0) { | 
|  | return NO_ERROR; | 
|  | } | 
|  |  | 
|  | if (pos > myLen) pos = myLen; | 
|  |  | 
|  | #if 0 | 
|  | printf("Insert in to %s: pos=%d, len=%d, myLen=%d, chrs=%s\n", | 
|  | String8(*this).string(), pos, | 
|  | len, myLen, String8(chrs, len).string()); | 
|  | #endif | 
|  |  | 
|  | SharedBuffer* buf = SharedBuffer::bufferFromData(mString) | 
|  | ->editResize((myLen+len+1)*sizeof(char16_t)); | 
|  | if (buf) { | 
|  | char16_t* str = (char16_t*)buf->data(); | 
|  | if (pos < myLen) { | 
|  | memmove(str+pos+len, str+pos, (myLen-pos)*sizeof(char16_t)); | 
|  | } | 
|  | memcpy(str+pos, chrs, len*sizeof(char16_t)); | 
|  | str[myLen+len] = 0; | 
|  | mString = str; | 
|  | #if 0 | 
|  | printf("Result (%d chrs): %s\n", size(), String8(*this).string()); | 
|  | #endif | 
|  | return NO_ERROR; | 
|  | } | 
|  | return NO_MEMORY; | 
|  | } | 
|  |  | 
|  | ssize_t String16::findFirst(char16_t c) const | 
|  | { | 
|  | const char16_t* str = string(); | 
|  | const char16_t* p = str; | 
|  | const char16_t* e = p + size(); | 
|  | while (p < e) { | 
|  | if (*p == c) { | 
|  | return p-str; | 
|  | } | 
|  | p++; | 
|  | } | 
|  | return -1; | 
|  | } | 
|  |  | 
|  | ssize_t String16::findLast(char16_t c) const | 
|  | { | 
|  | const char16_t* str = string(); | 
|  | const char16_t* p = str; | 
|  | const char16_t* e = p + size(); | 
|  | while (p < e) { | 
|  | e--; | 
|  | if (*e == c) { | 
|  | return e-str; | 
|  | } | 
|  | } | 
|  | return -1; | 
|  | } | 
|  |  | 
|  | bool String16::startsWith(const String16& prefix) const | 
|  | { | 
|  | const size_t ps = prefix.size(); | 
|  | if (ps > size()) return false; | 
|  | return strzcmp16(mString, ps, prefix.string(), ps) == 0; | 
|  | } | 
|  |  | 
|  | bool String16::startsWith(const char16_t* prefix) const | 
|  | { | 
|  | const size_t ps = strlen16(prefix); | 
|  | if (ps > size()) return false; | 
|  | return strncmp16(mString, prefix, ps) == 0; | 
|  | } | 
|  |  | 
|  | status_t String16::makeLower() | 
|  | { | 
|  | const size_t N = size(); | 
|  | const char16_t* str = string(); | 
|  | char16_t* edit = NULL; | 
|  | for (size_t i=0; i<N; i++) { | 
|  | const char16_t v = str[i]; | 
|  | if (v >= 'A' && v <= 'Z') { | 
|  | if (!edit) { | 
|  | SharedBuffer* buf = SharedBuffer::bufferFromData(mString)->edit(); | 
|  | if (!buf) { | 
|  | return NO_MEMORY; | 
|  | } | 
|  | edit = (char16_t*)buf->data(); | 
|  | mString = str = edit; | 
|  | } | 
|  | edit[i] = tolower((char)v); | 
|  | } | 
|  | } | 
|  | return NO_ERROR; | 
|  | } | 
|  |  | 
|  | status_t String16::replaceAll(char16_t replaceThis, char16_t withThis) | 
|  | { | 
|  | const size_t N = size(); | 
|  | const char16_t* str = string(); | 
|  | char16_t* edit = NULL; | 
|  | for (size_t i=0; i<N; i++) { | 
|  | if (str[i] == replaceThis) { | 
|  | if (!edit) { | 
|  | SharedBuffer* buf = SharedBuffer::bufferFromData(mString)->edit(); | 
|  | if (!buf) { | 
|  | return NO_MEMORY; | 
|  | } | 
|  | edit = (char16_t*)buf->data(); | 
|  | mString = str = edit; | 
|  | } | 
|  | edit[i] = withThis; | 
|  | } | 
|  | } | 
|  | return NO_ERROR; | 
|  | } | 
|  |  | 
|  | status_t String16::remove(size_t len, size_t begin) | 
|  | { | 
|  | const size_t N = size(); | 
|  | if (begin >= N) { | 
|  | SharedBuffer::bufferFromData(mString)->release(); | 
|  | mString = getEmptyString(); | 
|  | return NO_ERROR; | 
|  | } | 
|  | if ((begin+len) > N) len = N-begin; | 
|  | if (begin == 0 && len == N) { | 
|  | return NO_ERROR; | 
|  | } | 
|  |  | 
|  | if (begin > 0) { | 
|  | SharedBuffer* buf = SharedBuffer::bufferFromData(mString) | 
|  | ->editResize((N+1)*sizeof(char16_t)); | 
|  | if (!buf) { | 
|  | return NO_MEMORY; | 
|  | } | 
|  | char16_t* str = (char16_t*)buf->data(); | 
|  | memmove(str, str+begin, (N-begin+1)*sizeof(char16_t)); | 
|  | mString = str; | 
|  | } | 
|  | SharedBuffer* buf = SharedBuffer::bufferFromData(mString) | 
|  | ->editResize((len+1)*sizeof(char16_t)); | 
|  | if (buf) { | 
|  | char16_t* str = (char16_t*)buf->data(); | 
|  | str[len] = 0; | 
|  | mString = str; | 
|  | return NO_ERROR; | 
|  | } | 
|  | return NO_MEMORY; | 
|  | } | 
|  |  | 
|  | TextOutput& operator<<(TextOutput& to, const String16& val) | 
|  | { | 
|  | to << String8(val).string(); | 
|  | return to; | 
|  | } | 
|  |  | 
|  | }; // namespace android |