2020-08-11 11:10:23 +02:00
|
|
|
// © 2016 and later: Unicode, Inc. and others.
|
|
|
|
// License & terms of use: http://www.unicode.org/copyright.html
|
|
|
|
/*
|
|
|
|
*******************************************************************************
|
|
|
|
* Copyright (C) 2010-2015, International Business Machines
|
|
|
|
* Corporation and others. All Rights Reserved.
|
|
|
|
*******************************************************************************
|
|
|
|
* file name: charstr.cpp
|
|
|
|
* encoding: UTF-8
|
|
|
|
* tab size: 8 (not used)
|
|
|
|
* indentation:4
|
|
|
|
*
|
|
|
|
* created on: 2010may19
|
|
|
|
* created by: Markus W. Scherer
|
|
|
|
*/
|
|
|
|
|
2021-04-22 14:08:59 +02:00
|
|
|
#include <cstdlib>
|
|
|
|
|
2020-08-11 11:10:23 +02:00
|
|
|
#include "unicode/utypes.h"
|
|
|
|
#include "unicode/putil.h"
|
|
|
|
#include "charstr.h"
|
|
|
|
#include "cmemory.h"
|
|
|
|
#include "cstring.h"
|
|
|
|
#include "uinvchar.h"
|
|
|
|
#include "ustr_imp.h"
|
|
|
|
|
|
|
|
U_NAMESPACE_BEGIN
|
|
|
|
|
2023-05-23 02:05:01 +02:00
|
|
|
CharString::CharString(CharString&& src) noexcept
|
2020-08-11 11:10:23 +02:00
|
|
|
: buffer(std::move(src.buffer)), len(src.len) {
|
|
|
|
src.len = 0; // not strictly necessary because we make no guarantees on the source string
|
|
|
|
}
|
|
|
|
|
2023-05-23 02:05:01 +02:00
|
|
|
CharString& CharString::operator=(CharString&& src) noexcept {
|
2020-08-11 11:10:23 +02:00
|
|
|
buffer = std::move(src.buffer);
|
|
|
|
len = src.len;
|
|
|
|
src.len = 0; // not strictly necessary because we make no guarantees on the source string
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
char *CharString::cloneData(UErrorCode &errorCode) const {
|
|
|
|
if (U_FAILURE(errorCode)) { return nullptr; }
|
|
|
|
char *p = static_cast<char *>(uprv_malloc(len + 1));
|
|
|
|
if (p == nullptr) {
|
|
|
|
errorCode = U_MEMORY_ALLOCATION_ERROR;
|
|
|
|
return nullptr;
|
|
|
|
}
|
|
|
|
uprv_memcpy(p, buffer.getAlias(), len + 1);
|
|
|
|
return p;
|
|
|
|
}
|
|
|
|
|
|
|
|
int32_t CharString::extract(char *dest, int32_t capacity, UErrorCode &errorCode) const {
|
|
|
|
if (U_FAILURE(errorCode)) { return len; }
|
|
|
|
if (capacity < 0 || (capacity > 0 && dest == nullptr)) {
|
|
|
|
errorCode = U_ILLEGAL_ARGUMENT_ERROR;
|
|
|
|
return len;
|
|
|
|
}
|
|
|
|
const char *src = buffer.getAlias();
|
|
|
|
if (0 < len && len <= capacity && src != dest) {
|
|
|
|
uprv_memcpy(dest, src, len);
|
|
|
|
}
|
|
|
|
return u_terminateChars(dest, capacity, len, &errorCode);
|
|
|
|
}
|
|
|
|
|
|
|
|
CharString &CharString::copyFrom(const CharString &s, UErrorCode &errorCode) {
|
|
|
|
if(U_SUCCESS(errorCode) && this!=&s && ensureCapacity(s.len+1, 0, errorCode)) {
|
|
|
|
len=s.len;
|
|
|
|
uprv_memcpy(buffer.getAlias(), s.buffer.getAlias(), len+1);
|
|
|
|
}
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
int32_t CharString::lastIndexOf(char c) const {
|
|
|
|
for(int32_t i=len; i>0;) {
|
|
|
|
if(buffer[--i]==c) {
|
|
|
|
return i;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool CharString::contains(StringPiece s) const {
|
|
|
|
if (s.empty()) { return false; }
|
|
|
|
const char *p = buffer.getAlias();
|
|
|
|
int32_t lastStart = len - s.length();
|
|
|
|
for (int32_t i = 0; i <= lastStart; ++i) {
|
|
|
|
if (uprv_memcmp(p + i, s.data(), s.length()) == 0) {
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
CharString &CharString::truncate(int32_t newLength) {
|
|
|
|
if(newLength<0) {
|
|
|
|
newLength=0;
|
|
|
|
}
|
|
|
|
if(newLength<len) {
|
|
|
|
buffer[len=newLength]=0;
|
|
|
|
}
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
CharString &CharString::append(char c, UErrorCode &errorCode) {
|
|
|
|
if(ensureCapacity(len+2, 0, errorCode)) {
|
|
|
|
buffer[len++]=c;
|
|
|
|
buffer[len]=0;
|
|
|
|
}
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
CharString &CharString::append(const char *s, int32_t sLength, UErrorCode &errorCode) {
|
|
|
|
if(U_FAILURE(errorCode)) {
|
|
|
|
return *this;
|
|
|
|
}
|
2023-05-23 02:05:01 +02:00
|
|
|
if(sLength<-1 || (s==nullptr && sLength!=0)) {
|
2020-08-11 11:10:23 +02:00
|
|
|
errorCode=U_ILLEGAL_ARGUMENT_ERROR;
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
if(sLength<0) {
|
|
|
|
sLength= static_cast<int32_t>(uprv_strlen(s));
|
|
|
|
}
|
|
|
|
if(sLength>0) {
|
|
|
|
if(s==(buffer.getAlias()+len)) {
|
|
|
|
// The caller wrote into the getAppendBuffer().
|
|
|
|
if(sLength>=(buffer.getCapacity()-len)) {
|
|
|
|
// The caller wrote too much.
|
|
|
|
errorCode=U_INTERNAL_PROGRAM_ERROR;
|
|
|
|
} else {
|
|
|
|
buffer[len+=sLength]=0;
|
|
|
|
}
|
|
|
|
} else if(buffer.getAlias()<=s && s<(buffer.getAlias()+len) &&
|
|
|
|
sLength>=(buffer.getCapacity()-len)
|
|
|
|
) {
|
|
|
|
// (Part of) this string is appended to itself which requires reallocation,
|
|
|
|
// so we have to make a copy of the substring and append that.
|
|
|
|
return append(CharString(s, sLength, errorCode), errorCode);
|
|
|
|
} else if(ensureCapacity(len+sLength+1, 0, errorCode)) {
|
|
|
|
uprv_memcpy(buffer.getAlias()+len, s, sLength);
|
|
|
|
buffer[len+=sLength]=0;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
2021-04-22 14:08:59 +02:00
|
|
|
CharString &CharString::appendNumber(int32_t number, UErrorCode &status) {
|
|
|
|
if (number < 0) {
|
|
|
|
this->append('-', status);
|
|
|
|
if (U_FAILURE(status)) {
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (number == 0) {
|
|
|
|
this->append('0', status);
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
int32_t numLen = 0;
|
|
|
|
while (number != 0) {
|
|
|
|
int32_t residue = number % 10;
|
|
|
|
number /= 10;
|
|
|
|
this->append(std::abs(residue) + '0', status);
|
|
|
|
numLen++;
|
|
|
|
if (U_FAILURE(status)) {
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
int32_t start = this->length() - numLen, end = this->length() - 1;
|
|
|
|
while(start < end) {
|
|
|
|
std::swap(this->data()[start++], this->data()[end--]);
|
|
|
|
}
|
|
|
|
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
2020-08-11 11:10:23 +02:00
|
|
|
char *CharString::getAppendBuffer(int32_t minCapacity,
|
|
|
|
int32_t desiredCapacityHint,
|
|
|
|
int32_t &resultCapacity,
|
|
|
|
UErrorCode &errorCode) {
|
|
|
|
if(U_FAILURE(errorCode)) {
|
|
|
|
resultCapacity=0;
|
2023-05-23 02:05:01 +02:00
|
|
|
return nullptr;
|
2020-08-11 11:10:23 +02:00
|
|
|
}
|
|
|
|
int32_t appendCapacity=buffer.getCapacity()-len-1; // -1 for NUL
|
|
|
|
if(appendCapacity>=minCapacity) {
|
|
|
|
resultCapacity=appendCapacity;
|
|
|
|
return buffer.getAlias()+len;
|
|
|
|
}
|
|
|
|
if(ensureCapacity(len+minCapacity+1, len+desiredCapacityHint+1, errorCode)) {
|
|
|
|
resultCapacity=buffer.getCapacity()-len-1;
|
|
|
|
return buffer.getAlias()+len;
|
|
|
|
}
|
|
|
|
resultCapacity=0;
|
2023-05-23 02:05:01 +02:00
|
|
|
return nullptr;
|
2020-08-11 11:10:23 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
CharString &CharString::appendInvariantChars(const UnicodeString &s, UErrorCode &errorCode) {
|
|
|
|
return appendInvariantChars(s.getBuffer(), s.length(), errorCode);
|
|
|
|
}
|
|
|
|
|
2023-05-23 02:05:01 +02:00
|
|
|
CharString &CharString::appendInvariantChars(const char16_t* uchars, int32_t ucharsLen, UErrorCode &errorCode) {
|
2020-08-11 11:10:23 +02:00
|
|
|
if(U_FAILURE(errorCode)) {
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
if (!uprv_isInvariantUString(uchars, ucharsLen)) {
|
|
|
|
errorCode = U_INVARIANT_CONVERSION_ERROR;
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
if(ensureCapacity(len+ucharsLen+1, 0, errorCode)) {
|
|
|
|
u_UCharsToChars(uchars, buffer.getAlias()+len, ucharsLen);
|
|
|
|
len += ucharsLen;
|
|
|
|
buffer[len] = 0;
|
|
|
|
}
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
UBool CharString::ensureCapacity(int32_t capacity,
|
|
|
|
int32_t desiredCapacityHint,
|
|
|
|
UErrorCode &errorCode) {
|
|
|
|
if(U_FAILURE(errorCode)) {
|
2022-10-28 08:11:55 +02:00
|
|
|
return false;
|
2020-08-11 11:10:23 +02:00
|
|
|
}
|
|
|
|
if(capacity>buffer.getCapacity()) {
|
|
|
|
if(desiredCapacityHint==0) {
|
|
|
|
desiredCapacityHint=capacity+buffer.getCapacity();
|
|
|
|
}
|
2023-05-23 02:05:01 +02:00
|
|
|
if( (desiredCapacityHint<=capacity || buffer.resize(desiredCapacityHint, len+1)==nullptr) &&
|
|
|
|
buffer.resize(capacity, len+1)==nullptr
|
2020-08-11 11:10:23 +02:00
|
|
|
) {
|
|
|
|
errorCode=U_MEMORY_ALLOCATION_ERROR;
|
2022-10-28 08:11:55 +02:00
|
|
|
return false;
|
2020-08-11 11:10:23 +02:00
|
|
|
}
|
|
|
|
}
|
2022-10-28 08:11:55 +02:00
|
|
|
return true;
|
2020-08-11 11:10:23 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
CharString &CharString::appendPathPart(StringPiece s, UErrorCode &errorCode) {
|
|
|
|
if(U_FAILURE(errorCode)) {
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
if(s.length()==0) {
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
char c;
|
|
|
|
if(len>0 && (c=buffer[len-1])!=U_FILE_SEP_CHAR && c!=U_FILE_ALT_SEP_CHAR) {
|
|
|
|
append(getDirSepChar(), errorCode);
|
|
|
|
}
|
|
|
|
append(s, errorCode);
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
CharString &CharString::ensureEndsWithFileSeparator(UErrorCode &errorCode) {
|
|
|
|
char c;
|
|
|
|
if(U_SUCCESS(errorCode) && len>0 &&
|
|
|
|
(c=buffer[len-1])!=U_FILE_SEP_CHAR && c!=U_FILE_ALT_SEP_CHAR) {
|
|
|
|
append(getDirSepChar(), errorCode);
|
|
|
|
}
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
char CharString::getDirSepChar() const {
|
|
|
|
char dirSepChar = U_FILE_SEP_CHAR;
|
|
|
|
#if (U_FILE_SEP_CHAR != U_FILE_ALT_SEP_CHAR)
|
|
|
|
// We may need to return a different directory separator when building for Cygwin or MSYS2.
|
|
|
|
if(len>0 && !uprv_strchr(data(), U_FILE_SEP_CHAR) && uprv_strchr(data(), U_FILE_ALT_SEP_CHAR))
|
|
|
|
dirSepChar = U_FILE_ALT_SEP_CHAR;
|
|
|
|
#endif
|
|
|
|
return dirSepChar;
|
|
|
|
}
|
|
|
|
|
|
|
|
U_NAMESPACE_END
|