201 lines
7.6 KiB
C++
201 lines
7.6 KiB
C++
// © 2016 and later: Unicode, Inc. and others.
// License & terms of use: http://www.unicode.org/copyright.html
/*
**********************************************************************
*   Copyright (c) 2001-2015, International Business Machines
*   Corporation and others.  All Rights Reserved.
**********************************************************************
*   Date        Name        Description
*   11/19/2001  aliu        Creation.
*   05/19/2010  markus      Rewritten from scratch
**********************************************************************
*/

||
|
#ifndef CHARSTRING_H
|
||
|
#define CHARSTRING_H
|
||
|
|
||
|
#include "unicode/utypes.h"
|
||
|
#include "unicode/unistr.h"
|
||
|
#include "unicode/uobject.h"
|
||
|
#include "cmemory.h"
|
||
|
|
||
|
U_NAMESPACE_BEGIN
|
||
|
|
||
|
// Windows needs us to DLL-export the MaybeStackArray template specialization,
|
||
|
// but MacOS X cannot handle it. Same as in digitlst.h.
|
||
|
#if !U_PLATFORM_IS_DARWIN_BASED
|
||
|
template class U_COMMON_API MaybeStackArray<char, 40>;
|
||
|
#endif
|
||
|
|
||
|
/**
|
||
|
* ICU-internal char * string class.
|
||
|
* This class does not assume or enforce any particular character encoding.
|
||
|
* Raw bytes can be stored. The string object owns its characters.
|
||
|
* A terminating NUL is stored, but the class does not prevent embedded NUL characters.
|
||
|
*
|
||
|
* This class wants to be convenient but is also deliberately minimalist.
|
||
|
* Please do not add methods if they only add minor convenience.
|
||
|
* For example:
|
||
|
* cs.data()[5]='a'; // no need for setCharAt(5, 'a')
|
||
|
*/
|
||
|
class U_COMMON_API CharString : public UMemory {
|
||
|
public:
|
||
|
CharString() : len(0) { buffer[0]=0; }
|
||
|
CharString(StringPiece s, UErrorCode &errorCode) : len(0) {
|
||
|
buffer[0]=0;
|
||
|
append(s, errorCode);
|
||
|
}
|
||
|
CharString(const CharString &s, UErrorCode &errorCode) : len(0) {
|
||
|
buffer[0]=0;
|
||
|
append(s, errorCode);
|
||
|
}
|
||
|
CharString(const char *s, int32_t sLength, UErrorCode &errorCode) : len(0) {
|
||
|
buffer[0]=0;
|
||
|
append(s, sLength, errorCode);
|
||
|
}
|
||
|
~CharString() {}
|
||
|
|
||
|
/**
|
||
|
* Move constructor; might leave src in an undefined state.
|
||
|
* This string will have the same contents and state that the source string had.
|
||
|
*/
|
||
|
CharString(CharString &&src) noexcept;
|
||
|
/**
|
||
|
* Move assignment operator; might leave src in an undefined state.
|
||
|
* This string will have the same contents and state that the source string had.
|
||
|
* The behavior is undefined if *this and src are the same object.
|
||
|
*/
|
||
|
CharString &operator=(CharString &&src) noexcept;
|
||
|
|
||
|
/**
|
||
|
* Replaces this string's contents with the other string's contents.
|
||
|
* CharString does not support the standard copy constructor nor
|
||
|
* the assignment operator, to make copies explicit and to
|
||
|
* use a UErrorCode where memory allocations might be needed.
|
||
|
*/
|
||
|
CharString ©From(const CharString &other, UErrorCode &errorCode);
|
||
|
|
||
|
UBool isEmpty() const { return len==0; }
|
||
|
int32_t length() const { return len; }
|
||
|
char operator[](int32_t index) const { return buffer[index]; }
|
||
|
StringPiece toStringPiece() const { return StringPiece(buffer.getAlias(), len); }
|
||
|
|
||
|
const char *data() const { return buffer.getAlias(); }
|
||
|
char *data() { return buffer.getAlias(); }
|
||
|
/**
|
||
|
* Allocates length()+1 chars and copies the NUL-terminated data().
|
||
|
* The caller must uprv_free() the result.
|
||
|
*/
|
||
|
char *cloneData(UErrorCode &errorCode) const;
|
||
|
/**
|
||
|
* Copies the contents of the string into dest.
|
||
|
* Checks if there is enough space in dest, extracts the entire string if possible,
|
||
|
* and NUL-terminates dest if possible.
|
||
|
*
|
||
|
* If the string fits into dest but cannot be NUL-terminated (length()==capacity),
|
||
|
* then the error code is set to U_STRING_NOT_TERMINATED_WARNING.
|
||
|
* If the string itself does not fit into dest (length()>capacity),
|
||
|
* then the error code is set to U_BUFFER_OVERFLOW_ERROR.
|
||
|
*
|
||
|
* @param dest Destination string buffer.
|
||
|
* @param capacity Size of the dest buffer (number of chars).
|
||
|
* @param errorCode ICU error code.
|
||
|
* @return length()
|
||
|
*/
|
||
|
int32_t extract(char *dest, int32_t capacity, UErrorCode &errorCode) const;
|
||
|
|
||
|
bool operator==(const CharString& other) const {
|
||
|
return len == other.length() && (len == 0 || uprv_memcmp(data(), other.data(), len) == 0);
|
||
|
}
|
||
|
bool operator!=(const CharString& other) const {
|
||
|
return !operator==(other);
|
||
|
}
|
||
|
|
||
|
bool operator==(StringPiece other) const {
|
||
|
return len == other.length() && (len == 0 || uprv_memcmp(data(), other.data(), len) == 0);
|
||
|
}
|
||
|
bool operator!=(StringPiece other) const {
|
||
|
return !operator==(other);
|
||
|
}
|
||
|
|
||
|
/** @return last index of c, or -1 if c is not in this string */
|
||
|
int32_t lastIndexOf(char c) const;
|
||
|
|
||
|
bool contains(StringPiece s) const;
|
||
|
|
||
|
CharString &clear() { len=0; buffer[0]=0; return *this; }
|
||
|
CharString &truncate(int32_t newLength);
|
||
|
|
||
|
CharString &append(char c, UErrorCode &errorCode);
|
||
|
CharString &append(StringPiece s, UErrorCode &errorCode) {
|
||
|
return append(s.data(), s.length(), errorCode);
|
||
|
}
|
||
|
CharString &append(const CharString &s, UErrorCode &errorCode) {
|
||
|
return append(s.data(), s.length(), errorCode);
|
||
|
}
|
||
|
CharString &append(const char *s, int32_t sLength, UErrorCode &status);
|
||
|
|
||
|
CharString &appendNumber(int32_t number, UErrorCode &status);
|
||
|
|
||
|
/**
|
||
|
* Returns a writable buffer for appending and writes the buffer's capacity to
|
||
|
* resultCapacity. Guarantees resultCapacity>=minCapacity if U_SUCCESS().
|
||
|
* There will additionally be space for a terminating NUL right at resultCapacity.
|
||
|
* (This function is similar to ByteSink.GetAppendBuffer().)
|
||
|
*
|
||
|
* The returned buffer is only valid until the next write operation
|
||
|
* on this string.
|
||
|
*
|
||
|
* After writing at most resultCapacity bytes, call append() with the
|
||
|
* pointer returned from this function and the number of bytes written.
|
||
|
*
|
||
|
* @param minCapacity required minimum capacity of the returned buffer;
|
||
|
* must be non-negative
|
||
|
* @param desiredCapacityHint desired capacity of the returned buffer;
|
||
|
* must be non-negative
|
||
|
* @param resultCapacity will be set to the capacity of the returned buffer
|
||
|
* @param errorCode in/out error code
|
||
|
* @return a buffer with resultCapacity>=min_capacity
|
||
|
*/
|
||
|
char *getAppendBuffer(int32_t minCapacity,
|
||
|
int32_t desiredCapacityHint,
|
||
|
int32_t &resultCapacity,
|
||
|
UErrorCode &errorCode);
|
||
|
|
||
|
CharString &appendInvariantChars(const UnicodeString &s, UErrorCode &errorCode);
|
||
|
CharString &appendInvariantChars(const char16_t* uchars, int32_t ucharsLen, UErrorCode& errorCode);
|
||
|
|
||
|
/**
|
||
|
* Appends a filename/path part, e.g., a directory name.
|
||
|
* First appends a U_FILE_SEP_CHAR or U_FILE_ALT_SEP_CHAR if necessary.
|
||
|
* Does nothing if s is empty.
|
||
|
*/
|
||
|
CharString &appendPathPart(StringPiece s, UErrorCode &errorCode);
|
||
|
|
||
|
/**
|
||
|
* Appends a U_FILE_SEP_CHAR or U_FILE_ALT_SEP_CHAR if this string is not empty
|
||
|
* and does not already end with a U_FILE_SEP_CHAR or U_FILE_ALT_SEP_CHAR.
|
||
|
*/
|
||
|
CharString &ensureEndsWithFileSeparator(UErrorCode &errorCode);
|
||
|
|
||
|
private:
|
||
|
MaybeStackArray<char, 40> buffer;
|
||
|
int32_t len;
|
||
|
|
||
|
UBool ensureCapacity(int32_t capacity, int32_t desiredCapacityHint, UErrorCode &errorCode);
|
||
|
|
||
|
CharString(const CharString &other) = delete; // forbid copying of this class
|
||
|
CharString &operator=(const CharString &other) = delete; // forbid copying of this class
|
||
|
|
||
|
/**
|
||
|
* Returns U_FILE_ALT_SEP_CHAR if found in string, and U_FILE_SEP_CHAR is not found.
|
||
|
* Otherwise returns U_FILE_SEP_CHAR.
|
||
|
*/
|
||
|
char getDirSepChar() const;
|
||
|
};
|
||
|
|
||
|
U_NAMESPACE_END
|
||
|
|
||
|
#endif
|
||
|
//eof
|