1 // © 2016 and later: Unicode, Inc. and others. 2 // License & terms of use: http://www.unicode.org/copyright.html 3 /* 4 ********************************************************************** 5 * Copyright (c) 2001-2015, International Business Machines 6 * Corporation and others. All Rights Reserved. 7 ********************************************************************** 8 * Date Name Description 9 * 11/19/2001 aliu Creation. 10 * 05/19/2010 markus Rewritten from scratch 11 ********************************************************************** 12 */ 13 14 #ifndef CHARSTRING_H 15 #define CHARSTRING_H 16 17 #include "unicode/utypes.h" 18 #include "unicode/unistr.h" 19 #include "unicode/uobject.h" 20 #include "cmemory.h" 21 22 U_NAMESPACE_BEGIN 23 24 // Windows needs us to DLL-export the MaybeStackArray template specialization, 25 // but MacOS X cannot handle it. Same as in digitlst.h. 26 #if !U_PLATFORM_IS_DARWIN_BASED 27 template class U_COMMON_API MaybeStackArray<char, 40>; 28 #endif 29 30 /** 31 * ICU-internal char * string class. 32 * This class does not assume or enforce any particular character encoding. 33 * Raw bytes can be stored. The string object owns its characters. 34 * A terminating NUL is stored, but the class does not prevent embedded NUL characters. 35 * 36 * This class wants to be convenient but is also deliberately minimalist. 37 * Please do not add methods if they only add minor convenience. 38 * For example: 39 * cs.data()[5]='a'; // no need for setCharAt(5, 'a') 40 */ 41 class U_COMMON_API CharString : public UMemory { 42 public: CharString()43 CharString() : len(0) { buffer[0]=0; } CharString(StringPiece s,UErrorCode & errorCode)44 CharString(StringPiece s, UErrorCode &errorCode) : len(0) { 45 buffer[0]=0; 46 append(s, errorCode); 47 } CharString(const CharString & s,UErrorCode & errorCode)48 CharString(const CharString &s, UErrorCode &errorCode) : len(0) { 49 buffer[0]=0; 50 append(s, errorCode); 51 } CharString(const char * s,int32_t sLength,UErrorCode & errorCode)52 CharString(const char *s, int32_t sLength, UErrorCode &errorCode) : len(0) { 53 buffer[0]=0; 54 append(s, sLength, errorCode); 55 } ~CharString()56 ~CharString() {} 57 58 /** 59 * Move constructor; might leave src in an undefined state. 60 * This string will have the same contents and state that the source string had. 61 */ 62 CharString(CharString &&src) noexcept; 63 /** 64 * Move assignment operator; might leave src in an undefined state. 65 * This string will have the same contents and state that the source string had. 66 * The behavior is undefined if *this and src are the same object. 67 */ 68 CharString &operator=(CharString &&src) noexcept; 69 70 /** 71 * Replaces this string's contents with the other string's contents. 72 * CharString does not support the standard copy constructor nor 73 * the assignment operator, to make copies explicit and to 74 * use a UErrorCode where memory allocations might be needed. 75 */ 76 CharString ©From(const CharString &other, UErrorCode &errorCode); 77 isEmpty()78 UBool isEmpty() const { return len==0; } length()79 int32_t length() const { return len; } 80 char operator[](int32_t index) const { return buffer[index]; } toStringPiece()81 StringPiece toStringPiece() const { return StringPiece(buffer.getAlias(), len); } 82 data()83 const char *data() const { return buffer.getAlias(); } data()84 char *data() { return buffer.getAlias(); } 85 /** 86 * Allocates length()+1 chars and copies the NUL-terminated data(). 87 * The caller must uprv_free() the result. 88 */ 89 char *cloneData(UErrorCode &errorCode) const; 90 /** 91 * Copies the contents of the string into dest. 92 * Checks if there is enough space in dest, extracts the entire string if possible, 93 * and NUL-terminates dest if possible. 94 * 95 * If the string fits into dest but cannot be NUL-terminated (length()==capacity), 96 * then the error code is set to U_STRING_NOT_TERMINATED_WARNING. 97 * If the string itself does not fit into dest (length()>capacity), 98 * then the error code is set to U_BUFFER_OVERFLOW_ERROR. 99 * 100 * @param dest Destination string buffer. 101 * @param capacity Size of the dest buffer (number of chars). 102 * @param errorCode ICU error code. 103 * @return length() 104 */ 105 int32_t extract(char *dest, int32_t capacity, UErrorCode &errorCode) const; 106 107 bool operator==(const CharString& other) const { 108 return len == other.length() && (len == 0 || uprv_memcmp(data(), other.data(), len) == 0); 109 } 110 bool operator!=(const CharString& other) const { 111 return !operator==(other); 112 } 113 114 bool operator==(StringPiece other) const { 115 return len == other.length() && (len == 0 || uprv_memcmp(data(), other.data(), len) == 0); 116 } 117 bool operator!=(StringPiece other) const { 118 return !operator==(other); 119 } 120 121 /** @return last index of c, or -1 if c is not in this string */ 122 int32_t lastIndexOf(char c) const; 123 124 bool contains(StringPiece s) const; 125 clear()126 CharString &clear() { len=0; buffer[0]=0; return *this; } 127 CharString &truncate(int32_t newLength); 128 129 CharString &append(char c, UErrorCode &errorCode); append(StringPiece s,UErrorCode & errorCode)130 CharString &append(StringPiece s, UErrorCode &errorCode) { 131 return append(s.data(), s.length(), errorCode); 132 } append(const CharString & s,UErrorCode & errorCode)133 CharString &append(const CharString &s, UErrorCode &errorCode) { 134 return append(s.data(), s.length(), errorCode); 135 } 136 CharString &append(const char *s, int32_t sLength, UErrorCode &status); 137 138 CharString &appendNumber(int32_t number, UErrorCode &status); 139 140 /** 141 * Returns a writable buffer for appending and writes the buffer's capacity to 142 * resultCapacity. Guarantees resultCapacity>=minCapacity if U_SUCCESS(). 143 * There will additionally be space for a terminating NUL right at resultCapacity. 144 * (This function is similar to ByteSink.GetAppendBuffer().) 145 * 146 * The returned buffer is only valid until the next write operation 147 * on this string. 148 * 149 * After writing at most resultCapacity bytes, call append() with the 150 * pointer returned from this function and the number of bytes written. 151 * 152 * @param minCapacity required minimum capacity of the returned buffer; 153 * must be non-negative 154 * @param desiredCapacityHint desired capacity of the returned buffer; 155 * must be non-negative 156 * @param resultCapacity will be set to the capacity of the returned buffer 157 * @param errorCode in/out error code 158 * @return a buffer with resultCapacity>=min_capacity 159 */ 160 char *getAppendBuffer(int32_t minCapacity, 161 int32_t desiredCapacityHint, 162 int32_t &resultCapacity, 163 UErrorCode &errorCode); 164 165 CharString &appendInvariantChars(const UnicodeString &s, UErrorCode &errorCode); 166 CharString &appendInvariantChars(const char16_t* uchars, int32_t ucharsLen, UErrorCode& errorCode); 167 168 /** 169 * Appends a filename/path part, e.g., a directory name. 170 * First appends a U_FILE_SEP_CHAR or U_FILE_ALT_SEP_CHAR if necessary. 171 * Does nothing if s is empty. 172 */ 173 CharString &appendPathPart(StringPiece s, UErrorCode &errorCode); 174 175 /** 176 * Appends a U_FILE_SEP_CHAR or U_FILE_ALT_SEP_CHAR if this string is not empty 177 * and does not already end with a U_FILE_SEP_CHAR or U_FILE_ALT_SEP_CHAR. 178 */ 179 CharString &ensureEndsWithFileSeparator(UErrorCode &errorCode); 180 181 private: 182 MaybeStackArray<char, 40> buffer; 183 int32_t len; 184 185 UBool ensureCapacity(int32_t capacity, int32_t desiredCapacityHint, UErrorCode &errorCode); 186 187 CharString(const CharString &other) = delete; // forbid copying of this class 188 CharString &operator=(const CharString &other) = delete; // forbid copying of this class 189 190 /** 191 * Returns U_FILE_ALT_SEP_CHAR if found in string, and U_FILE_SEP_CHAR is not found. 192 * Otherwise returns U_FILE_SEP_CHAR. 193 */ 194 char getDirSepChar() const; 195 }; 196 197 U_NAMESPACE_END 198 199 #endif 200 //eof 201