271 lines
		
	
	
		
			8.6 KiB
		
	
	
	
		
			C++
		
	
	
	
			
		
		
	
	
			271 lines
		
	
	
		
			8.6 KiB
		
	
	
	
		
			C++
		
	
	
	
| // © 2017 and later: Unicode, Inc. and others.
 | |
| // License & terms of use: http://www.unicode.org/copyright.html
 | |
| 
 | |
| #include "unicode/utypes.h"
 | |
| 
 | |
| #if !UCONFIG_NO_FORMATTING
 | |
| #ifndef __NUMBER_STRINGBUILDER_H__
 | |
| #define __NUMBER_STRINGBUILDER_H__
 | |
| 
 | |
| 
 | |
| #include <cstdint>
 | |
| #include <type_traits>
 | |
| 
 | |
| #include "cstring.h"
 | |
| #include "uassert.h"
 | |
| #include "fphdlimp.h"
 | |
| 
 | |
| U_NAMESPACE_BEGIN
 | |
| 
 | |
| class FormattedValueStringBuilderImpl;
 | |
| 
 | |
| /**
 | |
|  * A StringBuilder optimized for formatting. It implements the following key
 | |
|  * features beyond a UnicodeString:
 | |
|  *
 | |
|  * <ol>
 | |
|  * <li>Efficient prepend as well as append.
 | |
|  * <li>Keeps track of Fields in an efficient manner.
 | |
|  * </ol>
 | |
|  *
 | |
|  * See also FormattedValueStringBuilderImpl.
 | |
|  *
 | |
|  * @author sffc (Shane Carr)
 | |
|  */
 | |
| class U_I18N_API FormattedStringBuilder : public UMemory {
 | |
|   private:
 | |
|     static const int32_t DEFAULT_CAPACITY = 40;
 | |
| 
 | |
|     template<typename T>
 | |
|     union ValueOrHeapArray {
 | |
|         T value[DEFAULT_CAPACITY];
 | |
|         struct {
 | |
|             T *ptr;
 | |
|             int32_t capacity;
 | |
|         } heap;
 | |
|     };
 | |
| 
 | |
|   public:
 | |
|     FormattedStringBuilder();
 | |
| 
 | |
|     ~FormattedStringBuilder();
 | |
| 
 | |
|     FormattedStringBuilder(const FormattedStringBuilder &other);
 | |
| 
 | |
|     // Convention: bottom 4 bits for field, top 4 bits for field category.
 | |
|     // Field category 0 implies the number category so that the number field
 | |
|     // literals can be directly passed as a Field type.
 | |
|     // Exported as U_I18N_API so it can be used by other exports on Windows.
 | |
|     struct U_I18N_API Field {
 | |
|         uint8_t bits;
 | |
| 
 | |
|         Field() = default;
 | |
|         constexpr Field(uint8_t category, uint8_t field);
 | |
| 
 | |
|         inline UFieldCategory getCategory() const;
 | |
|         inline int32_t getField() const;
 | |
|         inline bool isNumeric() const;
 | |
|         inline bool isUndefined() const;
 | |
|         inline bool operator==(const Field& other) const;
 | |
|         inline bool operator!=(const Field& other) const;
 | |
|     };
 | |
| 
 | |
|     FormattedStringBuilder &operator=(const FormattedStringBuilder &other);
 | |
| 
 | |
|     int32_t length() const;
 | |
| 
 | |
|     int32_t codePointCount() const;
 | |
| 
 | |
|     inline char16_t charAt(int32_t index) const {
 | |
|         U_ASSERT(index >= 0);
 | |
|         U_ASSERT(index < fLength);
 | |
|         return getCharPtr()[fZero + index];
 | |
|     }
 | |
| 
 | |
|     inline Field fieldAt(int32_t index) const {
 | |
|         U_ASSERT(index >= 0);
 | |
|         U_ASSERT(index < fLength);
 | |
|         return getFieldPtr()[fZero + index];
 | |
|     }
 | |
| 
 | |
|     UChar32 getFirstCodePoint() const;
 | |
| 
 | |
|     UChar32 getLastCodePoint() const;
 | |
| 
 | |
|     UChar32 codePointAt(int32_t index) const;
 | |
| 
 | |
|     UChar32 codePointBefore(int32_t index) const;
 | |
| 
 | |
|     FormattedStringBuilder &clear();
 | |
| 
 | |
|     /** Appends a UTF-16 code unit. */
 | |
|     inline int32_t appendChar16(char16_t codeUnit, Field field, UErrorCode& status) {
 | |
|         // appendCodePoint handles both code units and code points.
 | |
|         return insertCodePoint(fLength, codeUnit, field, status);
 | |
|     }
 | |
| 
 | |
|     /** Inserts a UTF-16 code unit. Note: insert at index 0 is very efficient. */
 | |
|     inline int32_t insertChar16(int32_t index, char16_t codeUnit, Field field, UErrorCode& status) {
 | |
|         // insertCodePoint handles both code units and code points.
 | |
|         return insertCodePoint(index, codeUnit, field, status);
 | |
|     }
 | |
| 
 | |
|     /** Appends a Unicode code point. */
 | |
|     inline int32_t appendCodePoint(UChar32 codePoint, Field field, UErrorCode &status) {
 | |
|         return insertCodePoint(fLength, codePoint, field, status);
 | |
|     }
 | |
| 
 | |
|     /** Inserts a Unicode code point. Note: insert at index 0 is very efficient. */
 | |
|     int32_t insertCodePoint(int32_t index, UChar32 codePoint, Field field, UErrorCode &status);
 | |
| 
 | |
|     /** Appends a string. */
 | |
|     inline int32_t append(const UnicodeString &unistr, Field field, UErrorCode &status) {
 | |
|         return insert(fLength, unistr, field, status);
 | |
|     }
 | |
| 
 | |
|     /** Inserts a string. Note: insert at index 0 is very efficient. */
 | |
|     int32_t insert(int32_t index, const UnicodeString &unistr, Field field, UErrorCode &status);
 | |
| 
 | |
|     /** Inserts a substring. Note: insert at index 0 is very efficient.
 | |
|      *
 | |
|      * @param start Start index of the substring of unistr to be inserted.
 | |
|      * @param end End index of the substring of unistr to be inserted (exclusive).
 | |
|      */
 | |
|     int32_t insert(int32_t index, const UnicodeString &unistr, int32_t start, int32_t end, Field field,
 | |
|                    UErrorCode &status);
 | |
| 
 | |
|     /** Deletes a substring and then inserts a string at that same position.
 | |
|      * Similar to JavaScript Array.prototype.splice().
 | |
|      *
 | |
|      * @param startThis Start of the span to delete.
 | |
|      * @param endThis End of the span to delete (exclusive).
 | |
|      * @param unistr The string to insert at the deletion position.
 | |
|      * @param startOther Start index of the substring of unistr to be inserted.
 | |
|      * @param endOther End index of the substring of unistr to be inserted (exclusive).
 | |
|      */
 | |
|     int32_t splice(int32_t startThis, int32_t endThis,  const UnicodeString &unistr,
 | |
|                    int32_t startOther, int32_t endOther, Field field, UErrorCode& status);
 | |
| 
 | |
|     /** Appends a formatted string. */
 | |
|     int32_t append(const FormattedStringBuilder &other, UErrorCode &status);
 | |
| 
 | |
|     /** Inserts a formatted string. Note: insert at index 0 is very efficient. */
 | |
|     int32_t insert(int32_t index, const FormattedStringBuilder &other, UErrorCode &status);
 | |
| 
 | |
|     /**
 | |
|      * Ensures that the string buffer contains a NUL terminator. The NUL terminator does
 | |
|      * not count toward the string length. Any further changes to the string (insert or
 | |
|      * append) may invalidate the NUL terminator.
 | |
|      *
 | |
|      * You should call this method after the formatted string is completely built if you
 | |
|      * plan to return a pointer to the string from a C API.
 | |
|      */
 | |
|     void writeTerminator(UErrorCode& status);
 | |
| 
 | |
|     /**
 | |
|      * Gets a "safe" UnicodeString that can be used even after the FormattedStringBuilder is destructed.
 | |
|      */
 | |
|     UnicodeString toUnicodeString() const;
 | |
| 
 | |
|     /**
 | |
|      * Gets an "unsafe" UnicodeString that is valid only as long as the FormattedStringBuilder is alive and
 | |
|      * unchanged. Slightly faster than toUnicodeString().
 | |
|      */
 | |
|     const UnicodeString toTempUnicodeString() const;
 | |
| 
 | |
|     UnicodeString toDebugString() const;
 | |
| 
 | |
|     const char16_t *chars() const;
 | |
| 
 | |
|     bool contentEquals(const FormattedStringBuilder &other) const;
 | |
| 
 | |
|     bool containsField(Field field) const;
 | |
| 
 | |
|   private:
 | |
|     bool fUsingHeap = false;
 | |
|     ValueOrHeapArray<char16_t> fChars;
 | |
|     ValueOrHeapArray<Field> fFields;
 | |
|     int32_t fZero = DEFAULT_CAPACITY / 2;
 | |
|     int32_t fLength = 0;
 | |
| 
 | |
|     inline char16_t *getCharPtr() {
 | |
|         return fUsingHeap ? fChars.heap.ptr : fChars.value;
 | |
|     }
 | |
| 
 | |
|     inline const char16_t *getCharPtr() const {
 | |
|         return fUsingHeap ? fChars.heap.ptr : fChars.value;
 | |
|     }
 | |
| 
 | |
|     inline Field *getFieldPtr() {
 | |
|         return fUsingHeap ? fFields.heap.ptr : fFields.value;
 | |
|     }
 | |
| 
 | |
|     inline const Field *getFieldPtr() const {
 | |
|         return fUsingHeap ? fFields.heap.ptr : fFields.value;
 | |
|     }
 | |
| 
 | |
|     inline int32_t getCapacity() const {
 | |
|         return fUsingHeap ? fChars.heap.capacity : DEFAULT_CAPACITY;
 | |
|     }
 | |
| 
 | |
|     int32_t prepareForInsert(int32_t index, int32_t count, UErrorCode &status);
 | |
| 
 | |
|     int32_t prepareForInsertHelper(int32_t index, int32_t count, UErrorCode &status);
 | |
| 
 | |
|     int32_t remove(int32_t index, int32_t count);
 | |
| 
 | |
|     friend class FormattedValueStringBuilderImpl;
 | |
| };
 | |
| 
 | |
| static_assert(
 | |
|     std::is_pod<FormattedStringBuilder::Field>::value,
 | |
|     "Field should be a POD type for efficient initialization");
 | |
| 
 | |
| constexpr FormattedStringBuilder::Field::Field(uint8_t category, uint8_t field)
 | |
|     : bits((
 | |
|         U_ASSERT(category <= 0xf),
 | |
|         U_ASSERT(field <= 0xf),
 | |
|         static_cast<uint8_t>((category << 4) | field)
 | |
|     )) {}
 | |
| 
 | |
| /**
 | |
|  * Internal constant for the undefined field for use in FormattedStringBuilder.
 | |
|  */
 | |
| constexpr FormattedStringBuilder::Field kUndefinedField = {UFIELD_CATEGORY_UNDEFINED, 0};
 | |
| 
 | |
| /**
 | |
|  * Internal field to signal "numeric" when fields are not supported in NumberFormat.
 | |
|  */
 | |
| constexpr FormattedStringBuilder::Field kGeneralNumericField = {UFIELD_CATEGORY_UNDEFINED, 1};
 | |
| 
 | |
| inline UFieldCategory FormattedStringBuilder::Field::getCategory() const {
 | |
|     return static_cast<UFieldCategory>(bits >> 4);
 | |
| }
 | |
| 
 | |
| inline int32_t FormattedStringBuilder::Field::getField() const {
 | |
|     return bits & 0xf;
 | |
| }
 | |
| 
 | |
| inline bool FormattedStringBuilder::Field::isNumeric() const {
 | |
|     return getCategory() == UFIELD_CATEGORY_NUMBER || *this == kGeneralNumericField;
 | |
| }
 | |
| 
 | |
| inline bool FormattedStringBuilder::Field::isUndefined() const {
 | |
|     return getCategory() == UFIELD_CATEGORY_UNDEFINED;
 | |
| }
 | |
| 
 | |
| inline bool FormattedStringBuilder::Field::operator==(const Field& other) const {
 | |
|     return bits == other.bits;
 | |
| }
 | |
| 
 | |
| inline bool FormattedStringBuilder::Field::operator!=(const Field& other) const {
 | |
|     return bits != other.bits;
 | |
| }
 | |
| 
 | |
| U_NAMESPACE_END
 | |
| 
 | |
| 
 | |
| #endif //__NUMBER_STRINGBUILDER_H__
 | |
| 
 | |
| #endif /* #if !UCONFIG_NO_FORMATTING */
 |