/* ****************************************************************************** * Copyright (C) 2014, International Business Machines * Corporation and others. All Rights Reserved. ****************************************************************************** * simplepatternformatter.h */ #ifndef __SIMPLEPATTERNFORMATTER_H__ #define __SIMPLEPATTERNFORMATTER_H__ #define EXPECTED_PLACEHOLDER_COUNT 3 #include "cmemory.h" #include "unicode/utypes.h" #include "unicode/unistr.h" U_NAMESPACE_BEGIN class SimplePatternFormatterPlaceholderValues; struct PlaceholderInfo { int32_t id; int32_t offset; }; /** * Compiled version of a pattern string such as "{1} was born in {0}". *

* Using SimplePatternFormatter is both faster and safer than adhoc replacement. * They are faster because they are precompiled; they are safer because they * account for curly braces escaped by apostrophe ('). * * Placeholders are of the form \{[0-9]+\}. If a curly brace is preceded * by a single quote, it becomes a curly brace instead of the start of a * placeholder. Two single quotes resolve to one single quote. *

* Example: *

 * SimplePatternFormatter fmt("{1} '{born} in {0}");
 * UnicodeString result;
 * UErrorCode status = U_ZERO_ERROR;
 * // Evaluates to: "paul {born} in england"
 * fmt.format("england", "paul", result, status);
 * 
*/ class U_COMMON_API SimplePatternFormatter : public UMemory { public: /** * Default constructor */ SimplePatternFormatter(); /** * Construct from a pattern. Will never fail if pattern has three or * fewer placeholders in it. */ explicit SimplePatternFormatter(const UnicodeString& pattern); /** * Copy constructor. */ SimplePatternFormatter(const SimplePatternFormatter& other); /** * Assignment operator */ SimplePatternFormatter &operator=(const SimplePatternFormatter& other); /** * Destructor. */ ~SimplePatternFormatter(); /** * Compiles pattern and makes this object represent pattern. * * Returns TRUE on success; FALSE on failure. Will not fail if * there are three or fewer placeholders in pattern. May fail with * U_MEMORY_ALLOCATION_ERROR if there are more than three placeholders. */ UBool compile(const UnicodeString &pattern, UErrorCode &status); /** * Returns (maxPlaceholderId + 1). For example * SimplePatternFormatter("{0} {2}").getPlaceholderCount() * evaluates to 3. * Callers use this function to find out how many values this object * expects when formatting. */ int32_t getPlaceholderCount() const { return placeholderCount; } /** * Returns this pattern with none of the placeholders. */ const UnicodeString &getPatternWithNoPlaceholders() const { return noPlaceholders; } /** * Formats given value. arg0 cannot be appendTo. */ UnicodeString &format( const UnicodeString &args0, UnicodeString &appendTo, UErrorCode &status) const; /** * Formats given values. Neither arg0 nor arg1 can be appendTo. */ UnicodeString &format( const UnicodeString &args0, const UnicodeString &args1, UnicodeString &appendTo, UErrorCode &status) const; /** * Formats given values. Neither arg0, arg1, nor arg2 can be appendTo. */ UnicodeString &format( const UnicodeString &args0, const UnicodeString &args1, const UnicodeString &args2, UnicodeString &appendTo, UErrorCode &status) const; /** * Formats given values. * * The caller retains ownership of all pointers. * @param placeholderValues 1st one corresponds to {0}; 2nd to {1}; * 3rd to {2} etc. If any of these point to appendTo, this method * sets status to U_ILLEGAL_ARGUMENT_ERROR. * @param placeholderValueCount the number of placeholder values * must be at least large enough to provide values for all placeholders * in this object. Otherwise status set to U_ILLEGAL_ARGUMENT_ERROR. * @param appendTo resulting string appended here. * @param offsetArray The offset of each placeholder value in appendTo * stored here. The first value gets the offset of the value for {0}; * the 2nd for {1}; the 3rd for {2} etc. -1 means that the corresponding * placeholder does not exist in this object. If caller is not * interested in offsets, it may pass NULL and 0 for the length. * @param offsetArrayLength the size of offsetArray. If less than * placeholderValueCount only the first offsets get recorded. If * greater than placeholderValueCount, then extra values in offset * array are set to -1. * @param status any error stored here. */ UnicodeString &formatAndAppend( const UnicodeString * const *placeholderValues, int32_t placeholderValueCount, UnicodeString &appendTo, int32_t *offsetArray, int32_t offsetArrayLength, UErrorCode &status) const; /** * Formats given values. * * The caller retains ownership of all pointers. * @param placeholderValues 1st one corresponds to {0}; 2nd to {1}; * 3rd to {2} etc. May include pointer to result in which case * the previous value of result is used for the corresponding * placeholder. * @param placeholderValueCount the number of placeholder values * must be at least large enough to provide values for all placeholders * in this object. Otherwise status set to U_ILLEGAL_ARGUMENT_ERROR. * @param result resulting string stored here overwriting any previous * value. * @param offsetArray The offset of each placeholder value in result * stored here. The first value gets the offset of the value for {0}; * the 2nd for {1}; the 3rd for {2} etc. -1 means that the corresponding * placeholder does not exist in this object. If caller is not * interested in offsets, it may pass NULL and 0 for the length. * @param offsetArrayLength the size of offsetArray. If less than * placeholderValueCount only the first offsets get recorded. If * greater than placeholderValueCount, then extra values in offset * array are set to -1. * @param status any error stored here. */ UnicodeString &formatAndReplace( const UnicodeString * const *placeholderValues, int32_t placeholderValueCount, UnicodeString &result, int32_t *offsetArray, int32_t offsetArrayLength, UErrorCode &status) const; private: UnicodeString noPlaceholders; MaybeStackArray placeholders; int32_t placeholderSize; int32_t placeholderCount; UBool firstPlaceholderReused; // A Placeholder value that is the same as appendTo is treated as the // empty string. UnicodeString &formatAndAppend( const SimplePatternFormatterPlaceholderValues &placeholderValues, UnicodeString &appendTo, int32_t *offsetArray, int32_t offsetArrayLength) const; // Returns the placeholder at the beginning of this pattern // (e.g 3 for placeholder {3}). Returns -1 if the beginning of pattern // is text or if the placeholder at the beginning of this pattern // is used again in the middle of the pattern. int32_t getUniquePlaceholderAtStart() const; // ensureCapacity ensures that the capacity of the placeholders array // is desiredCapacity. If ensureCapacity must resize the placeholders // array, the first placeholderSize elements stay in the array. Note // that ensureCapcity NEVER changes the value of placeholderSize only // the capacity of the placeholders array. // If there is no memory allocation error when resizing, this // function returns desiredCapacity. If there is a memory allocation // error, this function leaves the placeholders array unchanged and // returns the smaller, old capacity. ensureCapacity resizes only if // the current capacity of placeholders array is less than desiredCapacity. // Otherwise, it leaves the placeholders array unchanged. If caller // specifies an allocation size, then it must be at least as large as // desiredCapacity. In that case, if ensureCapacity resizes, it will // allocate allocationSize spots instead of desiredCapacity spots in // the array. If caller is calling ensureCapacity in a loop while adding // elements, it is recommended that it use an allocationSize of // approximately twice desiredCapacity to avoid memory allocation with // every call to ensureCapacity. int32_t ensureCapacity(int32_t desiredCapacity, int32_t allocationSize=0); // Records the offset of an individual placeholder in the noPlaceholders // string. UBool addPlaceholder(int32_t id, int32_t offset); }; U_NAMESPACE_END #endif