Go to the documentation of this file.
17 #ifndef __NORMALIZER2_H__
18 #define __NORMALIZER2_H__
27 #if !UCONFIG_NO_NORMALIZATION
196 normalize(src, result, errorCode);
456 norm2(n2), set(filterSet) {}
657 #endif // !UCONFIG_NO_NORMALIZATION
658 #endif // __NORMALIZER2_H__
virtual UBool isNormalized(const UnicodeString &s, UErrorCode &errorCode) const
Tests if the string is normalized.
virtual UBool getRawDecomposition(UChar32 c, UnicodeString &decomposition) const
Gets the raw decomposition mapping of c.
virtual UBool getDecomposition(UChar32 c, UnicodeString &decomposition) const =0
Gets the decomposition mapping of c.
virtual UnicodeString & append(UnicodeString &first, const UnicodeString &second, UErrorCode &errorCode) const
Appends the second string to the first string (merging them at the boundary) and returns the first st...
virtual int32_t spanQuickCheckYes(const UnicodeString &s, UErrorCode &errorCode) const =0
Returns the end of the normalized substring of the input string.
UNormalization2Mode
Constants for normalization modes.
static const Normalizer2 * getInstance(const char *packageName, const char *name, UNormalization2Mode mode, UErrorCode &errorCode)
Returns a Normalizer2 instance which uses the specified data file (packageName/name similar to ucnv_o...
Basic definitions for ICU, for both C and C++ APIs.
A mutable set of Unicode characters and multicharacter strings.
int8_t UBool
The ICU boolean type.
~FilteredNormalizer2()
Destructor.
virtual int32_t spanQuickCheckYes(const UnicodeString &s, UErrorCode &errorCode) const
Returns the end of the normalized substring of the input string.
static const Normalizer2 * getNFKCInstance(UErrorCode &errorCode)
Returns a Normalizer2 instance for Unicode NFKC normalization.
virtual UBool hasBoundaryAfter(UChar32 c) const =0
Tests if the character always has a normalization boundary after it, regardless of context.
#define U_COMMON_API
Set to export library symbols from inside the common library, and to import them from outside.
USetSpanCondition
Argument values for whether span() and similar functions continue while the current character is cont...
FilteredNormalizer2(const Normalizer2 &n2, const UnicodeSet &filterSet)
Constructs a filtered normalizer wrapping any Normalizer2 instance and a filter set.
UnicodeString is a string class that stores Unicode characters directly and provides similar function...
static const Normalizer2 * getNFCInstance(UErrorCode &errorCode)
Returns a Normalizer2 instance for Unicode NFC normalization.
int32_t UChar32
Define UChar32 as a type for single Unicode code points.
UObject is the common ICU "boilerplate" class.
virtual UChar32 composePair(UChar32 a, UChar32 b) const
Performs pairwise composition of a & b and returns the composite if there is one.
virtual UBool hasBoundaryBefore(UChar32 c) const
Tests if the character always has a normalization boundary before it, regardless of context.
UErrorCode
Error code to replace exception handling, so that the code is compatible with all C++ compilers,...
Unicode normalization functionality for standard Unicode normalization or for using custom mapping ta...
virtual UNormalizationCheckResult quickCheck(const UnicodeString &s, UErrorCode &errorCode) const =0
Tests if the string is normalized.
virtual UnicodeString & append(UnicodeString &first, const UnicodeString &second, UErrorCode &errorCode) const =0
Appends the second string to the first string (merging them at the boundary) and returns the first st...
UNormalizationCheckResult
Result values for normalization quick check functions.
C API: New API for Unicode Normalization.
virtual UBool isInert(UChar32 c) const
Tests if the character is normalization-inert.
virtual UnicodeString & normalizeSecondAndAppend(UnicodeString &first, const UnicodeString &second, UErrorCode &errorCode) const
Appends the normalized form of the second string to the first string (merging them at the boundary) a...
virtual UBool getRawDecomposition(UChar32 c, UnicodeString &decomposition) const
Gets the raw decomposition mapping of c.
virtual UBool isInert(UChar32 c) const =0
Tests if the character is normalization-inert.
virtual UBool hasBoundaryAfter(UChar32 c) const
Tests if the character always has a normalization boundary after it, regardless of context.
virtual UnicodeString & normalizeSecondAndAppend(UnicodeString &first, const UnicodeString &second, UErrorCode &errorCode) const =0
Appends the normalized form of the second string to the first string (merging them at the boundary) a...
virtual UBool hasBoundaryBefore(UChar32 c) const =0
Tests if the character always has a normalization boundary before it, regardless of context.
virtual uint8_t getCombiningClass(UChar32 c) const
Gets the combining class of c.
virtual UBool isNormalized(const UnicodeString &s, UErrorCode &errorCode) const =0
Tests if the string is normalized.
~Normalizer2()
Destructor.
virtual UChar32 composePair(UChar32 a, UChar32 b) const
Performs pairwise composition of a & b and returns the composite if there is one.
virtual UNormalizationCheckResult quickCheck(const UnicodeString &s, UErrorCode &errorCode) const
Tests if the string is normalized.
static const Normalizer2 * getNFKCCasefoldInstance(UErrorCode &errorCode)
Returns a Normalizer2 instance for Unicode NFKC_Casefold normalization.
#define U_NAMESPACE_END
This is used to end a declaration of a public ICU C++ API.
virtual uint8_t getCombiningClass(UChar32 c) const
Gets the combining class of c.
#define U_NAMESPACE_BEGIN
This is used to begin a declaration of a public ICU C++ API.
static const Normalizer2 * getNFKDInstance(UErrorCode &errorCode)
Returns a Normalizer2 instance for Unicode NFKD normalization.
virtual UnicodeString & normalize(const UnicodeString &src, UnicodeString &dest, UErrorCode &errorCode) const =0
Writes the normalized form of the source string to the destination string (replacing its contents) an...
UnicodeString normalize(const UnicodeString &src, UErrorCode &errorCode) const
Returns the normalized form of the source string.
virtual UnicodeString & normalize(const UnicodeString &src, UnicodeString &dest, UErrorCode &errorCode) const
Writes the normalized form of the source string to the destination string (replacing its contents) an...
static const Normalizer2 * getNFDInstance(UErrorCode &errorCode)
Returns a Normalizer2 instance for Unicode NFD normalization.
virtual UBool getDecomposition(UChar32 c, UnicodeString &decomposition) const
Gets the decomposition mapping of c.
Normalization filtered by a UnicodeSet.