32 class RBBIRuleScanner;
34 class UnicodeSetStringSpan;
36 class RuleCharacterIterator;
285 int32_t bufferCapacity;
299 UnicodeSetStringSpan *stringSpan;
316 inline UBool isBogus(
void)
const;
374 #ifndef U_HIDE_INTERNAL_API 392 UnicodeSet(
const uint16_t buffer[], int32_t bufferLen,
407 #ifndef U_HIDE_INTERNAL_API 501 virtual int32_t hashCode(
void)
const;
530 inline USet *toUSet();
540 inline const USet * toUSet()
const;
555 inline UBool isFrozen()
const;
621 #ifndef U_HIDE_INTERNAL_API 764 virtual int32_t size(
void)
const;
772 virtual UBool isEmpty(
void)
const;
894 int32_t span(
const char16_t *s, int32_t length,
USetSpanCondition spanCondition)
const;
927 int32_t spanBack(
const char16_t *s, int32_t length,
USetSpanCondition spanCondition)
const;
962 int32_t spanUTF8(
const char *s, int32_t length,
USetSpanCondition spanCondition)
const;
981 int32_t spanBackUTF8(
const char *s, int32_t length,
USetSpanCondition spanCondition)
const;
1016 int32_t start, int32_t limit,
1028 int32_t findCodePoint(
UChar32 c)
const;
1049 int32_t indexOf(
UChar32 c)
const;
1060 UChar32 charAt(int32_t index)
const;
1377 virtual int32_t getRangeCount(
void)
const;
1386 virtual UChar32 getRangeStart(int32_t index)
const;
1395 virtual UChar32 getRangeEnd(int32_t index)
const;
1445 int32_t serialize(uint16_t *dest, int32_t destCapacity,
UErrorCode& ec)
const;
1482 friend class USetAccess;
1484 int32_t getStringCount()
const;
1502 friend class RBBIRuleScanner;
1519 void applyPattern(RuleCharacterIterator& chars,
1530 void ensureCapacity(int32_t newLen,
UErrorCode& ec);
1532 void ensureBufferCapacity(int32_t newLen,
UErrorCode& ec);
1534 void swapBuffers(
void);
1539 UBool escapeUnprintable)
const;
1542 UBool escapeUnprintable)
const;
1552 void exclusiveOr(
const UChar32* other, int32_t otherLen, int8_t polarity);
1554 void add(
const UChar32* other, int32_t otherLen, int8_t polarity);
1556 void retain(
const UChar32* other, int32_t otherLen, int8_t polarity);
1566 static UBool resemblesPropertyPattern(RuleCharacterIterator& chars,
1612 void applyPropertyPattern(RuleCharacterIterator& chars,
1623 typedef UBool (*Filter)(
UChar32 codePoint,
void* context);
1634 void applyFilter(Filter filter,
1646 void releasePattern();
1662 return !containsNone(start, end);
1666 return !containsNone(s);
1670 return !containsNone(s);
1674 return (
UBool)(fFlags & kIsBogus);
1682 return reinterpret_cast<const UnicodeSet *
>(uset);
1686 return reinterpret_cast<USet *
>(
this);
1690 return reinterpret_cast<const USet *
>(
this);
1694 int32_t sLength=s.
length();
1697 }
else if(start>sLength) {
1700 return start+span(s.
getBuffer()+start, sLength-start, spanCondition);
1704 int32_t sLength=s.
length();
1707 }
else if(limit>sLength) {
1710 return spanBack(s.
getBuffer(), limit, spanCondition);
static UClassID getStaticClassID()
ICU "poor man's RTTI", returns a UClassID for this class.
int32_t spanBack(const char16_t *s, int32_t length, USetSpanCondition spanCondition) const
Returns the start of the trailing substring of the input string which consists only of characters and...
UMatchDegree
Constants returned by UnicodeMatcher::matches() indicating the degree of match.
U_EXPORT UBool operator==(const StringPiece &x, const StringPiece &y)
Global operator == for StringPiece.
UnicodeSetIterator iterates over the contents of a UnicodeSet.
UBool isBogus(void) const
Determine if this object contains a valid set.
UBool operator!=(const UnicodeSet &o) const
Compares the specified object with this set for equality.
void * UClassID
UClassID is used to identify classes without using the compiler's RTTI.
static UnicodeSet * fromUSet(USet *uset)
Get a UnicodeSet pointer from a USet.
virtual UBool matchesIndexValue(uint8_t v) const =0
Returns TRUE if this matcher will match a character c, where c & 0xFF == v, at offset, in the forward direction (with limit > offset).
An interface that defines both lookup protocol and parsing of symbolic names.
virtual UClassID getDynamicClassID(void) const =0
Returns a unique class ID polymorphically.
virtual UnicodeFunctor * clone() const =0
Return a copy of this object.
Replaceable is an abstract base class representing a string of characters that supports the replaceme...
#define U_NAMESPACE_BEGIN
This is used to begin a declaration of a public ICU C++ API.
UnicodeFilter defines a protocol for selecting a subset of the full range (U+0000 to U+10FFFF) of Uni...
virtual void addMatchSetTo(UnicodeSet &toUnionTo) const =0
Union the set of all characters that may be matched by this object into the given set...
UBool operator!=(const StringPiece &x, const StringPiece &y)
Global operator != for StringPiece.
int32_t UChar32
Define UChar32 as a type for single Unicode code points.
#define NULL
Define NULL if necessary, to nullptr for C++ and to ((void *)0) for C.
UnicodeFunctor is an abstract base class for objects that perform match and/or replace operations on ...
virtual UMatchDegree matches(const Replaceable &text, int32_t &offset, int32_t limit, UBool incremental)
Implement UnicodeMatcher API.
A mutable set of Unicode characters and multicharacter strings.
USetSpanCondition
Argument values for whether span() and similar functions continue while the current character is cont...
#define U_NAMESPACE_END
This is used to end a declaration of a public ICU C++ API.
UProperty
Selection constants for Unicode properties.
UErrorCode
Error code to replace exception handling, so that the code is compatible with all C++ compilers...
int32_t length(void) const
Return the length of the UnicodeString object.
ParsePosition is a simple class used by Format and its subclasses to keep track of the current positi...
char16_t * getBuffer(int32_t minCapacity)
Get a read/write pointer to the internal buffer.
void UnicodeSet_initInclusion(int32_t src, UErrorCode &status)
virtual UnicodeString & toPattern(UnicodeString &result, UBool escapeUnprintable=FALSE) const =0
Returns a string representation of this matcher.
UBool containsSome(UChar32 start, UChar32 end) const
Returns true if this set contains one or more of the characters in the given range.
virtual UBool contains(UChar32 c) const =0
Returns true for characters that are in the selected subset.
#define FALSE
The FALSE value of a UBool.
#define U_COMMON_API
Set to export library symbols from inside the common library, and to import them from outside...
UnicodeString is a string class that stores Unicode characters directly and provides similar function...
UBool isFrozen() const
Determines whether the set has been frozen (made immutable) or not.
USet * toUSet()
Produce a USet * pointer for this UnicodeSet.
int32_t span(const char16_t *s, int32_t length, USetSpanCondition spanCondition) const
Returns the length of the initial substring of the input string which consists only of characters and...
int8_t UBool
The ICU boolean type.