17 #if U_SHOW_CPLUSPLUS_API
19 #endif // U_SHOW_CPLUSPLUS_API
25 #ifndef UBRK_TYPEDEF_UBREAK_ITERATOR
26 # define UBRK_TYPEDEF_UBREAK_ITERATOR
34 #if !UCONFIG_NO_BREAK_ITERATION
112 #ifndef U_HIDE_DEPRECATED_API
127 #endif // U_HIDE_DEPRECATED_API
133 #define UBRK_DONE ((int32_t) -1)
296 const UChar * text, int32_t textLength,
299 #ifndef U_HIDE_DEPRECATED_API
323 int32_t *pBufferSize,
328 #ifndef U_HIDE_DRAFT_API
341 #endif // U_HIDE_DRAFT_API
343 #ifndef U_HIDE_DEPRECATED_API
349 #define U_BRK_SAFECLONE_BUFFERSIZE 1
362 #if U_SHOW_CPLUSPLUS_API
516 U_CAPI const char* U_EXPORT2
584 U_CAPI const char* U_EXPORT2
645 uint8_t * binaryRules, int32_t rulesCapacity,
struct UBreakIterator UBreakIterator
Opaque type representing an ICU Break iterator object.
Tag value for sentences that do not contain an ending sentence terminator ('. ...
U_CAPI int32_t ubrk_getRuleStatus(UBreakIterator *bi)
Return the status from the break rule that determined the most recently returned break position...
Tag value for words containing kana characters, upper limit.
Tag value for words containing ideographic characters, lower limit.
Tag value for words containing letters, upper limit.
Upper bound for hard line breaks.
U_CAPI int32_t ubrk_current(const UBreakIterator *bi)
Determine the most recently-returned text boundary.
#define U_CAPI
This is used to declare a function as a public ICU C API.
U_CAPI int32_t ubrk_getRuleStatusVec(UBreakIterator *bi, int32_t *fillInVec, int32_t capacity, UErrorCode *status)
Get the statuses from the break rules that determined the most recently returned break position...
Tag value for words containing kana characters, lower limit.
U_CAPI int32_t ubrk_preceding(UBreakIterator *bi, int32_t offset)
Set the iterator position to the first boundary preceding the specified offset.
ULineBreakTag
Enum constants for the line break tags returned by getRuleStatus().
UWordBreak
Enum constants for the word break tags returned by getRuleStatus().
USentenceBreakTag
Enum constants for the sentence break tags returned by getRuleStatus().
Tag value for a hard, or mandatory line break.
U_CAPI void ubrk_setText(UBreakIterator *bi, const UChar *text, int32_t textLength, UErrorCode *status)
Sets an existing iterator to point to a new piece of text.
Upper bound for tags for sentences ended by sentence terminators.
U_CAPI int32_t ubrk_getBinaryRules(UBreakIterator *bi, uint8_t *binaryRules, int32_t rulesCapacity, UErrorCode *status)
Get a compiled binary version of the rules specifying the behavior of a UBreakIterator.
UBreakIteratorType
The possible types of text boundaries.
U_CAPI UBool ubrk_isBoundary(UBreakIterator *bi, int32_t offset)
Returns true if the specified position is a boundary position.
Tag value for sentences ending with a sentence terminator ('.
U_CAPI void ubrk_refreshUText(UBreakIterator *bi, UText *text, UErrorCode *status)
Set the subject text string upon which the break iterator is operating without changing any other asp...
U_CAPI UBreakIterator * ubrk_clone(const UBreakIterator *bi, UErrorCode *status)
Thread safe cloning operation.
C API: Abstract Unicode Text API.
U_CAPI int32_t ubrk_following(UBreakIterator *bi, int32_t offset)
Advance the iterator to the first boundary following the specified offset.
Upper bound for tags for uncategorized words.
U_CAPI void ubrk_close(UBreakIterator *bi)
Close a UBreakIterator.
One more than the highest normal UBreakIteratorType value.
Tag value for words that appear to be numbers, upper limit.
#define U_DEFINE_LOCAL_OPEN_POINTER(LocalPointerClassName, Type, closeFunction)
"Smart pointer" definition macro, deletes objects via the closeFunction.
C++ API: "Smart pointers" for use with and in ICU4C C++ code.
U_CAPI void ubrk_setUText(UBreakIterator *bi, UText *text, UErrorCode *status)
Sets an existing iterator to point to a new piece of text.
Tag value for soft line breaks, positions at which a line break is acceptable but not required...
"Smart pointer" class, closes a UBreakIterator via ubrk_close().
Upper bound for tags for sentences ended by a separator.
U_CAPI int32_t ubrk_previous(UBreakIterator *bi)
Set the iterator position to the boundary preceding the current boundary.
U_CAPI const char * ubrk_getLocaleByType(const UBreakIterator *bi, ULocDataLocaleType type, UErrorCode *status)
Return the locale of the break iterator.
U_CAPI const char * ubrk_getAvailable(int32_t index)
Get a locale for which text breaking information is available.
U_CAPI UBreakIterator * ubrk_openRules(const UChar *rules, int32_t rulesLength, const UChar *text, int32_t textLength, UParseError *parseErr, UErrorCode *status)
Open a new UBreakIterator for locating text boundaries using specified breaking rules.
char16_t UChar
The base type for UTF-16 code units and pointers.
U_CAPI int32_t ubrk_first(UBreakIterator *bi)
Set the iterator position to zero, the start of the text being scanned.
C API: Parse Error Information.
U_CAPI int32_t ubrk_last(UBreakIterator *bi)
Set the iterator position to the index immediately beyond the last character in the text being scanne...
U_CAPI UBreakIterator * ubrk_open(UBreakIteratorType type, const char *locale, const UChar *text, int32_t textLength, UErrorCode *status)
Open a new UBreakIterator for locating text boundaries for a specified locale.
Tag value for "words" that do not fit into any of other categories.
UErrorCode
Standard ICU4C error code type, a substitute for exceptions.
ULocDataLocaleType
Constants for *_getLocale(). Allow the user to select whether she wants information on requested...
A UParseError struct is used to return detailed information about parsing errors.
Basic definitions for ICU, for both C and C++ APIs.
U_CAPI int32_t ubrk_countAvailable(void)
Determine how many locales have text breaking information available.
Tag value for words that contain letters, excluding hiragana, katakana or ideographic characters...
U_CAPI UBreakIterator * ubrk_openBinaryRules(const uint8_t *binaryRules, int32_t rulesLength, const UChar *text, int32_t textLength, UErrorCode *status)
Open a new UBreakIterator for locating text boundaries using precompiled binary rules.
Tag value for words that appear to be numbers, lower limit.
U_CAPI int32_t ubrk_next(UBreakIterator *bi)
Advance the iterator to the boundary following the current boundary.
Upper bound for soft line breaks.
Title Case breaks. The iterator created using this type locates title boundaries as described for Unic...
U_CAPI UBreakIterator * ubrk_safeClone(const UBreakIterator *bi, void *stackBuffer, int32_t *pBufferSize, UErrorCode *status)
Thread safe cloning operation.
Tag value for words containing ideographic characters, upper limit.
int8_t UBool
The ICU boolean type, a signed-byte integer.