2 ********************************************************************************
3 * Copyright (C) 1996-2013, International Business Machines
4 * Corporation and others. All Rights Reserved.
5 ********************************************************************************
8 #include "unicode/utypes.h"
10 #if !UCONFIG_NO_BREAK_ITERATION
12 #include "unicode/ubrk.h"
14 #include "unicode/brkiter.h"
15 #include "unicode/uloc.h"
16 #include "unicode/ustring.h"
17 #include "unicode/uchriter.h"
18 #include "unicode/rbbi.h"
24 //------------------------------------------------------------------------------
26 // ubrk_open Create a canned type of break iterator based on type (word, line, etc.)
29 //------------------------------------------------------------------------------
30 U_CAPI UBreakIterator* U_EXPORT2
31 ubrk_open(UBreakIteratorType type,
38 if(U_FAILURE(*status)) return 0;
40 BreakIterator *result = 0;
45 result = BreakIterator::createCharacterInstance(Locale(locale), *status);
49 result = BreakIterator::createWordInstance(Locale(locale), *status);
53 result = BreakIterator::createLineInstance(Locale(locale), *status);
57 result = BreakIterator::createSentenceInstance(Locale(locale), *status);
61 result = BreakIterator::createTitleInstance(Locale(locale), *status);
65 *status = U_ILLEGAL_ARGUMENT_ERROR;
68 // check for allocation error
69 if (U_FAILURE(*status)) {
73 *status = U_MEMORY_ALLOCATION_ERROR;
78 UBreakIterator *uBI = (UBreakIterator *)result;
80 ubrk_setText(uBI, text, textLength, status);
87 //------------------------------------------------------------------------------
89 // ubrk_openRules open a break iterator from a set of break rules.
90 // Invokes the rule builder.
92 //------------------------------------------------------------------------------
93 U_CAPI UBreakIterator* U_EXPORT2
94 ubrk_openRules( const UChar *rules,
98 UParseError *parseErr,
101 if (status == NULL || U_FAILURE(*status)){
105 BreakIterator *result = 0;
106 UnicodeString ruleString(rules, rulesLength);
107 result = RBBIRuleBuilder::createRuleBasedBreakIterator(ruleString, parseErr, *status);
108 if(U_FAILURE(*status)) {
112 UBreakIterator *uBI = (UBreakIterator *)result;
114 ubrk_setText(uBI, text, textLength, status);
123 U_CAPI UBreakIterator * U_EXPORT2
125 const UBreakIterator *bi,
126 void * /*stackBuffer*/,
127 int32_t *pBufferSize,
130 if (status == NULL || U_FAILURE(*status)){
134 *status = U_ILLEGAL_ARGUMENT_ERROR;
137 if (pBufferSize != NULL) {
138 int32_t inputSize = *pBufferSize;
140 if (inputSize == 0) {
141 return NULL; // preflighting for deprecated functionality
144 BreakIterator *newBI = ((BreakIterator *)bi)->clone();
146 *status = U_MEMORY_ALLOCATION_ERROR;
148 *status = U_SAFECLONE_ALLOCATED_WARNING;
150 return (UBreakIterator *)newBI;
155 U_CAPI void U_EXPORT2
156 ubrk_close(UBreakIterator *bi)
158 delete (BreakIterator *)bi;
161 U_CAPI void U_EXPORT2
162 ubrk_setText(UBreakIterator* bi,
167 BreakIterator *brit = (BreakIterator *)bi;
168 UText ut = UTEXT_INITIALIZER;
169 utext_openUChars(&ut, text, textLength, status);
170 brit->setText(&ut, *status);
171 // A stack allocated UText wrapping a UChar * string
172 // can be dumped without explicitly closing it.
177 U_CAPI void U_EXPORT2
178 ubrk_setUText(UBreakIterator *bi,
182 RuleBasedBreakIterator *brit = (RuleBasedBreakIterator *)bi;
183 brit->RuleBasedBreakIterator::setText(text, *status);
190 U_CAPI int32_t U_EXPORT2
191 ubrk_current(const UBreakIterator *bi)
194 return ((RuleBasedBreakIterator*)bi)->RuleBasedBreakIterator::current();
197 U_CAPI int32_t U_EXPORT2
198 ubrk_next(UBreakIterator *bi)
201 return ((RuleBasedBreakIterator*)bi)->RuleBasedBreakIterator::next();
204 U_CAPI int32_t U_EXPORT2
205 ubrk_previous(UBreakIterator *bi)
208 return ((RuleBasedBreakIterator*)bi)->RuleBasedBreakIterator::previous();
211 U_CAPI int32_t U_EXPORT2
212 ubrk_first(UBreakIterator *bi)
215 return ((RuleBasedBreakIterator*)bi)->RuleBasedBreakIterator::first();
218 U_CAPI int32_t U_EXPORT2
219 ubrk_last(UBreakIterator *bi)
222 return ((RuleBasedBreakIterator*)bi)->RuleBasedBreakIterator::last();
225 U_CAPI int32_t U_EXPORT2
226 ubrk_preceding(UBreakIterator *bi,
230 return ((RuleBasedBreakIterator*)bi)->RuleBasedBreakIterator::preceding(offset);
233 U_CAPI int32_t U_EXPORT2
234 ubrk_following(UBreakIterator *bi,
238 return ((RuleBasedBreakIterator*)bi)->RuleBasedBreakIterator::following(offset);
241 U_CAPI const char* U_EXPORT2
242 ubrk_getAvailable(int32_t index)
245 return uloc_getAvailable(index);
248 U_CAPI int32_t U_EXPORT2
249 ubrk_countAvailable()
252 return uloc_countAvailable();
256 U_CAPI UBool U_EXPORT2
257 ubrk_isBoundary(UBreakIterator *bi, int32_t offset)
259 return ((RuleBasedBreakIterator *)bi)->RuleBasedBreakIterator::isBoundary(offset);
263 U_CAPI int32_t U_EXPORT2
264 ubrk_getRuleStatus(UBreakIterator *bi)
266 return ((RuleBasedBreakIterator *)bi)->RuleBasedBreakIterator::getRuleStatus();
269 U_CAPI int32_t U_EXPORT2
270 ubrk_getRuleStatusVec(UBreakIterator *bi, int32_t *fillInVec, int32_t capacity, UErrorCode *status)
272 return ((RuleBasedBreakIterator *)bi)->RuleBasedBreakIterator::getRuleStatusVec(fillInVec, capacity, *status);
276 U_CAPI const char* U_EXPORT2
277 ubrk_getLocaleByType(const UBreakIterator *bi,
278 ULocDataLocaleType type,
282 if (U_SUCCESS(*status)) {
283 *status = U_ILLEGAL_ARGUMENT_ERROR;
287 return ((BreakIterator*)bi)->getLocaleID(type, *status);
291 void ubrk_refreshUText(UBreakIterator *bi,
295 BreakIterator *bii = reinterpret_cast<BreakIterator *>(bi);
296 bii->refreshInputText(text, *status);
301 #endif /* #if !UCONFIG_NO_BREAK_ITERATION */