1 /*
2 *******************************************************************************
3 *
4 *   Copyright (C) 2016 and later: Unicode, Inc. and others.
5 *   License & terms of use: http://www.unicode.org/copyright.html#License
6 *
7 *******************************************************************************
8 *******************************************************************************
9 *
10 *   Copyright (C) 2002-2003, International Business Machines
11 *   Corporation and others.  All Rights Reserved.
12 *
13 *******************************************************************************
14 */
15 
16 #include <stdio.h>
17 #include <unicode/brkiter.h>
18 #include <stdlib.h>
19 
20 U_CFUNC int c_main(void);
21 
22 
printUnicodeString(const UnicodeString & s)23 void printUnicodeString(const UnicodeString &s) {
24     char charBuf[1000];
25     s.extract(0, s.length(), charBuf, sizeof(charBuf)-1, 0);
26     charBuf[sizeof(charBuf)-1] = 0;
27     printf("%s", charBuf);
28 }
29 
30 
printTextRange(BreakIterator & iterator,int32_t start,int32_t end)31 void printTextRange( BreakIterator& iterator,
32                     int32_t start, int32_t end )
33 {
34     CharacterIterator *strIter = iterator.getText().clone();
35     UnicodeString  s;
36     strIter->getText(s);
37 
38     printf(" %ld %ld\t", (long)start, (long)end);
39     printUnicodeString(UnicodeString(s, 0, start));
40     printf("|");
41     printUnicodeString(UnicodeString(s, start, end-start));
42     printf("|");
43     printUnicodeString(UnicodeString(s, end));
44     puts("");
45     delete strIter;
46 }
47 
48 
49 /* Print each element in order: */
printEachForward(BreakIterator & boundary)50 void printEachForward( BreakIterator& boundary)
51 {
52     int32_t start = boundary.first();
53     for (int32_t end = boundary.next();
54          end != BreakIterator::DONE;
55          start = end, end = boundary.next())
56     {
57         printTextRange( boundary, start, end );
58     }
59 }
60 
61 /* Print each element in reverse order: */
printEachBackward(BreakIterator & boundary)62 void printEachBackward( BreakIterator& boundary)
63 {
64     int32_t end = boundary.last();
65     for (int32_t start = boundary.previous();
66          start != BreakIterator::DONE;
67          end = start, start = boundary.previous())
68     {
69         printTextRange( boundary, start, end );
70     }
71 }
72 
73 /* Print the first element */
printFirst(BreakIterator & boundary)74 void printFirst(BreakIterator& boundary)
75 {
76     int32_t start = boundary.first();
77     int32_t end = boundary.next();
78     printTextRange( boundary, start, end );
79 }
80 
81 /* Print the last element */
printLast(BreakIterator & boundary)82 void printLast(BreakIterator& boundary)
83 {
84     int32_t end = boundary.last();
85     int32_t start = boundary.previous();
86     printTextRange( boundary, start, end );
87 }
88 
89 /* Print the element at a specified position */
printAt(BreakIterator & boundary,int32_t pos)90 void printAt(BreakIterator &boundary, int32_t pos )
91 {
92     int32_t end = boundary.following(pos);
93     int32_t start = boundary.previous();
94     printTextRange( boundary, start, end );
95 }
96 
97 /* Creating and using text boundaries */
main(void)98 int main( void )
99 {
100     puts("ICU Break Iterator Sample Program\n");
101     puts("C++ Break Iteration\n");
102     BreakIterator* boundary;
103     UnicodeString stringToExamine("Aaa bbb ccc. Ddd eee fff.");
104     printf("Examining: ");
105     printUnicodeString(stringToExamine);
106     puts("");
107 
108     //print each sentence in forward and reverse order
109     UErrorCode status = U_ZERO_ERROR;
110     boundary = BreakIterator::createSentenceInstance(
111         Locale::getUS(), status );
112     if (U_FAILURE(status)) {
113         printf("failed to create sentence break iterator.  status = %s",
114             u_errorName(status));
115         exit(1);
116     }
117 
118     boundary->setText(stringToExamine);
119     puts("\n Sentence Boundaries... ");
120     puts("----- forward: -----------");
121     printEachForward(*boundary);
122     puts("----- backward: ----------");
123     printEachBackward(*boundary);
124     delete boundary;
125 
126     //print each word in order
127     printf("\n Word Boundaries... \n");
128     boundary = BreakIterator::createWordInstance(
129         Locale::getUS(), status);
130     boundary->setText(stringToExamine);
131     puts("----- forward: -----------");
132     printEachForward(*boundary);
133     //print first element
134     puts("----- first: -------------");
135     printFirst(*boundary);
136     //print last element
137     puts("----- last: --------------");
138     printLast(*boundary);
139     //print word at charpos 10
140     puts("----- at pos 10: ---------");
141     printAt(*boundary, 10 );
142 
143     delete boundary;
144 
145     puts("\nEnd C++ Break Iteration");
146 
147     // Call the C version
148     return c_main();
149 }
150