1 // Copyright (C) 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /*
4 **********************************************************************
5 *   Copyright (C) 2000-2004, International Business Machines
6 *   Corporation and others.  All Rights Reserved.
7 **********************************************************************
8  *  ucnv_cb.h:
9  *  External APIs for the ICU's codeset conversion library
10  *  Helena Shih
11  *
12  * Modification History:
13  *
14  *   Date        Name        Description
15  */
16 
17 /**
18  * \file
19  * \brief C UConverter functions to aid the writers of callbacks
20  *
21  * <h2> Callback API for UConverter </h2>
22  *
23  * These functions are provided here for the convenience of the callback
24  * writer. If you are just looking for callback functions to use, please
25  * see ucnv_err.h.  DO NOT call these functions directly when you are
26  * working with converters, unless your code has been called as a callback
27  * via ucnv_setFromUCallback or ucnv_setToUCallback !!
28  *
29  * A note about error codes and overflow.  Unlike other ICU functions,
30  * these functions do not expect the error status to be U_ZERO_ERROR.
31  * Callbacks must be much more careful about their error codes.
32  * The error codes used here are in/out parameters, which should be passed
33  * back in the callback's error parameter.
34  *
35  * For example, if you call ucnv_cbFromUWriteBytes to write data out
36  * to the output codepage, it may set the error status to U_BUFFER_OVERFLOW_ERROR
37  * if the data did not fit in the target. But this isn't a failing error;
38  * in fact, ucnv_cbFromUWriteBytes may be called AGAIN with the error
39  * status still U_BUFFER_OVERFLOW_ERROR to attempt to write further bytes,
40  * which will also go into the internal overflow buffers.
41  *
42  * Concerning offsets, the 'offset' parameters here are relative to the start
43  * of SOURCE.  For example, suppose the string "ABCD" was being converted
44  * from Unicode into a codepage which doesn't have a mapping for 'B'.
45  * 'A' will be written out correctly, but
46  * the FromU callback will be called on an unassigned character for 'B'.
47  * At this point, this is the state of the world:
48  *    Target:    A [..]     [points after A]
49  *    Source:  A B [C] D    [points to C - B has been consumed]
50  *             0 1  2  3
51  *    codePoint = "B"       [the unassigned codepoint]
52  *
53  * Now, suppose a callback wants to write the substitution character '?' to
54  * the target. It calls ucnv_cbFromUWriteBytes() to write the '?'.
55  * It should pass ZERO as the offset, because the offset as far as the
56  * callback is concerned is relative to the SOURCE pointer [which points
57  * before 'C'].  If the callback goes into the args and consumes 'C' also,
58  * it would call ucnv_cbFromUWriteBytes() with an offset of 1 (and advance
59  * the source pointer).
60  *
61  */
62 
63 #ifndef UCNV_CB_H
64 #define UCNV_CB_H
65 
66 #include "unicode/utypes.h"
67 
68 #if !UCONFIG_NO_CONVERSION
69 
70 #include "unicode/ucnv.h"
71 #include "unicode/ucnv_err.h"
72 
73 /**
74  * ONLY used by FromU callback functions.
75  * Writes the specified bytes to the target byte buffer or to the converter's internal buffers.
76  *
77  * @param args callback fromUnicode arguments
78  * @param source source bytes to write
79  * @param length number of bytes to write
80  * @param offsetIndex the relative offset index from callback (see the note on offsets in the file overview).
81  * @param err in/out error status. If <TT>U_BUFFER_OVERFLOW_ERROR</TT> is set, then U_BUFFER_OVERFLOW_ERROR <STRONG>must</STRONG>
82  * be returned to the user, because it means that not all data could be written into the target buffer, and some is
83  * in the converter error buffer.
84  * @see ucnv_cbFromUWriteSub
85  * @stable ICU 2.0
86  */
87 U_STABLE void U_EXPORT2
88 ucnv_cbFromUWriteBytes (UConverterFromUnicodeArgs *args,
89                         const char* source,
90                         int32_t length,
91                         int32_t offsetIndex,
92                         UErrorCode * err);
93 
94 /**
95  * ONLY used by FromU callback functions.
96  * This function will write out the correct substitution character sequence
97  * to the target.
98  *
99  * @param args callback fromUnicode arguments
100  * @param offsetIndex the relative offset index from the current source pointer to be used
101  * @param err in/out error status. If <TT>U_BUFFER_OVERFLOW_ERROR</TT> is set, then U_BUFFER_OVERFLOW_ERROR <STRONG>must</STRONG>
102  * be returned to the user, because it means that not all data could be written into the target buffer, and some is
103  * in the converter error buffer.
104  * @see ucnv_cbFromUWriteBytes
105  * @stable ICU 2.0
106  */
107 U_STABLE void U_EXPORT2
108 ucnv_cbFromUWriteSub (UConverterFromUnicodeArgs *args,
109                       int32_t offsetIndex,
110                       UErrorCode * err);
111 
112 /**
113  * ONLY used by FromU callback functions.
114  * This function will write out the error character(s) to the target (NOTE(review): previously "target UChar buffer"; a FromU target is presumably the byte buffer - confirm).
115  *
116  * @param args callback fromUnicode arguments
117  * @param source pointer to pointer to first UChar to write [on exit: 1 after last UChar processed]
118  * @param sourceLimit pointer after last UChar to write
119  * @param offsetIndex the relative offset index from callback which will be set
120  * @param err in/out error status <TT>U_BUFFER_OVERFLOW_ERROR</TT>
121  * @see ucnv_cbFromUWriteSub
122  * @stable ICU 2.0
123  */
124 U_STABLE void U_EXPORT2 ucnv_cbFromUWriteUChars(UConverterFromUnicodeArgs *args,
125                              const UChar** source,
126                              const UChar*  sourceLimit,
127                              int32_t offsetIndex,
128                              UErrorCode * err);
129 
130 /**
131  * ONLY used by ToU callback functions.
132  * This function will write out the specified characters to the target
133  * UChar buffer.
134  *
135  * @param args callback toUnicode arguments
136  * @param source source string to write
137  * @param length the length of source string
138  * @param offsetIndex the relative offset index which will be written.
139  * @param err in/out error status <TT>U_BUFFER_OVERFLOW_ERROR</TT>
140  * @see ucnv_cbToUWriteSub
141  * @stable ICU 2.0
142  */
143 U_STABLE void U_EXPORT2 ucnv_cbToUWriteUChars (UConverterToUnicodeArgs *args,
144                                              const UChar* source,
145                                              int32_t length,
146                                              int32_t offsetIndex,
147                                              UErrorCode * err);
148 
149 /**
150  * ONLY used by ToU callback functions.
151  * This function will write out the Unicode substitution character (U+FFFD).
152  *
153  * @param args callback toUnicode arguments
154  * @param offsetIndex the relative offset index from callback.
155  * @param err in/out error status <TT>U_BUFFER_OVERFLOW_ERROR</TT>
156  * @see ucnv_cbToUWriteUChars
157  * @stable ICU 2.0
158  */
159 U_STABLE void U_EXPORT2 ucnv_cbToUWriteSub (UConverterToUnicodeArgs *args,
160                        int32_t offsetIndex,
161                        UErrorCode * err);
162 #endif
163 
164 #endif
165