1 /*
2 *******************************************************************************
3 *
4 *   Copyright (C) 1999-2012, International Business Machines
5 *   Corporation and others.  All Rights Reserved.
6 *
7 *******************************************************************************
8 *   file name:  umsg.cpp
9 *   encoding:   US-ASCII
10 *   tab size:   8 (not used)
11 *   indentation:4
12 *
13 * This is a C wrapper to MessageFormat C++ API.
14 *
15 *   Change history:
16 *
*   08/5/2001  Ram         Added C wrappers for the C++ API. Changed implementation of old APIs.
*                          Removed pattern parser.
19 *
20 */
21 
22 #include "unicode/utypes.h"
23 
24 #if !UCONFIG_NO_FORMATTING
25 
26 #include "unicode/umsg.h"
27 #include "unicode/ustring.h"
28 #include "unicode/fmtable.h"
29 #include "unicode/msgfmt.h"
30 #include "unicode/unistr.h"
31 #include "cpputils.h"
32 #include "uassert.h"
33 #include "ustr_imp.h"
34 
35 U_NAMESPACE_BEGIN
36 /**
37  * This class isolates our access to private internal methods of
38  * MessageFormat.  It is never instantiated; it exists only for C++
39  * access management.
40  */
41 class MessageFormatAdapter {
42 public:
43     static const Formattable::Type* getArgTypeList(const MessageFormat& m,
44                                                    int32_t& count);
hasArgTypeConflicts(const MessageFormat & m)45     static UBool hasArgTypeConflicts(const MessageFormat& m) {
46         return m.hasArgTypeConflicts;
47     }
48 };
49 const Formattable::Type*
getArgTypeList(const MessageFormat & m,int32_t & count)50 MessageFormatAdapter::getArgTypeList(const MessageFormat& m,
51                                      int32_t& count) {
52     return m.getArgTypeList(count);
53 }
54 U_NAMESPACE_END
55 
56 U_NAMESPACE_USE
57 
58 U_CAPI int32_t
u_formatMessage(const char * locale,const UChar * pattern,int32_t patternLength,UChar * result,int32_t resultLength,UErrorCode * status,...)59 u_formatMessage(const char  *locale,
60                 const UChar *pattern,
61                 int32_t     patternLength,
62                 UChar       *result,
63                 int32_t     resultLength,
64                 UErrorCode  *status,
65                 ...)
66 {
67     va_list    ap;
68     int32_t actLen;
69     //argument checking defered to subsequent method calls
70     // start vararg processing
71     va_start(ap, status);
72 
73     actLen = u_vformatMessage(locale,pattern,patternLength,result,resultLength,ap,status);
74     // end vararg processing
75     va_end(ap);
76 
77     return actLen;
78 }
79 
80 U_CAPI int32_t U_EXPORT2
u_vformatMessage(const char * locale,const UChar * pattern,int32_t patternLength,UChar * result,int32_t resultLength,va_list ap,UErrorCode * status)81 u_vformatMessage(   const char  *locale,
82                     const UChar *pattern,
83                     int32_t     patternLength,
84                     UChar       *result,
85                     int32_t     resultLength,
86                     va_list     ap,
87                     UErrorCode  *status)
88 
89 {
90     //argument checking defered to subsequent method calls
91     UMessageFormat *fmt = umsg_open(pattern,patternLength,locale,NULL,status);
92     int32_t retVal = umsg_vformat(fmt,result,resultLength,ap,status);
93     umsg_close(fmt);
94     return retVal;
95 }
96 
97 U_CAPI int32_t
u_formatMessageWithError(const char * locale,const UChar * pattern,int32_t patternLength,UChar * result,int32_t resultLength,UParseError * parseError,UErrorCode * status,...)98 u_formatMessageWithError(const char *locale,
99                         const UChar *pattern,
100                         int32_t     patternLength,
101                         UChar       *result,
102                         int32_t     resultLength,
103                         UParseError *parseError,
104                         UErrorCode  *status,
105                         ...)
106 {
107     va_list    ap;
108     int32_t actLen;
109     //argument checking defered to subsequent method calls
110     // start vararg processing
111     va_start(ap, status);
112 
113     actLen = u_vformatMessageWithError(locale,pattern,patternLength,result,resultLength,parseError,ap,status);
114 
115     // end vararg processing
116     va_end(ap);
117     return actLen;
118 }
119 
120 U_CAPI int32_t U_EXPORT2
u_vformatMessageWithError(const char * locale,const UChar * pattern,int32_t patternLength,UChar * result,int32_t resultLength,UParseError * parseError,va_list ap,UErrorCode * status)121 u_vformatMessageWithError(  const char  *locale,
122                             const UChar *pattern,
123                             int32_t     patternLength,
124                             UChar       *result,
125                             int32_t     resultLength,
126                             UParseError *parseError,
127                             va_list     ap,
128                             UErrorCode  *status)
129 
130 {
131     //argument checking defered to subsequent method calls
132     UMessageFormat *fmt = umsg_open(pattern,patternLength,locale,parseError,status);
133     int32_t retVal = umsg_vformat(fmt,result,resultLength,ap,status);
134     umsg_close(fmt);
135     return retVal;
136 }
137 
138 
139 // For parse, do the reverse of format:
140 //  1. Call through to the C++ APIs
141 //  2. Just assume the user passed in enough arguments.
142 //  3. Iterate through each formattable returned, and assign to the arguments
143 U_CAPI void
u_parseMessage(const char * locale,const UChar * pattern,int32_t patternLength,const UChar * source,int32_t sourceLength,UErrorCode * status,...)144 u_parseMessage( const char   *locale,
145                 const UChar  *pattern,
146                 int32_t      patternLength,
147                 const UChar  *source,
148                 int32_t      sourceLength,
149                 UErrorCode   *status,
150                 ...)
151 {
152     va_list    ap;
153     //argument checking defered to subsequent method calls
154 
155     // start vararg processing
156     va_start(ap, status);
157 
158     u_vparseMessage(locale,pattern,patternLength,source,sourceLength,ap,status);
159     // end vararg processing
160     va_end(ap);
161 }
162 
163 U_CAPI void U_EXPORT2
u_vparseMessage(const char * locale,const UChar * pattern,int32_t patternLength,const UChar * source,int32_t sourceLength,va_list ap,UErrorCode * status)164 u_vparseMessage(const char  *locale,
165                 const UChar *pattern,
166                 int32_t     patternLength,
167                 const UChar *source,
168                 int32_t     sourceLength,
169                 va_list     ap,
170                 UErrorCode  *status)
171 {
172     //argument checking defered to subsequent method calls
173     UMessageFormat *fmt = umsg_open(pattern,patternLength,locale,NULL,status);
174     int32_t count = 0;
175     umsg_vparse(fmt,source,sourceLength,&count,ap,status);
176     umsg_close(fmt);
177 }
178 
179 U_CAPI void
u_parseMessageWithError(const char * locale,const UChar * pattern,int32_t patternLength,const UChar * source,int32_t sourceLength,UParseError * error,UErrorCode * status,...)180 u_parseMessageWithError(const char  *locale,
181                         const UChar *pattern,
182                         int32_t     patternLength,
183                         const UChar *source,
184                         int32_t     sourceLength,
185                         UParseError *error,
186                         UErrorCode  *status,
187                         ...)
188 {
189     va_list    ap;
190 
191     //argument checking defered to subsequent method calls
192 
193     // start vararg processing
194     va_start(ap, status);
195 
196     u_vparseMessageWithError(locale,pattern,patternLength,source,sourceLength,ap,error,status);
197     // end vararg processing
198     va_end(ap);
199 }
200 U_CAPI void U_EXPORT2
u_vparseMessageWithError(const char * locale,const UChar * pattern,int32_t patternLength,const UChar * source,int32_t sourceLength,va_list ap,UParseError * error,UErrorCode * status)201 u_vparseMessageWithError(const char  *locale,
202                          const UChar *pattern,
203                          int32_t     patternLength,
204                          const UChar *source,
205                          int32_t     sourceLength,
206                          va_list     ap,
207                          UParseError *error,
208                          UErrorCode* status)
209 {
210     //argument checking defered to subsequent method calls
211     UMessageFormat *fmt = umsg_open(pattern,patternLength,locale,error,status);
212     int32_t count = 0;
213     umsg_vparse(fmt,source,sourceLength,&count,ap,status);
214     umsg_close(fmt);
215 }
216 //////////////////////////////////////////////////////////////////////////////////
217 //
218 //  Message format C API
219 //
220 /////////////////////////////////////////////////////////////////////////////////
221 
222 
223 U_CAPI UMessageFormat* U_EXPORT2
umsg_open(const UChar * pattern,int32_t patternLength,const char * locale,UParseError * parseError,UErrorCode * status)224 umsg_open(  const UChar     *pattern,
225             int32_t         patternLength,
226             const  char     *locale,
227             UParseError     *parseError,
228             UErrorCode      *status)
229 {
230     //check arguments
231     if(status==NULL || U_FAILURE(*status))
232     {
233       return 0;
234     }
235     if(pattern==NULL||patternLength<-1){
236         *status=U_ILLEGAL_ARGUMENT_ERROR;
237         return 0;
238     }
239 
240     UParseError tErr;
241     if(parseError==NULL)
242     {
243         parseError = &tErr;
244     }
245 
246     int32_t len = (patternLength == -1 ? u_strlen(pattern) : patternLength);
247     UnicodeString patString(patternLength == -1, pattern, len);
248 
249     MessageFormat* retVal = new MessageFormat(patString,Locale(locale),*parseError,*status);
250     if(retVal == NULL) {
251         *status = U_MEMORY_ALLOCATION_ERROR;
252         return NULL;
253     }
254     if (U_SUCCESS(*status) && MessageFormatAdapter::hasArgTypeConflicts(*retVal)) {
255         *status = U_ARGUMENT_TYPE_MISMATCH;
256     }
257     return (UMessageFormat*)retVal;
258 }
259 
260 U_CAPI void U_EXPORT2
umsg_close(UMessageFormat * format)261 umsg_close(UMessageFormat* format)
262 {
263     //check arguments
264     if(format==NULL){
265         return;
266     }
267     delete (MessageFormat*) format;
268 }
269 
270 U_CAPI UMessageFormat U_EXPORT2
umsg_clone(const UMessageFormat * fmt,UErrorCode * status)271 umsg_clone(const UMessageFormat *fmt,
272            UErrorCode *status)
273 {
274     //check arguments
275     if(status==NULL || U_FAILURE(*status)){
276         return NULL;
277     }
278     if(fmt==NULL){
279         *status = U_ILLEGAL_ARGUMENT_ERROR;
280         return NULL;
281     }
282     UMessageFormat retVal = (UMessageFormat)((MessageFormat*)fmt)->clone();
283     if(retVal == 0) {
284         *status = U_MEMORY_ALLOCATION_ERROR;
285         return 0;
286     }
287     return retVal;
288 }
289 
290 U_CAPI void  U_EXPORT2
umsg_setLocale(UMessageFormat * fmt,const char * locale)291 umsg_setLocale(UMessageFormat *fmt, const char* locale)
292 {
293     //check arguments
294     if(fmt==NULL){
295         return;
296     }
297     ((MessageFormat*)fmt)->setLocale(Locale(locale));
298 }
299 
300 U_CAPI const char*  U_EXPORT2
umsg_getLocale(const UMessageFormat * fmt)301 umsg_getLocale(const UMessageFormat *fmt)
302 {
303     //check arguments
304     if(fmt==NULL){
305         return "";
306     }
307     return ((const MessageFormat*)fmt)->getLocale().getName();
308 }
309 
310 U_CAPI void  U_EXPORT2
umsg_applyPattern(UMessageFormat * fmt,const UChar * pattern,int32_t patternLength,UParseError * parseError,UErrorCode * status)311 umsg_applyPattern(UMessageFormat *fmt,
312                            const UChar* pattern,
313                            int32_t patternLength,
314                            UParseError* parseError,
315                            UErrorCode* status)
316 {
317     //check arguments
318     UParseError tErr;
319     if(status ==NULL||U_FAILURE(*status)){
320         return ;
321     }
322     if(fmt==NULL||pattern==NULL||patternLength<-1){
323         *status=U_ILLEGAL_ARGUMENT_ERROR;
324         return ;
325     }
326 
327     if(parseError==NULL){
328       parseError = &tErr;
329     }
330     if(patternLength<-1){
331         patternLength=u_strlen(pattern);
332     }
333 
334     ((MessageFormat*)fmt)->applyPattern(UnicodeString(pattern,patternLength),*parseError,*status);
335 }
336 
337 U_CAPI int32_t  U_EXPORT2
umsg_toPattern(const UMessageFormat * fmt,UChar * result,int32_t resultLength,UErrorCode * status)338 umsg_toPattern(const UMessageFormat *fmt,
339                UChar* result,
340                int32_t resultLength,
341                UErrorCode* status)
342 {
343     //check arguments
344     if(status ==NULL||U_FAILURE(*status)){
345         return -1;
346     }
347     if(fmt==NULL||resultLength<0 || (resultLength>0 && result==0)){
348         *status=U_ILLEGAL_ARGUMENT_ERROR;
349         return -1;
350     }
351 
352 
353     UnicodeString res;
354     if(!(result==NULL && resultLength==0)) {
355         // NULL destination for pure preflighting: empty dummy string
356         // otherwise, alias the destination buffer
357         res.setTo(result, 0, resultLength);
358     }
359     ((const MessageFormat*)fmt)->toPattern(res);
360     return res.extract(result, resultLength, *status);
361 }
362 
363 U_CAPI int32_t
umsg_format(const UMessageFormat * fmt,UChar * result,int32_t resultLength,UErrorCode * status,...)364 umsg_format(    const UMessageFormat *fmt,
365                 UChar          *result,
366                 int32_t        resultLength,
367                 UErrorCode     *status,
368                 ...)
369 {
370     va_list    ap;
371     int32_t actLen;
372     //argument checking defered to last method call umsg_vformat which
373     //saves time when arguments are valid and we dont care when arguments are not
374     //since we return an error anyway
375 
376 
377     // start vararg processing
378     va_start(ap, status);
379 
380     actLen = umsg_vformat(fmt,result,resultLength,ap,status);
381 
382     // end vararg processing
383     va_end(ap);
384 
385     return actLen;
386 }
387 
388 U_CAPI int32_t U_EXPORT2
umsg_vformat(const UMessageFormat * fmt,UChar * result,int32_t resultLength,va_list ap,UErrorCode * status)389 umsg_vformat(   const UMessageFormat *fmt,
390                 UChar          *result,
391                 int32_t        resultLength,
392                 va_list        ap,
393                 UErrorCode     *status)
394 {
395     //check arguments
396     if(status==0 || U_FAILURE(*status))
397     {
398         return -1;
399     }
400     if(fmt==NULL||resultLength<0 || (resultLength>0 && result==0)) {
401         *status=U_ILLEGAL_ARGUMENT_ERROR;
402         return -1;
403     }
404 
405     int32_t count =0;
406     const Formattable::Type* argTypes =
407         MessageFormatAdapter::getArgTypeList(*(const MessageFormat*)fmt, count);
408     // Allocate at least one element.  Allocating an array of length
409     // zero causes problems on some platforms (e.g. Win32).
410     Formattable* args = new Formattable[count ? count : 1];
411 
412     // iterate through the vararg list, and get the arguments out
413     for(int32_t i = 0; i < count; ++i) {
414 
415         UChar *stringVal;
416         double tDouble=0;
417         int32_t tInt =0;
418         int64_t tInt64 = 0;
419         UDate tempDate = 0;
420         switch(argTypes[i]) {
421         case Formattable::kDate:
422             tempDate = va_arg(ap, UDate);
423             args[i].setDate(tempDate);
424             break;
425 
426         case Formattable::kDouble:
427             tDouble =va_arg(ap, double);
428             args[i].setDouble(tDouble);
429             break;
430 
431         case Formattable::kLong:
432             tInt = va_arg(ap, int32_t);
433             args[i].setLong(tInt);
434             break;
435 
436         case Formattable::kInt64:
437             tInt64 = va_arg(ap, int64_t);
438             args[i].setInt64(tInt64);
439             break;
440 
441         case Formattable::kString:
442             // For some reason, a temporary is needed
443             stringVal = va_arg(ap, UChar*);
444             if(stringVal){
445                 args[i].setString(UnicodeString(stringVal));
446             }else{
447                 *status=U_ILLEGAL_ARGUMENT_ERROR;
448             }
449             break;
450 
451         case Formattable::kArray:
452             // throw away this argument
453             // this is highly platform-dependent, and probably won't work
454             // so, if you try to skip arguments in the list (and not use them)
455             // you'll probably crash
456             va_arg(ap, int);
457             break;
458 
459         case Formattable::kObject:
460             // Unused argument number. Read and ignore a pointer argument.
461             va_arg(ap, void*);
462             break;
463 
464         default:
465             // Unknown/unsupported argument type.
466             U_ASSERT(FALSE);
467             *status=U_ILLEGAL_ARGUMENT_ERROR;
468             break;
469         }
470     }
471     UnicodeString resultStr;
472     FieldPosition fieldPosition(0);
473 
474     /* format the message */
475     ((const MessageFormat*)fmt)->format(args,count,resultStr,fieldPosition,*status);
476 
477     delete[] args;
478 
479     if(U_FAILURE(*status)){
480         return -1;
481     }
482 
483     return resultStr.extract(result, resultLength, *status);
484 }
485 
486 U_CAPI void
umsg_parse(const UMessageFormat * fmt,const UChar * source,int32_t sourceLength,int32_t * count,UErrorCode * status,...)487 umsg_parse( const UMessageFormat *fmt,
488             const UChar    *source,
489             int32_t        sourceLength,
490             int32_t        *count,
491             UErrorCode     *status,
492             ...)
493 {
494     va_list    ap;
495     //argument checking defered to last method call umsg_vparse which
496     //saves time when arguments are valid and we dont care when arguments are not
497     //since we return an error anyway
498 
499     // start vararg processing
500     va_start(ap, status);
501 
502     umsg_vparse(fmt,source,sourceLength,count,ap,status);
503 
504     // end vararg processing
505     va_end(ap);
506 }
507 
508 U_CAPI void U_EXPORT2
umsg_vparse(const UMessageFormat * fmt,const UChar * source,int32_t sourceLength,int32_t * count,va_list ap,UErrorCode * status)509 umsg_vparse(const UMessageFormat *fmt,
510             const UChar    *source,
511             int32_t        sourceLength,
512             int32_t        *count,
513             va_list        ap,
514             UErrorCode     *status)
515 {
516     //check arguments
517     if(status==NULL||U_FAILURE(*status))
518     {
519         return;
520     }
521     if(fmt==NULL||source==NULL || sourceLength<-1 || count==NULL){
522         *status=U_ILLEGAL_ARGUMENT_ERROR;
523         return;
524     }
525     if(sourceLength==-1){
526         sourceLength=u_strlen(source);
527     }
528 
529     UnicodeString srcString(source,sourceLength);
530     Formattable *args = ((const MessageFormat*)fmt)->parse(srcString,*count,*status);
531     UDate *aDate;
532     double *aDouble;
533     UChar *aString;
534     int32_t* aInt;
535     int64_t* aInt64;
536     UnicodeString temp;
537     int len =0;
538     // assign formattables to varargs
539     for(int32_t i = 0; i < *count; i++) {
540         switch(args[i].getType()) {
541 
542         case Formattable::kDate:
543             aDate = va_arg(ap, UDate*);
544             if(aDate){
545                 *aDate = args[i].getDate();
546             }else{
547                 *status=U_ILLEGAL_ARGUMENT_ERROR;
548             }
549             break;
550 
551         case Formattable::kDouble:
552             aDouble = va_arg(ap, double*);
553             if(aDouble){
554                 *aDouble = args[i].getDouble();
555             }else{
556                 *status=U_ILLEGAL_ARGUMENT_ERROR;
557             }
558             break;
559 
560         case Formattable::kLong:
561             aInt = va_arg(ap, int32_t*);
562             if(aInt){
563                 *aInt = (int32_t) args[i].getLong();
564             }else{
565                 *status=U_ILLEGAL_ARGUMENT_ERROR;
566             }
567             break;
568 
569         case Formattable::kInt64:
570             aInt64 = va_arg(ap, int64_t*);
571             if(aInt64){
572                 *aInt64 = args[i].getInt64();
573             }else{
574                 *status=U_ILLEGAL_ARGUMENT_ERROR;
575             }
576             break;
577 
578         case Formattable::kString:
579             aString = va_arg(ap, UChar*);
580             if(aString){
581                 args[i].getString(temp);
582                 len = temp.length();
583                 temp.extract(0,len,aString);
584                 aString[len]=0;
585             }else{
586                 *status= U_ILLEGAL_ARGUMENT_ERROR;
587             }
588             break;
589 
590         case Formattable::kObject:
591             // This will never happen because MessageFormat doesn't
592             // support kObject.  When MessageFormat is changed to
593             // understand MeasureFormats, modify this code to do the
594             // right thing. [alan]
595             U_ASSERT(FALSE);
596             break;
597 
598         // better not happen!
599         case Formattable::kArray:
600             U_ASSERT(FALSE);
601             break;
602         }
603     }
604 
605     // clean up
606     delete [] args;
607 }
608 
609 #define SINGLE_QUOTE      ((UChar)0x0027)
610 #define CURLY_BRACE_LEFT  ((UChar)0x007B)
611 #define CURLY_BRACE_RIGHT ((UChar)0x007D)
612 
613 #define STATE_INITIAL 0
614 #define STATE_SINGLE_QUOTE 1
615 #define STATE_IN_QUOTE 2
616 #define STATE_MSG_ELEMENT 3
617 
618 #define MAppend(c) if (len < destCapacity) dest[len++] = c; else len++
619 
umsg_autoQuoteApostrophe(const UChar * pattern,int32_t patternLength,UChar * dest,int32_t destCapacity,UErrorCode * ec)620 int32_t umsg_autoQuoteApostrophe(const UChar* pattern,
621                  int32_t patternLength,
622                  UChar* dest,
623                  int32_t destCapacity,
624                  UErrorCode* ec)
625 {
626     int32_t state = STATE_INITIAL;
627     int32_t braceCount = 0;
628     int32_t len = 0;
629 
630     if (ec == NULL || U_FAILURE(*ec)) {
631         return -1;
632     }
633 
634     if (pattern == NULL || patternLength < -1 || (dest == NULL && destCapacity > 0)) {
635         *ec = U_ILLEGAL_ARGUMENT_ERROR;
636         return -1;
637     }
638     U_ASSERT(destCapacity >= 0);
639 
640     if (patternLength == -1) {
641         patternLength = u_strlen(pattern);
642     }
643 
644     for (int i = 0; i < patternLength; ++i) {
645         UChar c = pattern[i];
646         switch (state) {
647         case STATE_INITIAL:
648             switch (c) {
649             case SINGLE_QUOTE:
650                 state = STATE_SINGLE_QUOTE;
651                 break;
652             case CURLY_BRACE_LEFT:
653                 state = STATE_MSG_ELEMENT;
654                 ++braceCount;
655                 break;
656             }
657             break;
658 
659         case STATE_SINGLE_QUOTE:
660             switch (c) {
661             case SINGLE_QUOTE:
662                 state = STATE_INITIAL;
663                 break;
664             case CURLY_BRACE_LEFT:
665             case CURLY_BRACE_RIGHT:
666                 state = STATE_IN_QUOTE;
667                 break;
668             default:
669                 MAppend(SINGLE_QUOTE);
670                 state = STATE_INITIAL;
671                 break;
672             }
673         break;
674 
675         case STATE_IN_QUOTE:
676             switch (c) {
677             case SINGLE_QUOTE:
678                 state = STATE_INITIAL;
679                 break;
680             }
681             break;
682 
683         case STATE_MSG_ELEMENT:
684             switch (c) {
685             case CURLY_BRACE_LEFT:
686                 ++braceCount;
687                 break;
688             case CURLY_BRACE_RIGHT:
689                 if (--braceCount == 0) {
690                     state = STATE_INITIAL;
691                 }
692                 break;
693             }
694             break;
695 
696         default: // Never happens.
697             break;
698         }
699 
700         U_ASSERT(len >= 0);
701         MAppend(c);
702     }
703 
704     // End of scan
705     if (state == STATE_SINGLE_QUOTE || state == STATE_IN_QUOTE) {
706         MAppend(SINGLE_QUOTE);
707     }
708 
709     return u_terminateUChars(dest, destCapacity, len, ec);
710 }
711 
712 #endif /* #if !UCONFIG_NO_FORMATTING */
713