1 /* implements the string, long, and float formatters.  that is,
2    string.__format__, etc. */
3 
4 #include <locale.h>
5 
6 /* Before including this, you must include either:
7    stringlib/unicodedefs.h
8    stringlib/stringdefs.h
9 
10    Also, you should define the names:
11    FORMAT_STRING
12    FORMAT_LONG
13    FORMAT_FLOAT
14    FORMAT_COMPLEX
15    to be whatever you want the public names of these functions to
16    be.  These are the only non-static functions defined here.
17 */
18 
19 /* Raises an exception about an unknown presentation type for this
20  * type. */
21 
22 static void
unknown_presentation_type(STRINGLIB_CHAR presentation_type,const char * type_name)23 unknown_presentation_type(STRINGLIB_CHAR presentation_type,
24                           const char* type_name)
25 {
26 #if STRINGLIB_IS_UNICODE
27     /* If STRINGLIB_CHAR is Py_UNICODE, %c might be out-of-range,
28        hence the two cases. If it is char, gcc complains that the
29        condition below is always true, hence the ifdef. */
30     if (presentation_type > 32 && presentation_type < 128)
31 #endif
32         PyErr_Format(PyExc_ValueError,
33                      "Unknown format code '%c' "
34                      "for object of type '%.200s'",
35                      (char)presentation_type,
36                      type_name);
37 #if STRINGLIB_IS_UNICODE
38     else
39         PyErr_Format(PyExc_ValueError,
40                      "Unknown format code '\\x%x' "
41                      "for object of type '%.200s'",
42                      (unsigned int)presentation_type,
43                      type_name);
44 #endif
45 }
46 
47 static void
invalid_comma_type(STRINGLIB_CHAR presentation_type)48 invalid_comma_type(STRINGLIB_CHAR presentation_type)
49 {
50 #if STRINGLIB_IS_UNICODE
51     /* See comment in unknown_presentation_type */
52     if (presentation_type > 32 && presentation_type < 128)
53 #endif
54         PyErr_Format(PyExc_ValueError,
55                      "Cannot specify ',' with '%c'.",
56                      (char)presentation_type);
57 #if STRINGLIB_IS_UNICODE
58     else
59         PyErr_Format(PyExc_ValueError,
60                      "Cannot specify ',' with '\\x%x'.",
61                      (unsigned int)presentation_type);
62 #endif
63 }
64 
65 /*
66     get_integer consumes 0 or more decimal digit characters from an
67     input string, updates *result with the corresponding positive
68     integer, and returns the number of digits consumed.
69 
70     returns -1 on error.
71 */
72 static int
get_integer(STRINGLIB_CHAR ** ptr,STRINGLIB_CHAR * end,Py_ssize_t * result)73 get_integer(STRINGLIB_CHAR **ptr, STRINGLIB_CHAR *end,
74                   Py_ssize_t *result)
75 {
76     Py_ssize_t accumulator, digitval;
77     int numdigits;
78     accumulator = numdigits = 0;
79     for (;;(*ptr)++, numdigits++) {
80         if (*ptr >= end)
81             break;
82         digitval = STRINGLIB_TODECIMAL(**ptr);
83         if (digitval < 0)
84             break;
85         /*
86            Detect possible overflow before it happens:
87 
88               accumulator * 10 + digitval > PY_SSIZE_T_MAX if and only if
89               accumulator > (PY_SSIZE_T_MAX - digitval) / 10.
90         */
91         if (accumulator > (PY_SSIZE_T_MAX - digitval) / 10) {
92             PyErr_Format(PyExc_ValueError,
93                          "Too many decimal digits in format string");
94             return -1;
95         }
96         accumulator = accumulator * 10 + digitval;
97     }
98     *result = accumulator;
99     return numdigits;
100 }
101 
102 /************************************************************************/
103 /*********** standard format specifier parsing **************************/
104 /************************************************************************/
105 
106 /* returns true if this character is a specifier alignment token */
107 Py_LOCAL_INLINE(int)
is_alignment_token(STRINGLIB_CHAR c)108 is_alignment_token(STRINGLIB_CHAR c)
109 {
110     switch (c) {
111     case '<': case '>': case '=': case '^':
112         return 1;
113     default:
114         return 0;
115     }
116 }
117 
118 /* returns true if this character is a sign element */
119 Py_LOCAL_INLINE(int)
is_sign_element(STRINGLIB_CHAR c)120 is_sign_element(STRINGLIB_CHAR c)
121 {
122     switch (c) {
123     case ' ': case '+': case '-':
124         return 1;
125     default:
126         return 0;
127     }
128 }
129 
130 
131 typedef struct {
132     STRINGLIB_CHAR fill_char;
133     STRINGLIB_CHAR align;
134     int alternate;
135     STRINGLIB_CHAR sign;
136     Py_ssize_t width;
137     int thousands_separators;
138     Py_ssize_t precision;
139     STRINGLIB_CHAR type;
140 } InternalFormatSpec;
141 
142 
143 #if 0
144 /* Occasionally useful for debugging. Should normally be commented out. */
145 static void
146 DEBUG_PRINT_FORMAT_SPEC(InternalFormatSpec *format)
147 {
148     printf("internal format spec: fill_char %d\n", format->fill_char);
149     printf("internal format spec: align %d\n", format->align);
150     printf("internal format spec: alternate %d\n", format->alternate);
151     printf("internal format spec: sign %d\n", format->sign);
152     printf("internal format spec: width %zd\n", format->width);
153     printf("internal format spec: thousands_separators %d\n",
154            format->thousands_separators);
155     printf("internal format spec: precision %zd\n", format->precision);
156     printf("internal format spec: type %c\n", format->type);
157     printf("\n");
158 }
159 #endif
160 
161 
162 /*
163   ptr points to the start of the format_spec, end points just past its end.
164   fills in format with the parsed information.
165   returns 1 on success, 0 on failure.
166   if failure, sets the exception
167 */
168 static int
parse_internal_render_format_spec(STRINGLIB_CHAR * format_spec,Py_ssize_t format_spec_len,InternalFormatSpec * format,char default_type,char default_align)169 parse_internal_render_format_spec(STRINGLIB_CHAR *format_spec,
170                                   Py_ssize_t format_spec_len,
171                                   InternalFormatSpec *format,
172                                   char default_type,
173                                   char default_align)
174 {
175     STRINGLIB_CHAR *ptr = format_spec;
176     STRINGLIB_CHAR *end = format_spec + format_spec_len;
177 
178     /* end-ptr is used throughout this code to specify the length of
179        the input string */
180 
181     Py_ssize_t consumed;
182     int align_specified = 0;
183     int fill_char_specified = 0;
184 
185     format->fill_char = ' ';
186     format->align = default_align;
187     format->alternate = 0;
188     format->sign = '\0';
189     format->width = -1;
190     format->thousands_separators = 0;
191     format->precision = -1;
192     format->type = default_type;
193 
194     /* If the second char is an alignment token,
195        then parse the fill char */
196     if (end-ptr >= 2 && is_alignment_token(ptr[1])) {
197         format->align = ptr[1];
198         format->fill_char = ptr[0];
199         fill_char_specified = 1;
200         align_specified = 1;
201         ptr += 2;
202     }
203     else if (end-ptr >= 1 && is_alignment_token(ptr[0])) {
204         format->align = ptr[0];
205         align_specified = 1;
206         ++ptr;
207     }
208 
209     /* Parse the various sign options */
210     if (end-ptr >= 1 && is_sign_element(ptr[0])) {
211         format->sign = ptr[0];
212         ++ptr;
213     }
214 
215     /* If the next character is #, we're in alternate mode.  This only
216        applies to integers. */
217     if (end-ptr >= 1 && ptr[0] == '#') {
218         format->alternate = 1;
219         ++ptr;
220     }
221 
222     /* The special case for 0-padding (backwards compat) */
223     if (!fill_char_specified && end-ptr >= 1 && ptr[0] == '0') {
224         format->fill_char = '0';
225         if (!align_specified) {
226             format->align = '=';
227         }
228         ++ptr;
229     }
230 
231     consumed = get_integer(&ptr, end, &format->width);
232     if (consumed == -1)
233         /* Overflow error. Exception already set. */
234         return 0;
235 
236     /* If consumed is 0, we didn't consume any characters for the
237        width. In that case, reset the width to -1, because
238        get_integer() will have set it to zero. -1 is how we record
239        that the width wasn't specified. */
240     if (consumed == 0)
241         format->width = -1;
242 
243     /* Comma signifies add thousands separators */
244     if (end-ptr && ptr[0] == ',') {
245         format->thousands_separators = 1;
246         ++ptr;
247     }
248 
249     /* Parse field precision */
250     if (end-ptr && ptr[0] == '.') {
251         ++ptr;
252 
253         consumed = get_integer(&ptr, end, &format->precision);
254         if (consumed == -1)
255             /* Overflow error. Exception already set. */
256             return 0;
257 
258         /* Not having a precision after a dot is an error. */
259         if (consumed == 0) {
260             PyErr_Format(PyExc_ValueError,
261                          "Format specifier missing precision");
262             return 0;
263         }
264 
265     }
266 
267     /* Finally, parse the type field. */
268 
269     if (end-ptr > 1) {
270         /* More than one char remain, invalid conversion spec. */
271         PyErr_Format(PyExc_ValueError, "Invalid conversion specification");
272         return 0;
273     }
274 
275     if (end-ptr == 1) {
276         format->type = ptr[0];
277         ++ptr;
278     }
279 
280     /* Do as much validating as we can, just by looking at the format
281        specifier.  Do not take into account what type of formatting
282        we're doing (int, float, string). */
283 
284     if (format->thousands_separators) {
285         switch (format->type) {
286         case 'd':
287         case 'e':
288         case 'f':
289         case 'g':
290         case 'E':
291         case 'G':
292         case '%':
293         case 'F':
294         case '\0':
295             /* These are allowed. See PEP 378.*/
296             break;
297         default:
298             invalid_comma_type(format->type);
299             return 0;
300         }
301     }
302 
303     return 1;
304 }
305 
306 /* Calculate the padding needed. */
307 static void
calc_padding(Py_ssize_t nchars,Py_ssize_t width,STRINGLIB_CHAR align,Py_ssize_t * n_lpadding,Py_ssize_t * n_rpadding,Py_ssize_t * n_total)308 calc_padding(Py_ssize_t nchars, Py_ssize_t width, STRINGLIB_CHAR align,
309              Py_ssize_t *n_lpadding, Py_ssize_t *n_rpadding,
310              Py_ssize_t *n_total)
311 {
312     if (width >= 0) {
313         if (nchars > width)
314             *n_total = nchars;
315         else
316             *n_total = width;
317     }
318     else {
319         /* not specified, use all of the chars and no more */
320         *n_total = nchars;
321     }
322 
323     /* Figure out how much leading space we need, based on the
324        aligning */
325     if (align == '>')
326         *n_lpadding = *n_total - nchars;
327     else if (align == '^')
328         *n_lpadding = (*n_total - nchars) / 2;
329     else if (align == '<' || align == '=')
330         *n_lpadding = 0;
331     else {
332         /* We should never have an unspecified alignment. */
333         *n_lpadding = 0;
334         assert(0);
335     }
336 
337     *n_rpadding = *n_total - nchars - *n_lpadding;
338 }
339 
340 /* Do the padding, and return a pointer to where the caller-supplied
341    content goes. */
342 static STRINGLIB_CHAR *
fill_padding(STRINGLIB_CHAR * p,Py_ssize_t nchars,STRINGLIB_CHAR fill_char,Py_ssize_t n_lpadding,Py_ssize_t n_rpadding)343 fill_padding(STRINGLIB_CHAR *p, Py_ssize_t nchars, STRINGLIB_CHAR fill_char,
344              Py_ssize_t n_lpadding, Py_ssize_t n_rpadding)
345 {
346     /* Pad on left. */
347     if (n_lpadding)
348         STRINGLIB_FILL(p, fill_char, n_lpadding);
349 
350     /* Pad on right. */
351     if (n_rpadding)
352         STRINGLIB_FILL(p + nchars + n_lpadding, fill_char, n_rpadding);
353 
354     /* Pointer to the user content. */
355     return p + n_lpadding;
356 }
357 
358 #if defined FORMAT_FLOAT || defined FORMAT_LONG || defined FORMAT_COMPLEX
359 /************************************************************************/
360 /*********** common routines for numeric formatting *********************/
361 /************************************************************************/
362 
363 /* Locale type codes. */
364 #define LT_CURRENT_LOCALE 0
365 #define LT_DEFAULT_LOCALE 1
366 #define LT_NO_LOCALE 2
367 
368 /* Locale info needed for formatting integers and the part of floats
369    before and including the decimal. Note that locales only support
370    8-bit chars, not unicode. */
371 typedef struct {
372     char *decimal_point;
373     char *thousands_sep;
374     char *grouping;
375 } LocaleInfo;
376 
377 /* describes the layout for an integer, see the comment in
378    calc_number_widths() for details */
379 typedef struct {
380     Py_ssize_t n_lpadding;
381     Py_ssize_t n_prefix;
382     Py_ssize_t n_spadding;
383     Py_ssize_t n_rpadding;
384     char sign;
385     Py_ssize_t n_sign;      /* number of digits needed for sign (0/1) */
386     Py_ssize_t n_grouped_digits; /* Space taken up by the digits, including
387                                     any grouping chars. */
388     Py_ssize_t n_decimal;   /* 0 if only an integer */
389     Py_ssize_t n_remainder; /* Digits in decimal and/or exponent part,
390                                excluding the decimal itself, if
391                                present. */
392 
393     /* These 2 are not the widths of fields, but are needed by
394        STRINGLIB_GROUPING. */
395     Py_ssize_t n_digits;    /* The number of digits before a decimal
396                                or exponent. */
397     Py_ssize_t n_min_width; /* The min_width we used when we computed
398                                the n_grouped_digits width. */
399 } NumberFieldWidths;
400 
401 
402 /* Given a number of the form:
403    digits[remainder]
404    where ptr points to the start and end points to the end, find where
405     the integer part ends. This could be a decimal, an exponent, both,
406     or neither.
407    If a decimal point is present, set *has_decimal and increment
408     remainder beyond it.
409    Results are undefined (but shouldn't crash) for improperly
410     formatted strings.
411 */
412 static void
parse_number(STRINGLIB_CHAR * ptr,Py_ssize_t len,Py_ssize_t * n_remainder,int * has_decimal)413 parse_number(STRINGLIB_CHAR *ptr, Py_ssize_t len,
414              Py_ssize_t *n_remainder, int *has_decimal)
415 {
416     STRINGLIB_CHAR *end = ptr + len;
417     STRINGLIB_CHAR *remainder;
418 
419     while (ptr<end && isdigit(*ptr))
420         ++ptr;
421     remainder = ptr;
422 
423     /* Does remainder start with a decimal point? */
424     *has_decimal = ptr<end && *remainder == '.';
425 
426     /* Skip the decimal point. */
427     if (*has_decimal)
428         remainder++;
429 
430     *n_remainder = end - remainder;
431 }
432 
433 /* not all fields of format are used.  for example, precision is
434    unused.  should this take discrete params in order to be more clear
435    about what it does?  or is passing a single format parameter easier
436    and more efficient enough to justify a little obfuscation? */
437 static Py_ssize_t
calc_number_widths(NumberFieldWidths * spec,Py_ssize_t n_prefix,STRINGLIB_CHAR sign_char,STRINGLIB_CHAR * number,Py_ssize_t n_number,Py_ssize_t n_remainder,int has_decimal,const LocaleInfo * locale,const InternalFormatSpec * format)438 calc_number_widths(NumberFieldWidths *spec, Py_ssize_t n_prefix,
439                    STRINGLIB_CHAR sign_char, STRINGLIB_CHAR *number,
440                    Py_ssize_t n_number, Py_ssize_t n_remainder,
441                    int has_decimal, const LocaleInfo *locale,
442                    const InternalFormatSpec *format)
443 {
444     Py_ssize_t n_non_digit_non_padding;
445     Py_ssize_t n_padding;
446 
447     spec->n_digits = n_number - n_remainder - (has_decimal?1:0);
448     spec->n_lpadding = 0;
449     spec->n_prefix = n_prefix;
450     spec->n_decimal = has_decimal ? strlen(locale->decimal_point) : 0;
451     spec->n_remainder = n_remainder;
452     spec->n_spadding = 0;
453     spec->n_rpadding = 0;
454     spec->sign = '\0';
455     spec->n_sign = 0;
456 
457     /* the output will look like:
458        |                                                                                         |
459        | <lpadding> <sign> <prefix> <spadding> <grouped_digits> <decimal> <remainder> <rpadding> |
460        |                                                                                         |
461 
462        sign is computed from format->sign and the actual
463        sign of the number
464 
465        prefix is given (it's for the '0x' prefix)
466 
467        digits is already known
468 
469        the total width is either given, or computed from the
470        actual digits
471 
472        only one of lpadding, spadding, and rpadding can be non-zero,
473        and it's calculated from the width and other fields
474     */
475 
476     /* compute the various parts we're going to write */
477     switch (format->sign) {
478     case '+':
479         /* always put a + or - */
480         spec->n_sign = 1;
481         spec->sign = (sign_char == '-' ? '-' : '+');
482         break;
483     case ' ':
484         spec->n_sign = 1;
485         spec->sign = (sign_char == '-' ? '-' : ' ');
486         break;
487     default:
488         /* Not specified, or the default (-) */
489         if (sign_char == '-') {
490             spec->n_sign = 1;
491             spec->sign = '-';
492         }
493     }
494 
495     /* The number of chars used for non-digits and non-padding. */
496     n_non_digit_non_padding = spec->n_sign + spec->n_prefix + spec->n_decimal +
497         spec->n_remainder;
498 
499     /* min_width can go negative, that's okay. format->width == -1 means
500        we don't care. */
501     if (format->fill_char == '0' && format->align == '=')
502         spec->n_min_width = format->width - n_non_digit_non_padding;
503     else
504         spec->n_min_width = 0;
505 
506     if (spec->n_digits == 0)
507         /* This case only occurs when using 'c' formatting, we need
508            to special case it because the grouping code always wants
509            to have at least one character. */
510         spec->n_grouped_digits = 0;
511     else
512         spec->n_grouped_digits = STRINGLIB_GROUPING(NULL, 0, NULL,
513                                                     spec->n_digits,
514                                                     spec->n_min_width,
515                                                     locale->grouping,
516                                                     locale->thousands_sep);
517 
518     /* Given the desired width and the total of digit and non-digit
519        space we consume, see if we need any padding. format->width can
520        be negative (meaning no padding), but this code still works in
521        that case. */
522     n_padding = format->width -
523                         (n_non_digit_non_padding + spec->n_grouped_digits);
524     if (n_padding > 0) {
525         /* Some padding is needed. Determine if it's left, space, or right. */
526         switch (format->align) {
527         case '<':
528             spec->n_rpadding = n_padding;
529             break;
530         case '^':
531             spec->n_lpadding = n_padding / 2;
532             spec->n_rpadding = n_padding - spec->n_lpadding;
533             break;
534         case '=':
535             spec->n_spadding = n_padding;
536             break;
537         case '>':
538             spec->n_lpadding = n_padding;
539             break;
540         default:
541             /* Shouldn't get here, but treat it as '>' */
542             spec->n_lpadding = n_padding;
543             assert(0);
544             break;
545         }
546     }
547     return spec->n_lpadding + spec->n_sign + spec->n_prefix +
548         spec->n_spadding + spec->n_grouped_digits + spec->n_decimal +
549         spec->n_remainder + spec->n_rpadding;
550 }
551 
552 /* Fill in the digit parts of a numbers's string representation,
553    as determined in calc_number_widths().
554    No error checking, since we know the buffer is the correct size. */
555 static void
fill_number(STRINGLIB_CHAR * buf,const NumberFieldWidths * spec,STRINGLIB_CHAR * digits,Py_ssize_t n_digits,STRINGLIB_CHAR * prefix,STRINGLIB_CHAR fill_char,LocaleInfo * locale,int toupper)556 fill_number(STRINGLIB_CHAR *buf, const NumberFieldWidths *spec,
557             STRINGLIB_CHAR *digits, Py_ssize_t n_digits,
558             STRINGLIB_CHAR *prefix, STRINGLIB_CHAR fill_char,
559             LocaleInfo *locale, int toupper)
560 {
561     /* Used to keep track of digits, decimal, and remainder. */
562     STRINGLIB_CHAR *p = digits;
563 
564 #ifndef NDEBUG
565     Py_ssize_t r;
566 #endif
567 
568     if (spec->n_lpadding) {
569         STRINGLIB_FILL(buf, fill_char, spec->n_lpadding);
570         buf += spec->n_lpadding;
571     }
572     if (spec->n_sign == 1) {
573         *buf++ = spec->sign;
574     }
575     if (spec->n_prefix) {
576         memmove(buf,
577                 prefix,
578                 spec->n_prefix * sizeof(STRINGLIB_CHAR));
579         if (toupper) {
580             Py_ssize_t t;
581             for (t = 0; t < spec->n_prefix; ++t)
582                 buf[t] = STRINGLIB_TOUPPER(buf[t]);
583         }
584         buf += spec->n_prefix;
585     }
586     if (spec->n_spadding) {
587         STRINGLIB_FILL(buf, fill_char, spec->n_spadding);
588         buf += spec->n_spadding;
589     }
590 
591     /* Only for type 'c' special case, it has no digits. */
592     if (spec->n_digits != 0) {
593         /* Fill the digits with InsertThousandsGrouping. */
594 #ifndef NDEBUG
595         r =
596 #endif
597             STRINGLIB_GROUPING(buf, spec->n_grouped_digits, digits,
598                                spec->n_digits, spec->n_min_width,
599                                locale->grouping, locale->thousands_sep);
600 #ifndef NDEBUG
601         assert(r == spec->n_grouped_digits);
602 #endif
603         p += spec->n_digits;
604     }
605     if (toupper) {
606         Py_ssize_t t;
607         for (t = 0; t < spec->n_grouped_digits; ++t)
608             buf[t] = STRINGLIB_TOUPPER(buf[t]);
609     }
610     buf += spec->n_grouped_digits;
611 
612     if (spec->n_decimal) {
613         Py_ssize_t t;
614         for (t = 0; t < spec->n_decimal; ++t)
615             buf[t] = locale->decimal_point[t];
616         buf += spec->n_decimal;
617         p += 1;
618     }
619 
620     if (spec->n_remainder) {
621         memcpy(buf, p, spec->n_remainder * sizeof(STRINGLIB_CHAR));
622         buf += spec->n_remainder;
623         p += spec->n_remainder;
624     }
625 
626     if (spec->n_rpadding) {
627         STRINGLIB_FILL(buf, fill_char, spec->n_rpadding);
628         buf += spec->n_rpadding;
629     }
630 }
631 
632 static char no_grouping[1] = {CHAR_MAX};
633 
634 /* Find the decimal point character(s?), thousands_separator(s?), and
635    grouping description, either for the current locale if type is
636    LT_CURRENT_LOCALE, a hard-coded locale if LT_DEFAULT_LOCALE, or
637    none if LT_NO_LOCALE. */
638 static void
get_locale_info(int type,LocaleInfo * locale_info)639 get_locale_info(int type, LocaleInfo *locale_info)
640 {
641     switch (type) {
642     case LT_CURRENT_LOCALE: {
643         struct lconv *locale_data = localeconv();
644         locale_info->decimal_point = locale_data->decimal_point;
645         locale_info->thousands_sep = locale_data->thousands_sep;
646         locale_info->grouping = locale_data->grouping;
647         break;
648     }
649     case LT_DEFAULT_LOCALE:
650         locale_info->decimal_point = ".";
651         locale_info->thousands_sep = ",";
652         locale_info->grouping = "\3"; /* Group every 3 characters.  The
653                                          (implicit) trailing 0 means repeat
654                                          infinitely. */
655         break;
656     case LT_NO_LOCALE:
657         locale_info->decimal_point = ".";
658         locale_info->thousands_sep = "";
659         locale_info->grouping = no_grouping;
660         break;
661     default:
662         assert(0);
663     }
664 }
665 
666 #endif /* FORMAT_FLOAT || FORMAT_LONG || FORMAT_COMPLEX */
667 
668 /************************************************************************/
669 /*********** string formatting ******************************************/
670 /************************************************************************/
671 
672 static PyObject *
format_string_internal(PyObject * value,const InternalFormatSpec * format)673 format_string_internal(PyObject *value, const InternalFormatSpec *format)
674 {
675     Py_ssize_t lpad;
676     Py_ssize_t rpad;
677     Py_ssize_t total;
678     STRINGLIB_CHAR *p;
679     Py_ssize_t len = STRINGLIB_LEN(value);
680     PyObject *result = NULL;
681 
682     /* sign is not allowed on strings */
683     if (format->sign != '\0') {
684         PyErr_SetString(PyExc_ValueError,
685                         "Sign not allowed in string format specifier");
686         goto done;
687     }
688 
689     /* alternate is not allowed on strings */
690     if (format->alternate) {
691         PyErr_SetString(PyExc_ValueError,
692                         "Alternate form (#) not allowed in string format "
693                         "specifier");
694         goto done;
695     }
696 
697     /* '=' alignment not allowed on strings */
698     if (format->align == '=') {
699         PyErr_SetString(PyExc_ValueError,
700                         "'=' alignment not allowed "
701                         "in string format specifier");
702         goto done;
703     }
704 
705     /* if precision is specified, output no more that format.precision
706        characters */
707     if (format->precision >= 0 && len >= format->precision) {
708         len = format->precision;
709     }
710 
711     calc_padding(len, format->width, format->align, &lpad, &rpad, &total);
712 
713     /* allocate the resulting string */
714     result = STRINGLIB_NEW(NULL, total);
715     if (result == NULL)
716         goto done;
717 
718     /* Write into that space. First the padding. */
719     p = fill_padding(STRINGLIB_STR(result), len,
720                      format->fill_char, lpad, rpad);
721 
722     /* Then the source string. */
723     memcpy(p, STRINGLIB_STR(value), len * sizeof(STRINGLIB_CHAR));
724 
725 done:
726     return result;
727 }
728 
729 
730 /************************************************************************/
731 /*********** long formatting ********************************************/
732 /************************************************************************/
733 
734 #if defined FORMAT_LONG || defined FORMAT_INT
735 typedef PyObject*
736 (*IntOrLongToString)(PyObject *value, int base);
737 
738 static PyObject *
format_int_or_long_internal(PyObject * value,const InternalFormatSpec * format,IntOrLongToString tostring)739 format_int_or_long_internal(PyObject *value, const InternalFormatSpec *format,
740                             IntOrLongToString tostring)
741 {
742     PyObject *result = NULL;
743     PyObject *tmp = NULL;
744     STRINGLIB_CHAR *pnumeric_chars;
745     STRINGLIB_CHAR numeric_char;
746     STRINGLIB_CHAR sign_char = '\0';
747     Py_ssize_t n_digits;       /* count of digits need from the computed
748                                   string */
749     Py_ssize_t n_remainder = 0; /* Used only for 'c' formatting, which
750                                    produces non-digits */
751     Py_ssize_t n_prefix = 0;   /* Count of prefix chars, (e.g., '0x') */
752     Py_ssize_t n_total;
753     STRINGLIB_CHAR *prefix = NULL;
754     NumberFieldWidths spec;
755     long x;
756 
757     /* Locale settings, either from the actual locale or
758        from a hard-code pseudo-locale */
759     LocaleInfo locale;
760 
761     /* no precision allowed on integers */
762     if (format->precision != -1) {
763         PyErr_SetString(PyExc_ValueError,
764                         "Precision not allowed in integer format specifier");
765         goto done;
766     }
767 
768     /* special case for character formatting */
769     if (format->type == 'c') {
770         /* error to specify a sign */
771         if (format->sign != '\0') {
772             PyErr_SetString(PyExc_ValueError,
773                             "Sign not allowed with integer"
774                             " format specifier 'c'");
775             goto done;
776         }
777 
778         /* Error to specify a comma. */
779         if (format->thousands_separators) {
780             PyErr_SetString(PyExc_ValueError,
781                             "Thousands separators not allowed with integer"
782                             " format specifier 'c'");
783             goto done;
784         }
785 
786         /* taken from unicodeobject.c formatchar() */
787         /* Integer input truncated to a character */
788 /* XXX: won't work for int */
789         x = PyLong_AsLong(value);
790         if (x == -1 && PyErr_Occurred())
791             goto done;
792 #if STRINGLIB_IS_UNICODE
793 #ifdef Py_UNICODE_WIDE
794         if (x < 0 || x > 0x10ffff) {
795             PyErr_SetString(PyExc_OverflowError,
796                             "%c arg not in range(0x110000) "
797                             "(wide Python build)");
798             goto done;
799         }
800 #else
801         if (x < 0 || x > 0xffff) {
802             PyErr_SetString(PyExc_OverflowError,
803                             "%c arg not in range(0x10000) "
804                             "(narrow Python build)");
805             goto done;
806         }
807 #endif
808 #else
809         if (x < 0 || x > 0xff) {
810             PyErr_SetString(PyExc_OverflowError,
811                             "%c arg not in range(0x100)");
812             goto done;
813         }
814 #endif
815         numeric_char = (STRINGLIB_CHAR)x;
816         pnumeric_chars = &numeric_char;
817         n_digits = 1;
818 
819         /* As a sort-of hack, we tell calc_number_widths that we only
820            have "remainder" characters. calc_number_widths thinks
821            these are characters that don't get formatted, only copied
822            into the output string. We do this for 'c' formatting,
823            because the characters are likely to be non-digits. */
824         n_remainder = 1;
825     }
826     else {
827         int base;
828         int leading_chars_to_skip = 0;  /* Number of characters added by
829                                            PyNumber_ToBase that we want to
830                                            skip over. */
831 
832         /* Compute the base and how many characters will be added by
833            PyNumber_ToBase */
834         switch (format->type) {
835         case 'b':
836             base = 2;
837             leading_chars_to_skip = 2; /* 0b */
838             break;
839         case 'o':
840             base = 8;
841             leading_chars_to_skip = 2; /* 0o */
842             break;
843         case 'x':
844         case 'X':
845             base = 16;
846             leading_chars_to_skip = 2; /* 0x */
847             break;
848         default:  /* shouldn't be needed, but stops a compiler warning */
849         case 'd':
850         case 'n':
851             base = 10;
852             break;
853         }
854 
855         /* The number of prefix chars is the same as the leading
856            chars to skip */
857         if (format->alternate)
858             n_prefix = leading_chars_to_skip;
859 
860         /* Do the hard part, converting to a string in a given base */
861         tmp = tostring(value, base);
862         if (tmp == NULL)
863             goto done;
864 
865         pnumeric_chars = STRINGLIB_STR(tmp);
866         n_digits = STRINGLIB_LEN(tmp);
867 
868         prefix = pnumeric_chars;
869 
870         /* Remember not to modify what pnumeric_chars points to.  it
871            might be interned.  Only modify it after we copy it into a
872            newly allocated output buffer. */
873 
874         /* Is a sign character present in the output?  If so, remember it
875            and skip it */
876         if (pnumeric_chars[0] == '-') {
877             sign_char = pnumeric_chars[0];
878             ++prefix;
879             ++leading_chars_to_skip;
880         }
881 
882         /* Skip over the leading chars (0x, 0b, etc.) */
883         n_digits -= leading_chars_to_skip;
884         pnumeric_chars += leading_chars_to_skip;
885     }
886 
887     /* Determine the grouping, separator, and decimal point, if any. */
888     get_locale_info(format->type == 'n' ? LT_CURRENT_LOCALE :
889                     (format->thousands_separators ?
890                      LT_DEFAULT_LOCALE :
891                      LT_NO_LOCALE),
892                     &locale);
893 
894     /* Calculate how much memory we'll need. */
895     n_total = calc_number_widths(&spec, n_prefix, sign_char, pnumeric_chars,
896                        n_digits, n_remainder, 0, &locale, format);
897 
898     /* Allocate the memory. */
899     result = STRINGLIB_NEW(NULL, n_total);
900     if (!result)
901         goto done;
902 
903     /* Populate the memory. */
904     fill_number(STRINGLIB_STR(result), &spec, pnumeric_chars, n_digits,
905                 prefix, format->fill_char, &locale, format->type == 'X');
906 
907 done:
908     Py_XDECREF(tmp);
909     return result;
910 }
911 #endif /* defined FORMAT_LONG || defined FORMAT_INT */
912 
913 /************************************************************************/
914 /*********** float formatting *******************************************/
915 /************************************************************************/
916 
917 #ifdef FORMAT_FLOAT
918 #if STRINGLIB_IS_UNICODE
919 static void
strtounicode(Py_UNICODE * buffer,const char * charbuffer,Py_ssize_t len)920 strtounicode(Py_UNICODE *buffer, const char *charbuffer, Py_ssize_t len)
921 {
922     Py_ssize_t i;
923     for (i = 0; i < len; ++i)
924         buffer[i] = (Py_UNICODE)charbuffer[i];
925 }
926 #endif
927 
928 /* much of this is taken from unicodeobject.c */
929 static PyObject *
format_float_internal(PyObject * value,const InternalFormatSpec * format)930 format_float_internal(PyObject *value,
931                       const InternalFormatSpec *format)
932 {
933     char *buf = NULL;       /* buffer returned from PyOS_double_to_string */
934     Py_ssize_t n_digits;
935     Py_ssize_t n_remainder;
936     Py_ssize_t n_total;
937     int has_decimal;
938     double val;
939     Py_ssize_t precision;
940     Py_ssize_t default_precision = 6;
941     STRINGLIB_CHAR type = format->type;
942     int add_pct = 0;
943     STRINGLIB_CHAR *p;
944     NumberFieldWidths spec;
945     int flags = 0;
946     PyObject *result = NULL;
947     STRINGLIB_CHAR sign_char = '\0';
948     int float_type; /* Used to see if we have a nan, inf, or regular float. */
949 
950 #if STRINGLIB_IS_UNICODE
951     Py_UNICODE *unicode_tmp = NULL;
952 #endif
953 
954     /* Locale settings, either from the actual locale or
955        from a hard-code pseudo-locale */
956     LocaleInfo locale;
957 
958     if (format->precision > INT_MAX) {
959         PyErr_SetString(PyExc_ValueError, "precision too big");
960         goto done;
961     }
962     precision = (int)format->precision;
963 
964     /* Alternate is not allowed on floats. */
965     if (format->alternate) {
966         PyErr_SetString(PyExc_ValueError,
967                         "Alternate form (#) not allowed in float format "
968                         "specifier");
969         goto done;
970     }
971 
972     if (type == '\0') {
973         /* Omitted type specifier. This is like 'g' but with at least one
974            digit after the decimal point, and different default precision.*/
975         type = 'g';
976         default_precision = PyFloat_STR_PRECISION;
977         flags |= Py_DTSF_ADD_DOT_0;
978     }
979 
980     if (type == 'n')
981         /* 'n' is the same as 'g', except for the locale used to
982            format the result. We take care of that later. */
983         type = 'g';
984 
985     val = PyFloat_AsDouble(value);
986     if (val == -1.0 && PyErr_Occurred())
987         goto done;
988 
989     if (type == '%') {
990         type = 'f';
991         val *= 100;
992         add_pct = 1;
993     }
994 
995     if (precision < 0)
996         precision = default_precision;
997 
998     /* Cast "type", because if we're in unicode we need to pass an
999        8-bit char. This is safe, because we've restricted what "type"
1000        can be. */
1001     buf = PyOS_double_to_string(val, (char)type, precision, flags,
1002                                 &float_type);
1003     if (buf == NULL)
1004         goto done;
1005     n_digits = strlen(buf);
1006 
1007     if (add_pct) {
1008         /* We know that buf has a trailing zero (since we just called
1009            strlen() on it), and we don't use that fact any more. So we
1010            can just write over the trailing zero. */
1011         buf[n_digits] = '%';
1012         n_digits += 1;
1013     }
1014 
1015     /* Since there is no unicode version of PyOS_double_to_string,
1016        just use the 8 bit version and then convert to unicode. */
1017 #if STRINGLIB_IS_UNICODE
1018     unicode_tmp = (Py_UNICODE*)PyMem_Malloc((n_digits)*sizeof(Py_UNICODE));
1019     if (unicode_tmp == NULL) {
1020         PyErr_NoMemory();
1021         goto done;
1022     }
1023     strtounicode(unicode_tmp, buf, n_digits);
1024     p = unicode_tmp;
1025 #else
1026     p = buf;
1027 #endif
1028 
1029     /* Is a sign character present in the output?  If so, remember it
1030        and skip it */
1031     if (*p == '-') {
1032         sign_char = *p;
1033         ++p;
1034         --n_digits;
1035     }
1036 
1037     /* Determine if we have any "remainder" (after the digits, might include
1038        decimal or exponent or both (or neither)) */
1039     parse_number(p, n_digits, &n_remainder, &has_decimal);
1040 
1041     /* Determine the grouping, separator, and decimal point, if any. */
1042     get_locale_info(format->type == 'n' ? LT_CURRENT_LOCALE :
1043                     (format->thousands_separators ?
1044                      LT_DEFAULT_LOCALE :
1045                      LT_NO_LOCALE),
1046                     &locale);
1047 
1048     /* Calculate how much memory we'll need. */
1049     n_total = calc_number_widths(&spec, 0, sign_char, p, n_digits,
1050                                  n_remainder, has_decimal, &locale, format);
1051 
1052     /* Allocate the memory. */
1053     result = STRINGLIB_NEW(NULL, n_total);
1054     if (result == NULL)
1055         goto done;
1056 
1057     /* Populate the memory. */
1058     fill_number(STRINGLIB_STR(result), &spec, p, n_digits, NULL,
1059                 format->fill_char, &locale, 0);
1060 
1061 done:
1062     PyMem_Free(buf);
1063 #if STRINGLIB_IS_UNICODE
1064     PyMem_Free(unicode_tmp);
1065 #endif
1066     return result;
1067 }
1068 #endif /* FORMAT_FLOAT */
1069 
1070 /************************************************************************/
1071 /*********** complex formatting *****************************************/
1072 /************************************************************************/
1073 
1074 #ifdef FORMAT_COMPLEX
1075 
1076 static PyObject *
format_complex_internal(PyObject * value,const InternalFormatSpec * format)1077 format_complex_internal(PyObject *value,
1078                         const InternalFormatSpec *format)
1079 {
1080     double re;
1081     double im;
1082     char *re_buf = NULL;       /* buffer returned from PyOS_double_to_string */
1083     char *im_buf = NULL;       /* buffer returned from PyOS_double_to_string */
1084 
1085     InternalFormatSpec tmp_format = *format;
1086     Py_ssize_t n_re_digits;
1087     Py_ssize_t n_im_digits;
1088     Py_ssize_t n_re_remainder;
1089     Py_ssize_t n_im_remainder;
1090     Py_ssize_t n_re_total;
1091     Py_ssize_t n_im_total;
1092     int re_has_decimal;
1093     int im_has_decimal;
1094     Py_ssize_t precision;
1095     Py_ssize_t default_precision = 6;
1096     STRINGLIB_CHAR type = format->type;
1097     STRINGLIB_CHAR *p_re;
1098     STRINGLIB_CHAR *p_im;
1099     NumberFieldWidths re_spec;
1100     NumberFieldWidths im_spec;
1101     int flags = 0;
1102     PyObject *result = NULL;
1103     STRINGLIB_CHAR *p;
1104     STRINGLIB_CHAR re_sign_char = '\0';
1105     STRINGLIB_CHAR im_sign_char = '\0';
1106     int re_float_type; /* Used to see if we have a nan, inf, or regular float. */
1107     int im_float_type;
1108     int add_parens = 0;
1109     int skip_re = 0;
1110     Py_ssize_t lpad;
1111     Py_ssize_t rpad;
1112     Py_ssize_t total;
1113 
1114 #if STRINGLIB_IS_UNICODE
1115     Py_UNICODE *re_unicode_tmp = NULL;
1116     Py_UNICODE *im_unicode_tmp = NULL;
1117 #endif
1118 
1119     /* Locale settings, either from the actual locale or
1120        from a hard-code pseudo-locale */
1121     LocaleInfo locale;
1122 
1123     if (format->precision > INT_MAX) {
1124         PyErr_SetString(PyExc_ValueError, "precision too big");
1125         goto done;
1126     }
1127     precision = (int)format->precision;
1128 
1129     /* Alternate is not allowed on complex. */
1130     if (format->alternate) {
1131         PyErr_SetString(PyExc_ValueError,
1132                         "Alternate form (#) not allowed in complex format "
1133                         "specifier");
1134         goto done;
1135     }
1136 
1137     /* Neither is zero pading. */
1138     if (format->fill_char == '0') {
1139         PyErr_SetString(PyExc_ValueError,
1140                         "Zero padding is not allowed in complex format "
1141                         "specifier");
1142         goto done;
1143     }
1144 
1145     /* Neither is '=' alignment . */
1146     if (format->align == '=') {
1147         PyErr_SetString(PyExc_ValueError,
1148                         "'=' alignment flag is not allowed in complex format "
1149                         "specifier");
1150         goto done;
1151     }
1152 
1153     re = PyComplex_RealAsDouble(value);
1154     if (re == -1.0 && PyErr_Occurred())
1155         goto done;
1156     im = PyComplex_ImagAsDouble(value);
1157     if (im == -1.0 && PyErr_Occurred())
1158         goto done;
1159 
1160     if (type == '\0') {
1161         /* Omitted type specifier. Should be like str(self). */
1162         type = 'g';
1163         default_precision = PyFloat_STR_PRECISION;
1164         if (re == 0.0 && copysign(1.0, re) == 1.0)
1165             skip_re = 1;
1166         else
1167             add_parens = 1;
1168     }
1169 
1170     if (type == 'n')
1171         /* 'n' is the same as 'g', except for the locale used to
1172            format the result. We take care of that later. */
1173         type = 'g';
1174 
1175     if (precision < 0)
1176         precision = default_precision;
1177 
1178     /* Cast "type", because if we're in unicode we need to pass an
1179        8-bit char. This is safe, because we've restricted what "type"
1180        can be. */
1181     re_buf = PyOS_double_to_string(re, (char)type, precision, flags,
1182                                    &re_float_type);
1183     if (re_buf == NULL)
1184         goto done;
1185     im_buf = PyOS_double_to_string(im, (char)type, precision, flags,
1186                                    &im_float_type);
1187     if (im_buf == NULL)
1188         goto done;
1189 
1190     n_re_digits = strlen(re_buf);
1191     n_im_digits = strlen(im_buf);
1192 
1193     /* Since there is no unicode version of PyOS_double_to_string,
1194        just use the 8 bit version and then convert to unicode. */
1195 #if STRINGLIB_IS_UNICODE
1196     re_unicode_tmp = (Py_UNICODE*)PyMem_Malloc((n_re_digits)*sizeof(Py_UNICODE));
1197     if (re_unicode_tmp == NULL) {
1198         PyErr_NoMemory();
1199         goto done;
1200     }
1201     strtounicode(re_unicode_tmp, re_buf, n_re_digits);
1202     p_re = re_unicode_tmp;
1203 
1204     im_unicode_tmp = (Py_UNICODE*)PyMem_Malloc((n_im_digits)*sizeof(Py_UNICODE));
1205     if (im_unicode_tmp == NULL) {
1206         PyErr_NoMemory();
1207         goto done;
1208     }
1209     strtounicode(im_unicode_tmp, im_buf, n_im_digits);
1210     p_im = im_unicode_tmp;
1211 #else
1212     p_re = re_buf;
1213     p_im = im_buf;
1214 #endif
1215 
1216     /* Is a sign character present in the output?  If so, remember it
1217        and skip it */
1218     if (*p_re == '-') {
1219         re_sign_char = *p_re;
1220         ++p_re;
1221         --n_re_digits;
1222     }
1223     if (*p_im == '-') {
1224         im_sign_char = *p_im;
1225         ++p_im;
1226         --n_im_digits;
1227     }
1228 
1229     /* Determine if we have any "remainder" (after the digits, might include
1230        decimal or exponent or both (or neither)) */
1231     parse_number(p_re, n_re_digits, &n_re_remainder, &re_has_decimal);
1232     parse_number(p_im, n_im_digits, &n_im_remainder, &im_has_decimal);
1233 
1234     /* Determine the grouping, separator, and decimal point, if any. */
1235     get_locale_info(format->type == 'n' ? LT_CURRENT_LOCALE :
1236                     (format->thousands_separators ?
1237                      LT_DEFAULT_LOCALE :
1238                      LT_NO_LOCALE),
1239                     &locale);
1240 
1241     /* Turn off any padding. We'll do it later after we've composed
1242        the numbers without padding. */
1243     tmp_format.fill_char = '\0';
1244     tmp_format.align = '<';
1245     tmp_format.width = -1;
1246 
1247     /* Calculate how much memory we'll need. */
1248     n_re_total = calc_number_widths(&re_spec, 0, re_sign_char, p_re,
1249                                     n_re_digits, n_re_remainder,
1250                                     re_has_decimal, &locale, &tmp_format);
1251 
1252     /* Same formatting, but always include a sign, unless the real part is
1253      * going to be omitted, in which case we use whatever sign convention was
1254      * requested by the original format. */
1255     if (!skip_re)
1256         tmp_format.sign = '+';
1257     n_im_total = calc_number_widths(&im_spec, 0, im_sign_char, p_im,
1258                                     n_im_digits, n_im_remainder,
1259                                     im_has_decimal, &locale, &tmp_format);
1260 
1261     if (skip_re)
1262         n_re_total = 0;
1263 
1264     /* Add 1 for the 'j', and optionally 2 for parens. */
1265     calc_padding(n_re_total + n_im_total + 1 + add_parens * 2,
1266                  format->width, format->align, &lpad, &rpad, &total);
1267 
1268     result = STRINGLIB_NEW(NULL, total);
1269     if (result == NULL)
1270         goto done;
1271 
1272     /* Populate the memory. First, the padding. */
1273     p = fill_padding(STRINGLIB_STR(result),
1274                      n_re_total + n_im_total + 1 + add_parens * 2,
1275                      format->fill_char, lpad, rpad);
1276 
1277     if (add_parens)
1278         *p++ = '(';
1279 
1280     if (!skip_re) {
1281         fill_number(p, &re_spec, p_re, n_re_digits, NULL, 0, &locale, 0);
1282         p += n_re_total;
1283     }
1284     fill_number(p, &im_spec, p_im, n_im_digits, NULL, 0, &locale, 0);
1285     p += n_im_total;
1286     *p++ = 'j';
1287 
1288     if (add_parens)
1289         *p++ = ')';
1290 
1291 done:
1292     PyMem_Free(re_buf);
1293     PyMem_Free(im_buf);
1294 #if STRINGLIB_IS_UNICODE
1295     PyMem_Free(re_unicode_tmp);
1296     PyMem_Free(im_unicode_tmp);
1297 #endif
1298     return result;
1299 }
1300 #endif /* FORMAT_COMPLEX */
1301 
1302 /************************************************************************/
1303 /*********** built in formatters ****************************************/
1304 /************************************************************************/
1305 PyObject *
FORMAT_STRING(PyObject * obj,STRINGLIB_CHAR * format_spec,Py_ssize_t format_spec_len)1306 FORMAT_STRING(PyObject *obj,
1307               STRINGLIB_CHAR *format_spec,
1308               Py_ssize_t format_spec_len)
1309 {
1310     InternalFormatSpec format;
1311     PyObject *result = NULL;
1312 
1313     /* check for the special case of zero length format spec, make
1314        it equivalent to str(obj) */
1315     if (format_spec_len == 0) {
1316         result = STRINGLIB_TOSTR(obj);
1317         goto done;
1318     }
1319 
1320     /* parse the format_spec */
1321     if (!parse_internal_render_format_spec(format_spec, format_spec_len,
1322                                            &format, 's', '<'))
1323         goto done;
1324 
1325     /* type conversion? */
1326     switch (format.type) {
1327     case 's':
1328         /* no type conversion needed, already a string.  do the formatting */
1329         result = format_string_internal(obj, &format);
1330         break;
1331     default:
1332         /* unknown */
1333         unknown_presentation_type(format.type, obj->ob_type->tp_name);
1334         goto done;
1335     }
1336 
1337 done:
1338     return result;
1339 }
1340 
1341 #if defined FORMAT_LONG || defined FORMAT_INT
1342 static PyObject*
format_int_or_long(PyObject * obj,STRINGLIB_CHAR * format_spec,Py_ssize_t format_spec_len,IntOrLongToString tostring)1343 format_int_or_long(PyObject* obj,
1344                    STRINGLIB_CHAR *format_spec,
1345                    Py_ssize_t format_spec_len,
1346                    IntOrLongToString tostring)
1347 {
1348     PyObject *result = NULL;
1349     PyObject *tmp = NULL;
1350     InternalFormatSpec format;
1351 
1352     /* check for the special case of zero length format spec, make
1353        it equivalent to str(obj) */
1354     if (format_spec_len == 0) {
1355         result = STRINGLIB_TOSTR(obj);
1356         goto done;
1357     }
1358 
1359     /* parse the format_spec */
1360     if (!parse_internal_render_format_spec(format_spec,
1361                                            format_spec_len,
1362                                            &format, 'd', '>'))
1363         goto done;
1364 
1365     /* type conversion? */
1366     switch (format.type) {
1367     case 'b':
1368     case 'c':
1369     case 'd':
1370     case 'o':
1371     case 'x':
1372     case 'X':
1373     case 'n':
1374         /* no type conversion needed, already an int (or long).  do
1375            the formatting */
1376             result = format_int_or_long_internal(obj, &format, tostring);
1377         break;
1378 
1379     case 'e':
1380     case 'E':
1381     case 'f':
1382     case 'F':
1383     case 'g':
1384     case 'G':
1385     case '%':
1386         /* convert to float */
1387         tmp = PyNumber_Float(obj);
1388         if (tmp == NULL)
1389             goto done;
1390         result = format_float_internal(tmp, &format);
1391         break;
1392 
1393     default:
1394         /* unknown */
1395         unknown_presentation_type(format.type, obj->ob_type->tp_name);
1396         goto done;
1397     }
1398 
1399 done:
1400     Py_XDECREF(tmp);
1401     return result;
1402 }
1403 #endif /* FORMAT_LONG || defined FORMAT_INT */
1404 
1405 #ifdef FORMAT_LONG
1406 /* Need to define long_format as a function that will convert a long
1407    to a string.  In 3.0, _PyLong_Format has the correct signature.  In
1408    2.x, we need to fudge a few parameters */
1409 #if PY_VERSION_HEX >= 0x03000000
1410 #define long_format _PyLong_Format
1411 #else
1412 static PyObject*
long_format(PyObject * value,int base)1413 long_format(PyObject* value, int base)
1414 {
1415     /* Convert to base, don't add trailing 'L', and use the new octal
1416        format. We already know this is a long object */
1417     assert(PyLong_Check(value));
1418     /* convert to base, don't add 'L', and use the new octal format */
1419     return _PyLong_Format(value, base, 0, 1);
1420 }
1421 #endif
1422 
1423 PyObject *
FORMAT_LONG(PyObject * obj,STRINGLIB_CHAR * format_spec,Py_ssize_t format_spec_len)1424 FORMAT_LONG(PyObject *obj,
1425             STRINGLIB_CHAR *format_spec,
1426             Py_ssize_t format_spec_len)
1427 {
1428     return format_int_or_long(obj, format_spec, format_spec_len,
1429                               long_format);
1430 }
1431 #endif /* FORMAT_LONG */
1432 
1433 #ifdef FORMAT_INT
1434 /* this is only used for 2.x, not 3.0 */
1435 static PyObject*
int_format(PyObject * value,int base)1436 int_format(PyObject* value, int base)
1437 {
1438     /* Convert to base, and use the new octal format. We already
1439        know this is an int object */
1440     assert(PyInt_Check(value));
1441     return _PyInt_Format((PyIntObject*)value, base, 1);
1442 }
1443 
1444 PyObject *
FORMAT_INT(PyObject * obj,STRINGLIB_CHAR * format_spec,Py_ssize_t format_spec_len)1445 FORMAT_INT(PyObject *obj,
1446            STRINGLIB_CHAR *format_spec,
1447            Py_ssize_t format_spec_len)
1448 {
1449     return format_int_or_long(obj, format_spec, format_spec_len,
1450                               int_format);
1451 }
1452 #endif /* FORMAT_INT */
1453 
1454 #ifdef FORMAT_FLOAT
1455 PyObject *
FORMAT_FLOAT(PyObject * obj,STRINGLIB_CHAR * format_spec,Py_ssize_t format_spec_len)1456 FORMAT_FLOAT(PyObject *obj,
1457              STRINGLIB_CHAR *format_spec,
1458              Py_ssize_t format_spec_len)
1459 {
1460     PyObject *result = NULL;
1461     InternalFormatSpec format;
1462 
1463     /* check for the special case of zero length format spec, make
1464        it equivalent to str(obj) */
1465     if (format_spec_len == 0) {
1466         result = STRINGLIB_TOSTR(obj);
1467         goto done;
1468     }
1469 
1470     /* parse the format_spec */
1471     if (!parse_internal_render_format_spec(format_spec,
1472                                            format_spec_len,
1473                                            &format, '\0', '>'))
1474         goto done;
1475 
1476     /* type conversion? */
1477     switch (format.type) {
1478     case '\0': /* No format code: like 'g', but with at least one decimal. */
1479     case 'e':
1480     case 'E':
1481     case 'f':
1482     case 'F':
1483     case 'g':
1484     case 'G':
1485     case 'n':
1486     case '%':
1487         /* no conversion, already a float.  do the formatting */
1488         result = format_float_internal(obj, &format);
1489         break;
1490 
1491     default:
1492         /* unknown */
1493         unknown_presentation_type(format.type, obj->ob_type->tp_name);
1494         goto done;
1495     }
1496 
1497 done:
1498     return result;
1499 }
1500 #endif /* FORMAT_FLOAT */
1501 
1502 #ifdef FORMAT_COMPLEX
1503 PyObject *
FORMAT_COMPLEX(PyObject * obj,STRINGLIB_CHAR * format_spec,Py_ssize_t format_spec_len)1504 FORMAT_COMPLEX(PyObject *obj,
1505                STRINGLIB_CHAR *format_spec,
1506                Py_ssize_t format_spec_len)
1507 {
1508     PyObject *result = NULL;
1509     InternalFormatSpec format;
1510 
1511     /* check for the special case of zero length format spec, make
1512        it equivalent to str(obj) */
1513     if (format_spec_len == 0) {
1514         result = STRINGLIB_TOSTR(obj);
1515         goto done;
1516     }
1517 
1518     /* parse the format_spec */
1519     if (!parse_internal_render_format_spec(format_spec,
1520                                            format_spec_len,
1521                                            &format, '\0', '>'))
1522         goto done;
1523 
1524     /* type conversion? */
1525     switch (format.type) {
1526     case '\0': /* No format code: like 'g', but with at least one decimal. */
1527     case 'e':
1528     case 'E':
1529     case 'f':
1530     case 'F':
1531     case 'g':
1532     case 'G':
1533     case 'n':
1534         /* no conversion, already a complex.  do the formatting */
1535         result = format_complex_internal(obj, &format);
1536         break;
1537 
1538     default:
1539         /* unknown */
1540         unknown_presentation_type(format.type, obj->ob_type->tp_name);
1541         goto done;
1542     }
1543 
1544 done:
1545     return result;
1546 }
1547 #endif /* FORMAT_COMPLEX */
1548