1*946379e7Schristos /* Emacs Lisp format strings.
2*946379e7Schristos Copyright (C) 2001-2004, 2006 Free Software Foundation, Inc.
3*946379e7Schristos Written by Bruno Haible <haible@clisp.cons.org>, 2002.
4*946379e7Schristos
5*946379e7Schristos This program is free software; you can redistribute it and/or modify
6*946379e7Schristos it under the terms of the GNU General Public License as published by
7*946379e7Schristos the Free Software Foundation; either version 2, or (at your option)
8*946379e7Schristos any later version.
9*946379e7Schristos
10*946379e7Schristos This program is distributed in the hope that it will be useful,
11*946379e7Schristos but WITHOUT ANY WARRANTY; without even the implied warranty of
12*946379e7Schristos MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13*946379e7Schristos GNU General Public License for more details.
14*946379e7Schristos
15*946379e7Schristos You should have received a copy of the GNU General Public License
16*946379e7Schristos along with this program; if not, write to the Free Software Foundation,
17*946379e7Schristos Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */
18*946379e7Schristos
19*946379e7Schristos #ifdef HAVE_CONFIG_H
20*946379e7Schristos # include <config.h>
21*946379e7Schristos #endif
22*946379e7Schristos
23*946379e7Schristos #include <stdbool.h>
24*946379e7Schristos #include <stdlib.h>
25*946379e7Schristos
26*946379e7Schristos #include "format.h"
27*946379e7Schristos #include "c-ctype.h"
28*946379e7Schristos #include "xalloc.h"
29*946379e7Schristos #include "xvasprintf.h"
30*946379e7Schristos #include "format-invalid.h"
31*946379e7Schristos #include "gettext.h"
32*946379e7Schristos
33*946379e7Schristos #define _(str) gettext (str)
34*946379e7Schristos
/* Emacs Lisp format strings are implemented in emacs-21.1/src/editfns.c,
   xemacs-21.1.14/src/editfns.c and xemacs-21.1.14/src/doprnt.c.
   A directive
   - starts with '%' or '%m$' where m is a positive integer,
   - is optionally followed by any of the characters '#', '0', '-', ' ', '+',
     each of which acts as a flag,
   - is optionally followed by a width specification: '*' (reads an argument)
     or a nonempty digit sequence,
   - is optionally followed by '.' and a precision specification: '*' (reads
     an argument) or a nonempty digit sequence,
   - is finished by a specifier
       - '%', that needs no argument,
       - 'c', that needs a character argument,
       - 'd', 'i', 'x', 'X', 'o', that need an integer argument,
       - 'e', 'E', 'f', 'g', 'G', that need a floating-point argument,
       - 's', that needs an argument and prints it using princ,
       - 'S', that needs an argument and prints it using prin1.
   Numbered ('%m$') and unnumbered argument specifications can be used in the
   same string.  The effect of '%m$' is to set the current argument number to
   m.  The current argument number is incremented after processing a directive.
 */
56*946379e7Schristos
/* Kind of argument that a directive consumes.  */
enum format_arg_type
{
  FAT_NONE = 0,         /* no argument (the '%%' directive); also used as the
                           merged type of conflicting duplicate references */
  FAT_CHARACTER,        /* 'c' */
  FAT_INTEGER,          /* 'd', 'i', 'x', 'X', 'o', and '*' width/precision */
  FAT_FLOAT,            /* 'e', 'E', 'f', 'g', 'G' */
  FAT_OBJECT_PRETTY,    /* 's' */
  FAT_OBJECT            /* 'S' */
};
66*946379e7Schristos
67*946379e7Schristos struct numbered_arg
68*946379e7Schristos {
69*946379e7Schristos unsigned int number;
70*946379e7Schristos enum format_arg_type type;
71*946379e7Schristos };
72*946379e7Schristos
/* Parsed description of one format string.  */
struct spec
{
  /* Number of '%' directives encountered.  */
  unsigned int directives;
  /* Number of entries of NUMBERED that are in use.  */
  unsigned int numbered_arg_count;
  /* Number of entries NUMBERED has room for.  */
  unsigned int allocated;
  /* Heap-allocated array of argument references, or NULL when empty.  */
  struct numbered_arg *numbered;
};
80*946379e7Schristos
/* Locale independent test for an ASCII decimal digit.
   Unlike <ctype.h> isdigit, which requires an 'unsigned char' value, this
   accepts plain 'char' as well: any value below '0' wraps around to a large
   unsigned number and is rejected by the single comparison.  */
#undef isdigit
#define isdigit(c) ((unsigned int) ((c) - '0') <= 9)
86*946379e7Schristos
87*946379e7Schristos
88*946379e7Schristos static int
numbered_arg_compare(const void * p1,const void * p2)89*946379e7Schristos numbered_arg_compare (const void *p1, const void *p2)
90*946379e7Schristos {
91*946379e7Schristos unsigned int n1 = ((const struct numbered_arg *) p1)->number;
92*946379e7Schristos unsigned int n2 = ((const struct numbered_arg *) p2)->number;
93*946379e7Schristos
94*946379e7Schristos return (n1 > n2 ? 1 : n1 < n2 ? -1 : 0);
95*946379e7Schristos }
96*946379e7Schristos
97*946379e7Schristos static void *
format_parse(const char * format,bool translated,char ** invalid_reason)98*946379e7Schristos format_parse (const char *format, bool translated, char **invalid_reason)
99*946379e7Schristos {
100*946379e7Schristos struct spec spec;
101*946379e7Schristos struct spec *result;
102*946379e7Schristos unsigned int number;
103*946379e7Schristos
104*946379e7Schristos spec.directives = 0;
105*946379e7Schristos spec.numbered_arg_count = 0;
106*946379e7Schristos spec.allocated = 0;
107*946379e7Schristos spec.numbered = NULL;
108*946379e7Schristos number = 1;
109*946379e7Schristos
110*946379e7Schristos for (; *format != '\0';)
111*946379e7Schristos if (*format++ == '%')
112*946379e7Schristos {
113*946379e7Schristos /* A directive. */
114*946379e7Schristos enum format_arg_type type;
115*946379e7Schristos
116*946379e7Schristos spec.directives++;
117*946379e7Schristos
118*946379e7Schristos if (isdigit (*format))
119*946379e7Schristos {
120*946379e7Schristos const char *f = format;
121*946379e7Schristos unsigned int m = 0;
122*946379e7Schristos
123*946379e7Schristos do
124*946379e7Schristos {
125*946379e7Schristos m = 10 * m + (*f - '0');
126*946379e7Schristos f++;
127*946379e7Schristos }
128*946379e7Schristos while (isdigit (*f));
129*946379e7Schristos
130*946379e7Schristos if (*f == '$' && m > 0)
131*946379e7Schristos {
132*946379e7Schristos number = m;
133*946379e7Schristos format = ++f;
134*946379e7Schristos }
135*946379e7Schristos }
136*946379e7Schristos
137*946379e7Schristos /* Parse flags. */
138*946379e7Schristos while (*format == ' ' || *format == '+' || *format == '-'
139*946379e7Schristos || *format == '#' || *format == '0')
140*946379e7Schristos format++;
141*946379e7Schristos
142*946379e7Schristos /* Parse width. */
143*946379e7Schristos if (*format == '*')
144*946379e7Schristos {
145*946379e7Schristos format++;
146*946379e7Schristos
147*946379e7Schristos if (spec.allocated == spec.numbered_arg_count)
148*946379e7Schristos {
149*946379e7Schristos spec.allocated = 2 * spec.allocated + 1;
150*946379e7Schristos spec.numbered = (struct numbered_arg *) xrealloc (spec.numbered, spec.allocated * sizeof (struct numbered_arg));
151*946379e7Schristos }
152*946379e7Schristos spec.numbered[spec.numbered_arg_count].number = number;
153*946379e7Schristos spec.numbered[spec.numbered_arg_count].type = FAT_INTEGER;
154*946379e7Schristos spec.numbered_arg_count++;
155*946379e7Schristos
156*946379e7Schristos number++;
157*946379e7Schristos }
158*946379e7Schristos else if (isdigit (*format))
159*946379e7Schristos {
160*946379e7Schristos do format++; while (isdigit (*format));
161*946379e7Schristos }
162*946379e7Schristos
163*946379e7Schristos /* Parse precision. */
164*946379e7Schristos if (*format == '.')
165*946379e7Schristos {
166*946379e7Schristos format++;
167*946379e7Schristos
168*946379e7Schristos if (*format == '*')
169*946379e7Schristos {
170*946379e7Schristos format++;
171*946379e7Schristos
172*946379e7Schristos if (spec.allocated == spec.numbered_arg_count)
173*946379e7Schristos {
174*946379e7Schristos spec.allocated = 2 * spec.allocated + 1;
175*946379e7Schristos spec.numbered = (struct numbered_arg *) xrealloc (spec.numbered, spec.allocated * sizeof (struct numbered_arg));
176*946379e7Schristos }
177*946379e7Schristos spec.numbered[spec.numbered_arg_count].number = number;
178*946379e7Schristos spec.numbered[spec.numbered_arg_count].type = FAT_INTEGER;
179*946379e7Schristos spec.numbered_arg_count++;
180*946379e7Schristos
181*946379e7Schristos number++;
182*946379e7Schristos }
183*946379e7Schristos else if (isdigit (*format))
184*946379e7Schristos {
185*946379e7Schristos do format++; while (isdigit (*format));
186*946379e7Schristos }
187*946379e7Schristos }
188*946379e7Schristos
189*946379e7Schristos switch (*format)
190*946379e7Schristos {
191*946379e7Schristos case '%':
192*946379e7Schristos type = FAT_NONE;
193*946379e7Schristos break;
194*946379e7Schristos case 'c':
195*946379e7Schristos type = FAT_CHARACTER;
196*946379e7Schristos break;
197*946379e7Schristos case 'd': case 'i': case 'x': case 'X': case 'o':
198*946379e7Schristos type = FAT_INTEGER;
199*946379e7Schristos break;
200*946379e7Schristos case 'e': case 'E': case 'f': case 'g': case 'G':
201*946379e7Schristos type = FAT_FLOAT;
202*946379e7Schristos break;
203*946379e7Schristos case 's':
204*946379e7Schristos type = FAT_OBJECT_PRETTY;
205*946379e7Schristos break;
206*946379e7Schristos case 'S':
207*946379e7Schristos type = FAT_OBJECT;
208*946379e7Schristos break;
209*946379e7Schristos default:
210*946379e7Schristos *invalid_reason =
211*946379e7Schristos (*format == '\0'
212*946379e7Schristos ? INVALID_UNTERMINATED_DIRECTIVE ()
213*946379e7Schristos : INVALID_CONVERSION_SPECIFIER (spec.directives, *format));
214*946379e7Schristos goto bad_format;
215*946379e7Schristos }
216*946379e7Schristos
217*946379e7Schristos if (type != FAT_NONE)
218*946379e7Schristos {
219*946379e7Schristos if (spec.allocated == spec.numbered_arg_count)
220*946379e7Schristos {
221*946379e7Schristos spec.allocated = 2 * spec.allocated + 1;
222*946379e7Schristos spec.numbered = (struct numbered_arg *) xrealloc (spec.numbered, spec.allocated * sizeof (struct numbered_arg));
223*946379e7Schristos }
224*946379e7Schristos spec.numbered[spec.numbered_arg_count].number = number;
225*946379e7Schristos spec.numbered[spec.numbered_arg_count].type = type;
226*946379e7Schristos spec.numbered_arg_count++;
227*946379e7Schristos
228*946379e7Schristos number++;
229*946379e7Schristos }
230*946379e7Schristos
231*946379e7Schristos format++;
232*946379e7Schristos }
233*946379e7Schristos
234*946379e7Schristos /* Sort the numbered argument array, and eliminate duplicates. */
235*946379e7Schristos if (spec.numbered_arg_count > 1)
236*946379e7Schristos {
237*946379e7Schristos unsigned int i, j;
238*946379e7Schristos bool err;
239*946379e7Schristos
240*946379e7Schristos qsort (spec.numbered, spec.numbered_arg_count,
241*946379e7Schristos sizeof (struct numbered_arg), numbered_arg_compare);
242*946379e7Schristos
243*946379e7Schristos /* Remove duplicates: Copy from i to j, keeping 0 <= j <= i. */
244*946379e7Schristos err = false;
245*946379e7Schristos for (i = j = 0; i < spec.numbered_arg_count; i++)
246*946379e7Schristos if (j > 0 && spec.numbered[i].number == spec.numbered[j-1].number)
247*946379e7Schristos {
248*946379e7Schristos enum format_arg_type type1 = spec.numbered[i].type;
249*946379e7Schristos enum format_arg_type type2 = spec.numbered[j-1].type;
250*946379e7Schristos enum format_arg_type type_both;
251*946379e7Schristos
252*946379e7Schristos if (type1 == type2)
253*946379e7Schristos type_both = type1;
254*946379e7Schristos else
255*946379e7Schristos {
256*946379e7Schristos /* Incompatible types. */
257*946379e7Schristos type_both = FAT_NONE;
258*946379e7Schristos if (!err)
259*946379e7Schristos *invalid_reason =
260*946379e7Schristos INVALID_INCOMPATIBLE_ARG_TYPES (spec.numbered[i].number);
261*946379e7Schristos err = true;
262*946379e7Schristos }
263*946379e7Schristos
264*946379e7Schristos spec.numbered[j-1].type = type_both;
265*946379e7Schristos }
266*946379e7Schristos else
267*946379e7Schristos {
268*946379e7Schristos if (j < i)
269*946379e7Schristos {
270*946379e7Schristos spec.numbered[j].number = spec.numbered[i].number;
271*946379e7Schristos spec.numbered[j].type = spec.numbered[i].type;
272*946379e7Schristos }
273*946379e7Schristos j++;
274*946379e7Schristos }
275*946379e7Schristos spec.numbered_arg_count = j;
276*946379e7Schristos if (err)
277*946379e7Schristos /* *invalid_reason has already been set above. */
278*946379e7Schristos goto bad_format;
279*946379e7Schristos }
280*946379e7Schristos
281*946379e7Schristos result = (struct spec *) xmalloc (sizeof (struct spec));
282*946379e7Schristos *result = spec;
283*946379e7Schristos return result;
284*946379e7Schristos
285*946379e7Schristos bad_format:
286*946379e7Schristos if (spec.numbered != NULL)
287*946379e7Schristos free (spec.numbered);
288*946379e7Schristos return NULL;
289*946379e7Schristos }
290*946379e7Schristos
291*946379e7Schristos static void
format_free(void * descr)292*946379e7Schristos format_free (void *descr)
293*946379e7Schristos {
294*946379e7Schristos struct spec *spec = (struct spec *) descr;
295*946379e7Schristos
296*946379e7Schristos if (spec->numbered != NULL)
297*946379e7Schristos free (spec->numbered);
298*946379e7Schristos free (spec);
299*946379e7Schristos }
300*946379e7Schristos
301*946379e7Schristos static int
format_get_number_of_directives(void * descr)302*946379e7Schristos format_get_number_of_directives (void *descr)
303*946379e7Schristos {
304*946379e7Schristos struct spec *spec = (struct spec *) descr;
305*946379e7Schristos
306*946379e7Schristos return spec->directives;
307*946379e7Schristos }
308*946379e7Schristos
309*946379e7Schristos static bool
format_check(void * msgid_descr,void * msgstr_descr,bool equality,formatstring_error_logger_t error_logger,const char * pretty_msgstr)310*946379e7Schristos format_check (void *msgid_descr, void *msgstr_descr, bool equality,
311*946379e7Schristos formatstring_error_logger_t error_logger,
312*946379e7Schristos const char *pretty_msgstr)
313*946379e7Schristos {
314*946379e7Schristos struct spec *spec1 = (struct spec *) msgid_descr;
315*946379e7Schristos struct spec *spec2 = (struct spec *) msgstr_descr;
316*946379e7Schristos bool err = false;
317*946379e7Schristos
318*946379e7Schristos if (spec1->numbered_arg_count + spec2->numbered_arg_count > 0)
319*946379e7Schristos {
320*946379e7Schristos unsigned int i, j;
321*946379e7Schristos unsigned int n1 = spec1->numbered_arg_count;
322*946379e7Schristos unsigned int n2 = spec2->numbered_arg_count;
323*946379e7Schristos
324*946379e7Schristos /* Check the argument names are the same.
325*946379e7Schristos Both arrays are sorted. We search for the first difference. */
326*946379e7Schristos for (i = 0, j = 0; i < n1 || j < n2; )
327*946379e7Schristos {
328*946379e7Schristos int cmp = (i >= n1 ? 1 :
329*946379e7Schristos j >= n2 ? -1 :
330*946379e7Schristos spec1->numbered[i].number > spec2->numbered[j].number ? 1 :
331*946379e7Schristos spec1->numbered[i].number < spec2->numbered[j].number ? -1 :
332*946379e7Schristos 0);
333*946379e7Schristos
334*946379e7Schristos if (cmp > 0)
335*946379e7Schristos {
336*946379e7Schristos if (error_logger)
337*946379e7Schristos error_logger (_("a format specification for argument %u, as in '%s', doesn't exist in 'msgid'"),
338*946379e7Schristos spec2->numbered[j].number, pretty_msgstr);
339*946379e7Schristos err = true;
340*946379e7Schristos break;
341*946379e7Schristos }
342*946379e7Schristos else if (cmp < 0)
343*946379e7Schristos {
344*946379e7Schristos if (equality)
345*946379e7Schristos {
346*946379e7Schristos if (error_logger)
347*946379e7Schristos error_logger (_("a format specification for argument %u doesn't exist in '%s'"),
348*946379e7Schristos spec1->numbered[i].number, pretty_msgstr);
349*946379e7Schristos err = true;
350*946379e7Schristos break;
351*946379e7Schristos }
352*946379e7Schristos else
353*946379e7Schristos i++;
354*946379e7Schristos }
355*946379e7Schristos else
356*946379e7Schristos j++, i++;
357*946379e7Schristos }
358*946379e7Schristos /* Check the argument types are the same. */
359*946379e7Schristos if (!err)
360*946379e7Schristos for (i = 0, j = 0; j < n2; )
361*946379e7Schristos {
362*946379e7Schristos if (spec1->numbered[i].number == spec2->numbered[j].number)
363*946379e7Schristos {
364*946379e7Schristos if (spec1->numbered[i].type != spec2->numbered[j].type)
365*946379e7Schristos {
366*946379e7Schristos if (error_logger)
367*946379e7Schristos error_logger (_("format specifications in 'msgid' and '%s' for argument %u are not the same"),
368*946379e7Schristos pretty_msgstr, spec2->numbered[j].number);
369*946379e7Schristos err = true;
370*946379e7Schristos break;
371*946379e7Schristos }
372*946379e7Schristos j++, i++;
373*946379e7Schristos }
374*946379e7Schristos else
375*946379e7Schristos i++;
376*946379e7Schristos }
377*946379e7Schristos }
378*946379e7Schristos
379*946379e7Schristos return err;
380*946379e7Schristos }
381*946379e7Schristos
382*946379e7Schristos
383*946379e7Schristos struct formatstring_parser formatstring_elisp =
384*946379e7Schristos {
385*946379e7Schristos format_parse,
386*946379e7Schristos format_free,
387*946379e7Schristos format_get_number_of_directives,
388*946379e7Schristos NULL,
389*946379e7Schristos format_check
390*946379e7Schristos };
391*946379e7Schristos
392*946379e7Schristos
393*946379e7Schristos #ifdef TEST
394*946379e7Schristos
395*946379e7Schristos /* Test program: Print the argument list specification returned by
396*946379e7Schristos format_parse for strings read from standard input. */
397*946379e7Schristos
398*946379e7Schristos #include <stdio.h>
399*946379e7Schristos #include "getline.h"
400*946379e7Schristos
401*946379e7Schristos static void
format_print(void * descr)402*946379e7Schristos format_print (void *descr)
403*946379e7Schristos {
404*946379e7Schristos struct spec *spec = (struct spec *) descr;
405*946379e7Schristos unsigned int last;
406*946379e7Schristos unsigned int i;
407*946379e7Schristos
408*946379e7Schristos if (spec == NULL)
409*946379e7Schristos {
410*946379e7Schristos printf ("INVALID");
411*946379e7Schristos return;
412*946379e7Schristos }
413*946379e7Schristos
414*946379e7Schristos printf ("(");
415*946379e7Schristos last = 1;
416*946379e7Schristos for (i = 0; i < spec->numbered_arg_count; i++)
417*946379e7Schristos {
418*946379e7Schristos unsigned int number = spec->numbered[i].number;
419*946379e7Schristos
420*946379e7Schristos if (i > 0)
421*946379e7Schristos printf (" ");
422*946379e7Schristos if (number < last)
423*946379e7Schristos abort ();
424*946379e7Schristos for (; last < number; last++)
425*946379e7Schristos printf ("_ ");
426*946379e7Schristos switch (spec->numbered[i].type)
427*946379e7Schristos {
428*946379e7Schristos case FAT_CHARACTER:
429*946379e7Schristos printf ("c");
430*946379e7Schristos break;
431*946379e7Schristos case FAT_INTEGER:
432*946379e7Schristos printf ("i");
433*946379e7Schristos break;
434*946379e7Schristos case FAT_FLOAT:
435*946379e7Schristos printf ("f");
436*946379e7Schristos break;
437*946379e7Schristos case FAT_OBJECT_PRETTY:
438*946379e7Schristos printf ("s");
439*946379e7Schristos break;
440*946379e7Schristos case FAT_OBJECT:
441*946379e7Schristos printf ("*");
442*946379e7Schristos break;
443*946379e7Schristos default:
444*946379e7Schristos abort ();
445*946379e7Schristos }
446*946379e7Schristos last = number + 1;
447*946379e7Schristos }
448*946379e7Schristos printf (")");
449*946379e7Schristos }
450*946379e7Schristos
/* Test driver: read format strings from standard input, one per line, and
   print the parsed argument list of each (followed by the reason when the
   string is invalid).  Stops at end of input or on a read error.  */
int
main (void)
{
  for (;;)
    {
      char *line = NULL;
      size_t line_size = 0;
      int line_len;
      char *invalid_reason;
      void *descr;

      line_len = getline (&line, &line_size, stdin);
      if (line_len < 0)
        {
          /* getline may have allocated a buffer even though it failed.  */
          free (line);
          break;
        }
      /* Strip the trailing newline so it is not parsed as part of the
         format string.  */
      if (line_len > 0 && line[line_len - 1] == '\n')
        line[--line_len] = '\0';

      invalid_reason = NULL;
      descr = format_parse (line, false, &invalid_reason);

      format_print (descr);
      printf ("\n");
      if (descr == NULL)
        printf ("%s\n", invalid_reason);
      else
        /* Release the parsed descriptor; it is not needed after printing.  */
        format_free (descr);

      free (invalid_reason);
      free (line);
    }

  return 0;
}
482*946379e7Schristos
483*946379e7Schristos /*
484*946379e7Schristos * For Emacs M-x compile
485*946379e7Schristos * Local Variables:
486*946379e7Schristos * compile-command: "/bin/sh ../libtool --mode=link gcc -o a.out -static -O -g -Wall -I.. -I../lib -I../intl -DHAVE_CONFIG_H -DTEST format-elisp.c ../lib/libgettextlib.la"
487*946379e7Schristos * End:
488*946379e7Schristos */
489*946379e7Schristos
490*946379e7Schristos #endif /* TEST */
491