xref: /openbsd-src/usr.bin/printf/printf.c (revision db3296cf5c1dd9058ceecc3a29fe4aaa0bd26000)
1 /*	$OpenBSD: printf.c,v 1.11 2003/06/23 16:40:44 millert Exp $	*/
2 
3 /*
4  * Copyright (c) 1989 The Regents of the University of California.
5  * All rights reserved.
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions
9  * are met:
10  * 1. Redistributions of source code must retain the above copyright
11  *    notice, this list of conditions and the following disclaimer.
12  * 2. Redistributions in binary form must reproduce the above copyright
13  *    notice, this list of conditions and the following disclaimer in the
14  *    documentation and/or other materials provided with the distribution.
15  * 3. Neither the name of the University nor the names of its contributors
16  *    may be used to endorse or promote products derived from this software
17  *    without specific prior written permission.
18  *
19  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
20  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
23  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29  * SUCH DAMAGE.
30  */
31 
32 #ifndef lint
33 #if !defined(SHELL) && !defined(BUILTIN)
34 char copyright[] =
35 "@(#) Copyright (c) 1989 The Regents of the University of California.\n\
36  All rights reserved.\n";
37 #endif
38 #endif /* not lint */
39 
40 #ifndef lint
41 /*static char sccsid[] = "from: @(#)printf.c	5.9 (Berkeley) 6/1/90";*/
42 static char rcsid[] = "$OpenBSD: printf.c,v 1.11 2003/06/23 16:40:44 millert Exp $";
43 #endif /* not lint */
44 
45 #include <ctype.h>
46 #include <stdio.h>
47 #include <stdlib.h>
48 #include <string.h>
49 #include <limits.h>
50 #include <locale.h>
51 #include <errno.h>
52 #include <err.h>
53 
54 static int	 print_escape_str(const char *);
55 static int	 print_escape(const char *);
56 
57 static int	 getchr(void);
58 static double	 getdouble(void);
59 static int	 getint(void);
60 static long	 getlong(void);
61 static unsigned long getulong(void);
62 static char	*getstr(void);
63 static char	*mklong(const char *, int);
64 static void      check_conversion(const char *, const char *);
65 static void	 usage(void);
66 
67 static int	rval;
68 static char  **gargv;
69 
/*
 * Character classification/conversion helpers for escape parsing.
 * All three evaluate their argument more than once (or could be extended
 * to), so do not pass expressions with side effects.
 */

/* Non-zero when c is one of the octal digit characters '0'..'7'. */
#define isodigit(c)	((c) >= '0' && (c) <= '7')

/* Numeric value of the octal (or decimal) digit character c. */
#define octtobin(c)	((c) - '0')

/*
 * Numeric value of the hexadecimal digit character c.  Every use of the
 * argument is parenthesized so that an expression argument (for example
 * `x & 0x7f' or a conditional expression) is converted as a whole.
 */
#define hextobin(c)	((c) >= 'A' && (c) <= 'F' ? (c) - 'A' + 10 : \
			 (c) >= 'a' && (c) <= 'f' ? (c) - 'a' + 10 : (c) - '0')
73 
74 #ifdef SHELL
75 #define main printfcmd
76 #include "../../bin/sh/bltin/bltin.h"
77 #include <stdarg.h>
78 
/*
 * Shell-builtin replacement for warnx(3): format the message into a
 * fixed-size local buffer (longer messages are truncated by vsnprintf)
 * and hand the result to the shell's error() routine.
 *
 * NOTE(review): error() is declared outside this file; if it treats its
 * first argument as a printf-style format, a '%' in the formatted text
 * would be re-interpreted -- confirm against bltin.h.
 */
static void
warnx(const char *fmt, ...)
{
	char msg[64];
	va_list args;

	va_start(args, fmt);
	vsnprintf(msg, sizeof(msg), fmt, args);
	va_end(args);

	error(msg);
}
92 #endif /* SHELL */
93 
94 #define PF(f, func) { \
95 	if (fieldwidth) \
96 		if (precision) \
97 			(void)printf(f, fieldwidth, precision, func); \
98 		else \
99 			(void)printf(f, fieldwidth, func); \
100 	else if (precision) \
101 		(void)printf(f, precision, func); \
102 	else \
103 		(void)printf(f, func); \
104 }
105 
106 int
107 #ifdef BUILTIN
108 progprintf(int argc, char *argv[])
109 #else
110 main(int argc, char *argv[])
111 #endif
112 {
113 	char *fmt, *start;
114 	int fieldwidth, precision;
115 	char convch, nextch;
116 	char *format;
117 	int ch;
118 
119 #if !defined(SHELL) && !defined(BUILTIN)
120 	setlocale (LC_ALL, "");
121 #endif
122 
123 	if (argc < 2) {
124 		usage();
125 		return (1);
126 	}
127 
128 	format = *++argv;
129 	gargv = ++argv;
130 
131 #define SKIP1	"#-+ 0"
132 #define SKIP2	"*0123456789"
133 	do {
134 		/*
135 		 * Basic algorithm is to scan the format string for conversion
136 		 * specifications -- once one is found, find out if the field
137 		 * width or precision is a '*'; if it is, gather up value.
138 		 * Note, format strings are reused as necessary to use up the
139 		 * provided arguments, arguments of zero/null string are
140 		 * provided to use up the format string.
141 		 */
142 
143 		/* find next format specification */
144 		for (fmt = format; *fmt; fmt++) {
145 			switch (*fmt) {
146 			case '%':
147 				start = fmt++;
148 
149 				if (*fmt == '%') {
150 					putchar ('%');
151 					break;
152 				} else if (*fmt == 'b') {
153 					char *p = getstr();
154 					if (print_escape_str(p)) {
155 						return (rval);
156 					}
157 					break;
158 				}
159 
160 				/* skip to field width */
161 				for (; strchr(SKIP1, *fmt); ++fmt) ;
162 				fieldwidth = *fmt == '*' ? getint() : 0;
163 
164 				/* skip to possible '.', get following precision */
165 				for (; strchr(SKIP2, *fmt); ++fmt) ;
166 				if (*fmt == '.')
167 					++fmt;
168 				precision = *fmt == '*' ? getint() : 0;
169 
170 				for (; strchr(SKIP2, *fmt); ++fmt) ;
171 				if (!*fmt) {
172 					warnx ("missing format character");
173 					return(1);
174 				}
175 
176 				convch = *fmt;
177 				nextch = *(fmt + 1);
178 				*(fmt + 1) = '\0';
179 				switch(convch) {
180 				case 'c': {
181 					char p = getchr();
182 					PF(start, p);
183 					break;
184 				}
185 				case 's': {
186 					char *p = getstr();
187 					PF(start, p);
188 					break;
189 				}
190 				case 'd':
191 				case 'i': {
192 					long p;
193 					char *f = mklong(start, convch);
194 					if (!f) {
195 						warnx("out of memory");
196 						return (1);
197 					}
198 					p = getlong();
199 					PF(f, p);
200 					break;
201 				}
202 				case 'o':
203 				case 'u':
204 				case 'x':
205 				case 'X': {
206 					unsigned long p;
207 					char *f = mklong(start, convch);
208 					if (!f) {
209 						warnx("out of memory");
210 						return (1);
211 					}
212 					p = getulong();
213 					PF(f, p);
214 					break;
215 				}
216 				case 'e':
217 				case 'E':
218 				case 'f':
219 				case 'g':
220 				case 'G': {
221 					double p = getdouble();
222 					PF(start, p);
223 					break;
224 				}
225 				default:
226 					warnx ("%s: invalid directive", start);
227 					return(1);
228 				}
229 				*(fmt + 1) = nextch;
230 				break;
231 
232 			case '\\':
233 				fmt += print_escape(fmt);
234 				break;
235 
236 			default:
237 				putchar (*fmt);
238 				break;
239 			}
240 		}
241 	} while (gargv > argv && *gargv);
242 
243 	return (rval);
244 }
245 
246 
/*
 * Print SysV echo(1) style escape string (the argument of a %b
 * conversion).
 *
 * Ordinary characters are written as-is.  `\0' followed by up to three
 * octal digits writes the corresponding byte, `\c' stops all output, and
 * every other backslash sequence is delegated to print_escape().
 *
 * Returns 1 if a \c escape was encountered (processing halts there),
 * 0 once the whole string has been printed.
 */
static int
print_escape_str(const char *str)
{
	int value;
	int c;

	while (*str) {
		if (*str == '\\') {
			str++;
			/*
			 * %b string octal constants are not like those in C.
			 * They start with a \0, and are followed by 0, 1, 2,
			 * or 3 octal digits.
			 */
			if (*str == '0') {
				str++;
				for (c = 3, value = 0; c-- && isodigit(*str); str++) {
					value <<= 3;
					value += octtobin(*str);
				}
				putchar (value);
				/* compensate for the str++ at the loop bottom */
				str--;
			} else if (*str == 'c') {
				return 1;
			} else {
				str--;
				str += print_escape(str);
				/*
				 * A trailing backslash can leave str on the
				 * terminator; stop here instead of letting
				 * the increment below step past the end.
				 */
				if (*str == '\0')
					break;
			}
		} else {
			putchar (*str);
		}
		str++;
	}

	return 0;
}
287 
288 /*
289  * Print "standard" escape characters
290  */
291 static int
292 print_escape(const char *str)
293 {
294 	const char *start = str;
295 	int value;
296 	int c;
297 
298 	str++;
299 
300 	switch (*str) {
301 	case '0': case '1': case '2': case '3':
302 	case '4': case '5': case '6': case '7':
303 		for (c = 3, value = 0; c-- && isodigit(*str); str++) {
304 			value <<= 3;
305 			value += octtobin(*str);
306 		}
307 		putchar(value);
308 		return str - start - 1;
309 		/* NOTREACHED */
310 
311 	case 'x':
312 		str++;
313 		for (value = 0; isxdigit(*str); str++) {
314 			value <<= 4;
315 			value += hextobin(*str);
316 		}
317 		if (value > UCHAR_MAX) {
318 			warnx ("escape sequence out of range for character");
319 			rval = 1;
320 		}
321 		putchar (value);
322 		return str - start - 1;
323 		/* NOTREACHED */
324 
325 	case '\\':			/* backslash */
326 		putchar('\\');
327 		break;
328 
329 	case '\'':			/* single quote */
330 		putchar('\'');
331 		break;
332 
333 	case '"':			/* double quote */
334 		putchar('"');
335 		break;
336 
337 	case 'a':			/* alert */
338 		putchar('\a');
339 		break;
340 
341 	case 'b':			/* backspace */
342 		putchar('\b');
343 		break;
344 
345 	case 'e':			/* escape */
346 #ifdef __GNUC__
347 		putchar('\e');
348 #else
349 		putchar(033);
350 #endif
351 		break;
352 
353 	case 'f':			/* form-feed */
354 		putchar('\f');
355 		break;
356 
357 	case 'n':			/* newline */
358 		putchar('\n');
359 		break;
360 
361 	case 'r':			/* carriage-return */
362 		putchar('\r');
363 		break;
364 
365 	case 't':			/* tab */
366 		putchar('\t');
367 		break;
368 
369 	case 'v':			/* vertical-tab */
370 		putchar('\v');
371 		break;
372 
373 	default:
374 		putchar(*str);
375 		warnx("unknown escape sequence `\\%c'", *str);
376 		rval = 1;
377 	}
378 
379 	return 1;
380 }
381 
/*
 * Build a copy of the conversion specification str in which an `l'
 * length modifier is inserted in front of the final conversion
 * character: everything but the last character of str is copied, then
 * 'l', ch and a terminating NUL are appended.
 *
 * The result lives in a function-static buffer that is grown on demand
 * and reused by later calls.  Returns NULL (after releasing the buffer)
 * when the buffer cannot be enlarged.
 */
static char *
mklong(const char *str, int ch)
{
	static char *buf;
	static int bufsize;
	int need, tail;

	/* room for str plus the extra 'l' and the terminator */
	need = strlen(str) + 2;
	if (need > bufsize) {
		char *grown;

		bufsize = need + 256;
		grown = realloc(buf, bufsize);
		if (grown == NULL) {
			free(buf);
			buf = NULL;
			bufsize = 0;
			return (NULL);
		}
		buf = grown;
	}

	/* offset at which the 'l' goes: length of str minus its last char */
	tail = need - 3;
	(void) memmove(buf, str, tail);
	buf[tail] = 'l';
	buf[tail + 1] = ch;
	buf[tail + 2] = '\0';
	return (buf);
}
409 
410 static int
411 getchr(void)
412 {
413 	if (!*gargv)
414 		return((int)'\0');
415 	return((int)**gargv++);
416 }
417 
418 static char *
419 getstr(void)
420 {
421 	if (!*gargv)
422 		return("");
423 	return(*gargv++);
424 }
425 
426 static char *number = "+-.0123456789";
427 static int
428 getint(void)
429 {
430 	if (!*gargv)
431 		return(0);
432 
433 	if (strchr(number, **gargv))
434 		return(atoi(*gargv++));
435 
436 	return 0;
437 }
438 
439 static long
440 getlong(void)
441 {
442 	long val;
443 	char *ep;
444 
445 	if (!*gargv)
446 		return(0L);
447 
448 	if (**gargv == '\"' || **gargv == '\'')
449 		return (long) *((*gargv++)+1);
450 
451 	errno = 0;
452 	val = strtol (*gargv, &ep, 0);
453 	check_conversion(*gargv++, ep);
454 	return val;
455 }
456 
457 static unsigned long
458 getulong(void)
459 {
460 	unsigned long val;
461 	char *ep;
462 
463 	if (!*gargv)
464 		return(0UL);
465 
466 	if (**gargv == '\"' || **gargv == '\'')
467 		return (unsigned long) *((*gargv++)+1);
468 
469 	errno = 0;
470 	val = strtoul (*gargv, &ep, 0);
471 	check_conversion(*gargv++, ep);
472 	return val;
473 }
474 
475 static double
476 getdouble(void)
477 {
478 	double val;
479 	char *ep;
480 
481 	if (!*gargv)
482 		return(0.0);
483 
484 	if (**gargv == '\"' || **gargv == '\'')
485 		return (double) *((*gargv++)+1);
486 
487 	errno = 0;
488 	val = strtod (*gargv, &ep);
489 	check_conversion(*gargv++, ep);
490 	return val;
491 }
492 
493 static void
494 check_conversion(const char *s, const char *ep)
495 {
496 	if (*ep) {
497 		if (ep == s)
498 			warnx ("%s: expected numeric value", s);
499 		else
500 			warnx ("%s: not completely converted", s);
501 		rval = 1;
502 	} else if (errno == ERANGE) {
503 		warnx ("%s: %s", s, strerror(ERANGE));
504 		rval = 1;
505 	}
506 }
507 
/*
 * Write the one-line usage synopsis to standard error.
 */
static void
usage(void)
{
	(void)fputs("usage: printf format [arg ...]\n", stderr);
}
513