Print this page
4854 printf(1) doesn't support %b and \c properly
4818 printf(1) should support n$ width and precision specifiers
Split |
Close |
Expand all |
Collapse all |
--- old/usr/src/cmd/printf/printf.c
+++ new/usr/src/cmd/printf/printf.c
1 1 /*
2 + * Copyright 2014 Garrett D'Amore <garrett@damore.org>
2 3 * Copyright 2010 Nexenta Systems, Inc. All rights reserved.
3 4 * Copyright (c) 1989, 1993
4 5 * The Regents of the University of California. All rights reserved.
5 6 *
6 7 * Redistribution and use in source and binary forms, with or without
7 8 * modification, are permitted provided that the following conditions
8 9 * are met:
9 10 * 1. Redistributions of source code must retain the above copyright
10 11 * notice, this list of conditions and the following disclaimer.
11 12 * 2. Redistributions in binary form must reproduce the above copyright
12 13 * notice, this list of conditions and the following disclaimer in the
13 14 * documentation and/or other materials provided with the distribution.
14 15 * 4. Neither the name of the University nor the names of its contributors
15 16 * may be used to endorse or promote products derived from this software
16 17 * without specific prior written permission.
17 18 *
18 19 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
19 20 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20 21 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21 22 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
22 23 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
23 24 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
24 25 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
25 26 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
26 27 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
27 28 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
28 29 * SUCH DAMAGE.
29 30 */
30 31
↓ open down ↓ |
19 lines elided |
↑ open up ↑ |
31 32 #include <sys/types.h>
32 33
33 34 #include <err.h>
34 35 #include <errno.h>
35 36 #include <inttypes.h>
36 37 #include <limits.h>
37 38 #include <stdio.h>
38 39 #include <stdlib.h>
39 40 #include <string.h>
40 41 #include <unistd.h>
42 +#include <alloca.h>
43 +#include <ctype.h>
41 44 #include <locale.h>
42 45 #include <note.h>
43 46
44 47 #define warnx1(a, b, c) warnx(a)
45 48 #define warnx2(a, b, c) warnx(a, b)
46 49 #define warnx3(a, b, c) warnx(a, b, c)
47 50
48 51 #define PTRDIFF(x, y) ((uintptr_t)(x) - (uintptr_t)(y))
49 52
50 53 #define _(x) gettext(x)
51 54
52 55 #define PF(f, func) do { \
53 56 char *b = NULL; \
54 - int dollar = 0; \
55 - if (*f == '$') { \
56 - dollar++; \
57 - *f = '%'; \
58 - } \
59 57 if (havewidth) \
60 58 if (haveprec) \
61 59 (void) asprintf(&b, f, fieldwidth, precision, func); \
62 60 else \
63 61 (void) asprintf(&b, f, fieldwidth, func); \
64 62 else if (haveprec) \
65 63 (void) asprintf(&b, f, precision, func); \
66 64 else \
67 65 (void) asprintf(&b, f, func); \
68 66 if (b) { \
69 67 (void) fputs(b, stdout); \
70 68 free(b); \
71 69 } \
72 - if (dollar) \
73 - *f = '$'; \
74 70 _NOTE(CONSTCOND) } while (0)
75 71
76 72 static int asciicode(void);
77 73 static char *doformat(char *, int *);
78 74 static int escape(char *, int, size_t *);
79 75 static int getchr(void);
80 76 static int getfloating(long double *, int);
81 77 static int getint(int *);
82 78 static int getnum(intmax_t *, uintmax_t *, int);
83 79 static const char
84 80 *getstr(void);
85 81 static char *mknum(char *, char);
86 82 static void usage(void);
87 83
84 +static const char digits[] = "0123456789";
85 +
88 86 static int myargc;
89 87 static char **myargv;
90 88 static char **gargv;
89 +static char **maxargv;
91 90
92 91 int
93 92 main(int argc, char *argv[])
94 93 {
95 94 size_t len;
96 - int chopped, end, rval;
95 + int end, rval;
97 96 char *format, *fmt, *start;
98 97
99 98 (void) setlocale(LC_ALL, "");
100 99
101 100 argv++;
102 101 argc--;
103 102
104 103 /*
105 104 * POSIX says: Standard utilities that do not accept options,
106 105 * but that do accept operands, shall recognize "--" as a
107 106 * first argument to be discarded.
108 107 */
109 108 if (argc && strcmp(argv[0], "--") == 0) {
110 109 argc--;
111 110 argv++;
112 111 }
113 112
114 113 if (argc < 1) {
115 114 usage();
116 115 return (1);
117 116 }
↓ open down ↓ |
11 lines elided |
↑ open up ↑ |
118 117
119 118 /*
120 119 * Basic algorithm is to scan the format string for conversion
121 120 * specifications -- once one is found, find out if the field
122 121 * width or precision is a '*'; if it is, gather up value. Note,
123 122 * format strings are reused as necessary to use up the provided
124 123 * arguments, arguments of zero/null string are provided to use
125 124 * up the format string.
126 125 */
127 126 fmt = format = *argv;
128 - chopped = escape(fmt, 1, &len); /* backslash interpretation */
127 + (void) escape(fmt, 1, &len); /* backslash interpretation */
129 128 rval = end = 0;
130 129 gargv = ++argv;
131 130
132 131 for (;;) {
133 - char **maxargv = gargv;
132 + maxargv = gargv;
134 133
135 134 myargv = gargv;
136 135 for (myargc = 0; gargv[myargc]; myargc++)
137 136 /* nop */;
138 137 start = fmt;
139 138 while (fmt < format + len) {
140 139 if (fmt[0] == '%') {
141 140 (void) fwrite(start, 1, PTRDIFF(fmt, start),
142 141 stdout);
143 142 if (fmt[1] == '%') {
144 143 /* %% prints a % */
145 144 (void) putchar('%');
146 145 fmt += 2;
147 146 } else {
148 147 fmt = doformat(fmt, &rval);
149 148 if (fmt == NULL)
150 149 return (1);
151 150 end = 0;
152 151 }
153 152 start = fmt;
154 153 } else
155 154 fmt++;
↓ open down ↓ |
12 lines elided |
↑ open up ↑ |
156 155 if (gargv > maxargv)
157 156 maxargv = gargv;
158 157 }
159 158 gargv = maxargv;
160 159
161 160 if (end == 1) {
162 161 warnx1(_("missing format character"), NULL, NULL);
163 162 return (1);
164 163 }
165 164 (void) fwrite(start, 1, PTRDIFF(fmt, start), stdout);
166 - if (chopped || !*gargv)
165 + if (!*gargv)
167 166 return (rval);
168 167 /* Restart at the beginning of the format string. */
169 168 fmt = format;
170 169 end = 1;
171 170 }
172 171 /* NOTREACHED */
173 172 }
174 173
175 174
176 175 static char *
177 -doformat(char *start, int *rval)
176 +doformat(char *fmt, int *rval)
178 177 {
179 178 static const char skip1[] = "#'-+ 0";
180 - static const char skip2[] = "0123456789";
181 - char *fmt;
182 179 int fieldwidth, haveprec, havewidth, mod_ldbl, precision;
183 180 char convch, nextch;
181 + char *start;
182 + char **fargv;
183 + char *dptr;
184 + int l;
184 185
185 - fmt = start + 1;
186 + start = alloca(strlen(fmt) + 1);
186 187
188 + dptr = start;
189 + *dptr++ = '%';
190 + *dptr = 0;
191 +
192 + fmt++;
193 +
187 194 /* look for "n$" field index specifier */
188 - fmt += strspn(fmt, skip2);
189 - if ((*fmt == '$') && (fmt != (start + 1))) {
190 - int idx = atoi(start + 1);
195 + l = strspn(fmt, digits);
196 + if ((l > 0) && (fmt[l] == '$')) {
197 + int idx = atoi(fmt);
191 198 if (idx <= myargc) {
192 199 gargv = &myargv[idx - 1];
193 200 } else {
194 201 gargv = &myargv[myargc];
195 202 }
196 - start = fmt;
197 - fmt++;
203 + if (gargv > maxargv) {
204 + maxargv = gargv;
205 + }
206 + fmt += l + 1;
207 +
208 + /* save format argument */
209 + fargv = gargv;
198 210 } else {
199 - fmt = start + 1;
211 + fargv = NULL;
200 212 }
201 213
202 214 /* skip to field width */
203 - fmt += strspn(fmt, skip1);
215 + while (strchr(skip1, *fmt) != NULL) {
216 + *dptr++ = *fmt++;
217 + *dptr = 0;
218 + }
219 +
220 +
204 221 if (*fmt == '*') {
222 +
223 + fmt++;
224 + l = strspn(fmt, digits);
225 + if ((l > 0) && (fmt[l] == '$')) {
226 + int idx = atoi(fmt);
227 + if (idx <= myargc) {
228 + gargv = &myargv[idx - 1];
229 + } else {
230 + gargv = &myargv[myargc];
231 + }
232 + fmt += l + 1;
233 + }
234 +
205 235 if (getint(&fieldwidth))
206 236 return (NULL);
237 + if (gargv > maxargv) {
238 + maxargv = gargv;
239 + }
207 240 havewidth = 1;
208 - ++fmt;
241 +
242 + *dptr++ = '*';
243 + *dptr = 0;
209 244 } else {
210 245 havewidth = 0;
211 246
212 247 /* skip to possible '.', get following precision */
213 - fmt += strspn(fmt, skip2);
248 + while (isdigit(*fmt)) {
249 + *dptr++ = *fmt++;
250 + *dptr = 0;
251 + }
214 252 }
253 +
215 254 if (*fmt == '.') {
216 255 /* precision present? */
217 - ++fmt;
256 + fmt++;
257 + *dptr++ = '.';
258 +
218 259 if (*fmt == '*') {
260 +
261 + fmt++;
262 + l = strspn(fmt, digits);
263 + if ((l > 0) && (fmt[l] == '$')) {
264 + int idx = atoi(fmt);
265 + if (idx <= myargc) {
266 + gargv = &myargv[idx - 1];
267 + } else {
268 + gargv = &myargv[myargc];
269 + }
270 + fmt += l + 1;
271 + }
272 +
219 273 if (getint(&precision))
220 274 return (NULL);
275 + if (gargv > maxargv) {
276 + maxargv = gargv;
277 + }
221 278 haveprec = 1;
222 - ++fmt;
279 + *dptr++ = '*';
280 + *dptr = 0;
223 281 } else {
224 282 haveprec = 0;
225 283
226 284 /* skip to conversion char */
227 - fmt += strspn(fmt, skip2);
285 + while (isdigit(*fmt)) {
286 + *dptr++ = *fmt++;
287 + *dptr = 0;
288 + }
228 289 }
229 290 } else
230 291 haveprec = 0;
231 292 if (!*fmt) {
232 293 warnx1(_("missing format character"), NULL, NULL);
233 294 return (NULL);
234 295 }
296 + *dptr++ = *fmt;
297 + *dptr = 0;
235 298
236 299 /*
237 300 * Look for a length modifier. POSIX doesn't have these, so
238 301 * we only support them for floating-point conversions, which
239 302 * are extensions. This is useful because the L modifier can
240 303 * be used to gain extra range and precision, while omitting
241 304 * it is more likely to produce consistent results on different
242 305 * architectures. This is not so important for integers
243 306 * because overflow is the only bad thing that can happen to
244 307 * them, but consider the command printf %a 1.1
245 308 */
246 309 if (*fmt == 'L') {
↓ open down ↓ |
2 lines elided |
↑ open up ↑ |
247 310 mod_ldbl = 1;
248 311 fmt++;
249 312 if (!strchr("aAeEfFgG", *fmt)) {
250 313 warnx2(_("bad modifier L for %%%c"), *fmt, NULL);
251 314 return (NULL);
252 315 }
253 316 } else {
254 317 mod_ldbl = 0;
255 318 }
256 319
320 + /* if an n$ index selected the value argument, read the value from it */
321 + if (fargv != NULL) {
322 + gargv = fargv;
323 + }
324 +
257 325 convch = *fmt;
258 326 nextch = *++fmt;
327 +
259 328 *fmt = '\0';
260 329 switch (convch) {
261 330 case 'b': {
262 331 size_t len;
263 332 char *p;
264 333 int getout;
265 334
266 335 p = strdup(getstr());
267 336 if (p == NULL) {
268 337 warnx2("%s", strerror(ENOMEM), NULL);
269 338 return (NULL);
270 339 }
271 340 getout = escape(p, 0, &len);
272 - *(fmt - 1) = 's';
273 - PF(start, p);
274 - *(fmt - 1) = 'b';
341 + (void) fputs(p, stdout);
275 342 free(p);
276 343
277 344 if (getout)
278 - return (fmt);
345 + exit(*rval);
279 346 break;
280 347 }
281 348 case 'c': {
282 349 char p;
283 350
284 351 p = getchr();
285 352 PF(start, p);
286 353 break;
287 354 }
288 355 case 's': {
289 356 const char *p;
290 357
291 358 p = getstr();
292 359 PF(start, p);
293 360 break;
294 361 }
295 362 case 'd': case 'i': case 'o': case 'u': case 'x': case 'X': {
296 363 char *f;
297 364 intmax_t val;
298 365 uintmax_t uval;
299 366 int signedconv;
300 367
301 368 signedconv = (convch == 'd' || convch == 'i');
302 369 if ((f = mknum(start, convch)) == NULL)
303 370 return (NULL);
304 371 if (getnum(&val, &uval, signedconv))
305 372 *rval = 1;
306 373 if (signedconv)
307 374 PF(f, val);
308 375 else
309 376 PF(f, uval);
310 377 break;
311 378 }
312 379 case 'e': case 'E':
313 380 case 'f': case 'F':
314 381 case 'g': case 'G':
315 382 case 'a': case 'A': {
316 383 long double p;
317 384
318 385 if (getfloating(&p, mod_ldbl))
319 386 *rval = 1;
320 387 if (mod_ldbl)
↓ open down ↓ |
32 lines elided |
↑ open up ↑ |
321 388 PF(start, p);
322 389 else
323 390 PF(start, (double)p);
324 391 break;
325 392 }
326 393 default:
327 394 warnx2(_("illegal format character %c"), convch, NULL);
328 395 return (NULL);
329 396 }
330 397 *fmt = nextch;
398 +
399 + /* gargv has already been advanced past any argument consumed above */
331 400 return (fmt);
332 401 }
333 402
334 403 static char *
335 404 mknum(char *str, char ch)
336 405 {
337 406 static char *copy;
338 407 static size_t copy_size;
339 408 char *newcopy;
340 409 size_t len, newlen;
341 410
342 411 len = strlen(str) + 2;
343 412 if (len > copy_size) {
344 413 newlen = ((len + 1023) >> 10) << 10;
345 414 if ((newcopy = realloc(copy, newlen)) == NULL) {
346 415 warnx2("%s", strerror(ENOMEM), NULL);
347 416 return (NULL);
348 417 }
349 418 copy = newcopy;
350 419 copy_size = newlen;
351 420 }
352 421
353 422 (void) memmove(copy, str, len - 3);
354 423 copy[len - 3] = 'j';
355 424 copy[len - 2] = ch;
356 425 copy[len - 1] = '\0';
357 426 return (copy);
358 427 }
359 428
360 429 static int
361 430 escape(char *fmt, int percent, size_t *len)
362 431 {
363 432 char *save, *store, c;
364 433 int value;
365 434
366 435 for (save = store = fmt; ((c = *fmt) != 0); ++fmt, ++store) {
367 436 if (c != '\\') {
368 437 *store = c;
369 438 continue;
370 439 }
371 440 switch (*++fmt) {
372 441 case '\0': /* EOS, user error */
373 442 *store = '\\';
374 443 *++store = '\0';
375 444 *len = PTRDIFF(store, save);
376 445 return (0);
377 446 case '\\': /* backslash */
↓ open down ↓ |
37 lines elided |
↑ open up ↑ |
378 447 case '\'': /* single quote */
379 448 *store = *fmt;
380 449 break;
381 450 case 'a': /* bell/alert */
382 451 *store = '\a';
383 452 break;
384 453 case 'b': /* backspace */
385 454 *store = '\b';
386 455 break;
387 456 case 'c':
388 - *store = '\0';
389 - *len = PTRDIFF(store, save);
390 - return (1);
457 + if (!percent) {
458 + *store = '\0';
459 + *len = PTRDIFF(store, save);
460 + return (1);
461 + }
462 + *store = 'c';
463 + break;
391 464 case 'f': /* form-feed */
392 465 *store = '\f';
393 466 break;
394 467 case 'n': /* newline */
395 468 *store = '\n';
396 469 break;
397 470 case 'r': /* carriage-return */
398 471 *store = '\r';
399 472 break;
400 473 case 't': /* horizontal tab */
401 474 *store = '\t';
402 475 break;
403 476 case 'v': /* vertical tab */
404 477 *store = '\v';
405 478 break;
406 479 /* octal constant */
407 480 case '0': case '1': case '2': case '3':
408 481 case '4': case '5': case '6': case '7':
409 482 c = (!percent && *fmt == '0') ? 4 : 3;
410 483 for (value = 0;
411 484 c-- && *fmt >= '0' && *fmt <= '7'; ++fmt) {
412 485 value <<= 3;
413 486 value += *fmt - '0';
414 487 }
415 488 --fmt;
416 489 if (percent && value == '%') {
417 490 *store++ = '%';
418 491 *store = '%';
419 492 } else
420 493 *store = (char)value;
421 494 break;
422 495 default:
423 496 *store = *fmt;
424 497 break;
425 498 }
426 499 }
427 500 *store = '\0';
428 501 *len = PTRDIFF(store, save);
429 502 return (0);
430 503 }
431 504
432 505 static int
433 506 getchr(void)
434 507 {
435 508 if (!*gargv)
436 509 return ('\0');
437 510 return ((int)**gargv++);
438 511 }
439 512
440 513 static const char *
441 514 getstr(void)
442 515 {
443 516 if (!*gargv)
444 517 return ("");
445 518 return (*gargv++);
446 519 }
447 520
448 521 static int
449 522 getint(int *ip)
450 523 {
451 524 intmax_t val;
452 525 uintmax_t uval;
453 526 int rval;
454 527
455 528 if (getnum(&val, &uval, 1))
456 529 return (1);
457 530 rval = 0;
458 531 if (val < INT_MIN || val > INT_MAX) {
459 532 warnx3("%s: %s", *gargv, strerror(ERANGE));
460 533 rval = 1;
461 534 }
462 535 *ip = (int)val;
463 536 return (rval);
464 537 }
465 538
466 539 static int
467 540 getnum(intmax_t *ip, uintmax_t *uip, int signedconv)
468 541 {
469 542 char *ep;
470 543 int rval;
471 544
472 545 if (!*gargv) {
473 546 *ip = 0;
474 547 return (0);
475 548 }
476 549 if (**gargv == '"' || **gargv == '\'') {
477 550 if (signedconv)
478 551 *ip = asciicode();
479 552 else
480 553 *uip = asciicode();
481 554 return (0);
482 555 }
483 556 rval = 0;
484 557 errno = 0;
485 558 if (signedconv)
486 559 *ip = strtoimax(*gargv, &ep, 0);
487 560 else
488 561 *uip = strtoumax(*gargv, &ep, 0);
489 562 if (ep == *gargv) {
490 563 warnx2(_("%s: expected numeric value"), *gargv, NULL);
491 564 rval = 1;
492 565 } else if (*ep != '\0') {
493 566 warnx2(_("%s: not completely converted"), *gargv, NULL);
494 567 rval = 1;
495 568 }
496 569 if (errno == ERANGE) {
497 570 warnx3("%s: %s", *gargv, strerror(ERANGE));
498 571 rval = 1;
499 572 }
500 573 ++gargv;
501 574 return (rval);
502 575 }
503 576
504 577 static int
505 578 getfloating(long double *dp, int mod_ldbl)
506 579 {
507 580 char *ep;
508 581 int rval;
509 582
510 583 if (!*gargv) {
511 584 *dp = 0.0;
512 585 return (0);
513 586 }
514 587 if (**gargv == '"' || **gargv == '\'') {
515 588 *dp = asciicode();
516 589 return (0);
517 590 }
518 591 rval = 0;
519 592 errno = 0;
520 593 if (mod_ldbl)
521 594 *dp = strtold(*gargv, &ep);
522 595 else
523 596 *dp = strtod(*gargv, &ep);
524 597 if (ep == *gargv) {
525 598 warnx2(_("%s: expected numeric value"), *gargv, NULL);
526 599 rval = 1;
527 600 } else if (*ep != '\0') {
528 601 warnx2(_("%s: not completely converted"), *gargv, NULL);
529 602 rval = 1;
530 603 }
531 604 if (errno == ERANGE) {
532 605 warnx3("%s: %s", *gargv, strerror(ERANGE));
533 606 rval = 1;
534 607 }
535 608 ++gargv;
536 609 return (rval);
537 610 }
538 611
539 612 static int
540 613 asciicode(void)
541 614 {
542 615 int ch;
543 616
544 617 ch = **gargv;
545 618 if (ch == '\'' || ch == '"')
546 619 ch = (*gargv)[1];
547 620 ++gargv;
548 621 return (ch);
549 622 }
550 623
551 624 static void
552 625 usage(void)
553 626 {
554 627 (void) fprintf(stderr, _("usage: printf format [arguments ...]\n"));
555 628 }
↓ open down ↓ |
155 lines elided |
↑ open up ↑ |
XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX