1118537f2SMike Smith /*- 251369649SPedro F. Giffuni * SPDX-License-Identifier: BSD-3-Clause 351369649SPedro F. Giffuni * 4118537f2SMike Smith * Copyright (c) 1990, 1993 5118537f2SMike Smith * The Regents of the University of California. All rights reserved. 6118537f2SMike Smith * 7118537f2SMike Smith * This code is derived from software contributed to Berkeley by 8118537f2SMike Smith * Chris Torek. 9118537f2SMike Smith * 10118537f2SMike Smith * Redistribution and use in source and binary forms, with or without 11118537f2SMike Smith * modification, are permitted provided that the following conditions 12118537f2SMike Smith * are met: 13118537f2SMike Smith * 1. Redistributions of source code must retain the above copyright 14118537f2SMike Smith * notice, this list of conditions and the following disclaimer. 15118537f2SMike Smith * 2. Redistributions in binary form must reproduce the above copyright 16118537f2SMike Smith * notice, this list of conditions and the following disclaimer in the 17118537f2SMike Smith * documentation and/or other materials provided with the distribution. 1869a28758SEd Maste * 3. Neither the name of the University nor the names of its contributors 19118537f2SMike Smith * may be used to endorse or promote products derived from this software 20118537f2SMike Smith * without specific prior written permission. 21118537f2SMike Smith * 22118537f2SMike Smith * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 23118537f2SMike Smith * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 24118537f2SMike Smith * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 25118537f2SMike Smith * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 26118537f2SMike Smith * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 27118537f2SMike Smith * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 28118537f2SMike Smith * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 29118537f2SMike Smith * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 30118537f2SMike Smith * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 31118537f2SMike Smith * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 32118537f2SMike Smith * SUCH DAMAGE. 33118537f2SMike Smith * 34118537f2SMike Smith * From: Id: vfscanf.c,v 1.13 1998/09/25 12:20:27 obrien Exp 35bf9deabaSPoul-Henning Kamp * From: static char sccsid[] = "@(#)strtol.c 8.1 (Berkeley) 6/4/93"; 36bf9deabaSPoul-Henning Kamp * From: static char sccsid[] = "@(#)strtoul.c 8.1 (Berkeley) 6/4/93"; 37118537f2SMike Smith */ 38118537f2SMike Smith 39677b542eSDavid E. O'Brien #include <sys/cdefs.h> 40677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$"); 41677b542eSDavid E. O'Brien 42118537f2SMike Smith #include <sys/param.h> 43118537f2SMike Smith #include <sys/systm.h> 445b664c7cSPoul-Henning Kamp #include <sys/ctype.h> 45104a9b7eSAlexander Kabaev #include <sys/limits.h> 46*3a60f3daSAlexander Motin #include <sys/stddef.h> 47118537f2SMike Smith 48118537f2SMike Smith /* 49118537f2SMike Smith * Note that stdarg.h and the ANSI style va_start macro is used for both 50118537f2SMike Smith * ANSI and traditional C compilers. 51118537f2SMike Smith */ 52118537f2SMike Smith #include <machine/stdarg.h> 53118537f2SMike Smith 54118537f2SMike Smith #define BUF 32 /* Maximum length of numeric string. */ 55118537f2SMike Smith 56118537f2SMike Smith /* 57118537f2SMike Smith * Flags used during conversion. 58118537f2SMike Smith */ 59118537f2SMike Smith #define LONG 0x01 /* l: long or double */ 60118537f2SMike Smith #define SHORT 0x04 /* h: short */ 61118537f2SMike Smith #define SUPPRESS 0x08 /* suppress assignment */ 62118537f2SMike Smith #define POINTER 0x10 /* weird %p pointer (`fake hex') */ 63118537f2SMike Smith #define NOSKIP 0x20 /* do not skip blanks */ 64118537f2SMike Smith #define QUAD 0x400 65*3a60f3daSAlexander Motin #define INTMAXT 0x800 /* j: intmax_t */ 66*3a60f3daSAlexander Motin #define PTRDIFFT 0x1000 /* t: ptrdiff_t */ 67*3a60f3daSAlexander Motin #define SIZET 0x2000 /* z: size_t */ 687e949c46SKenneth D. Merry #define SHORTSHORT 0x4000 /** hh: char */ 69118537f2SMike Smith 70118537f2SMike Smith /* 71118537f2SMike Smith * The following are used in numeric conversions only: 72118537f2SMike Smith * SIGNOK, NDIGITS, DPTOK, and EXPOK are for floating point; 73118537f2SMike Smith * SIGNOK, NDIGITS, PFXOK, and NZDIGITS are for integral. 74118537f2SMike Smith */ 75118537f2SMike Smith #define SIGNOK 0x40 /* +/- is (still) legal */ 76118537f2SMike Smith #define NDIGITS 0x80 /* no digits detected */ 77118537f2SMike Smith 78118537f2SMike Smith #define DPTOK 0x100 /* (float) decimal point is still legal */ 79118537f2SMike Smith #define EXPOK 0x200 /* (float) exponent (e+3, etc) still legal */ 80118537f2SMike Smith 81118537f2SMike Smith #define PFXOK 0x100 /* 0x prefix is (still) legal */ 82118537f2SMike Smith #define NZDIGITS 0x200 /* no zero digits detected */ 83118537f2SMike Smith 84118537f2SMike Smith /* 85118537f2SMike Smith * Conversion types. 86118537f2SMike Smith */ 87118537f2SMike Smith #define CT_CHAR 0 /* %c conversion */ 88118537f2SMike Smith #define CT_CCL 1 /* %[...] conversion */ 89118537f2SMike Smith #define CT_STRING 2 /* %s conversion */ 90118537f2SMike Smith #define CT_INT 3 /* integer, i.e., strtoq or strtouq */ 9125792ef3SArchie Cobbs typedef u_quad_t (*ccfntype)(const char *, char **, int); 92118537f2SMike Smith 93598217c4SMatthew Dillon static const u_char *__sccl(char *, const u_char *); 94118537f2SMike Smith 95118537f2SMike Smith int 96118537f2SMike Smith sscanf(const char *ibuf, const char *fmt, ...) 97118537f2SMike Smith { 98118537f2SMike Smith va_list ap; 99118537f2SMike Smith int ret; 100118537f2SMike Smith 101118537f2SMike Smith va_start(ap, fmt); 102118537f2SMike Smith ret = vsscanf(ibuf, fmt, ap); 103118537f2SMike Smith va_end(ap); 104118537f2SMike Smith return(ret); 105118537f2SMike Smith } 106118537f2SMike Smith 107118537f2SMike Smith int 108118537f2SMike Smith vsscanf(const char *inp, char const *fmt0, va_list ap) 109118537f2SMike Smith { 110118537f2SMike Smith int inr; 111598217c4SMatthew Dillon const u_char *fmt = (const u_char *)fmt0; 112118537f2SMike Smith int c; /* character from format, or conversion */ 113118537f2SMike Smith size_t width; /* field width, or 0 */ 114118537f2SMike Smith char *p; /* points into all kinds of strings */ 115118537f2SMike Smith int n; /* handy integer */ 116118537f2SMike Smith int flags; /* flags as defined above */ 117118537f2SMike Smith char *p0; /* saves original value of p when necessary */ 118118537f2SMike Smith int nassigned; /* number of fields assigned */ 119118537f2SMike Smith int nconversions; /* number of conversions */ 120118537f2SMike Smith int nread; /* number of characters consumed from fp */ 121118537f2SMike Smith int base; /* base argument to strtoq/strtouq */ 122118537f2SMike Smith ccfntype ccfn; /* conversion function (strtoq/strtouq) */ 123118537f2SMike Smith char ccltab[256]; /* character class table for %[...] */ 124118537f2SMike Smith char buf[BUF]; /* buffer for numeric conversions */ 125118537f2SMike Smith 126118537f2SMike Smith /* `basefix' is used to avoid `if' tests in the integer scanner */ 127118537f2SMike Smith static short basefix[17] = 128118537f2SMike Smith { 10, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16 }; 129118537f2SMike Smith 130118537f2SMike Smith inr = strlen(inp); 131118537f2SMike Smith 132118537f2SMike Smith nassigned = 0; 133118537f2SMike Smith nconversions = 0; 134118537f2SMike Smith nread = 0; 135118537f2SMike Smith base = 0; /* XXX just to keep gcc happy */ 136118537f2SMike Smith ccfn = NULL; /* XXX just to keep gcc happy */ 137118537f2SMike Smith for (;;) { 138118537f2SMike Smith c = *fmt++; 139118537f2SMike Smith if (c == 0) 140118537f2SMike Smith return (nassigned); 141118537f2SMike Smith if (isspace(c)) { 142118537f2SMike Smith while (inr > 0 && isspace(*inp)) 143118537f2SMike Smith nread++, inr--, inp++; 144118537f2SMike Smith continue; 145118537f2SMike Smith } 146118537f2SMike Smith if (c != '%') 147118537f2SMike Smith goto literal; 148118537f2SMike Smith width = 0; 149118537f2SMike Smith flags = 0; 150118537f2SMike Smith /* 151118537f2SMike Smith * switch on the format. continue if done; 152118537f2SMike Smith * break once format type is derived. 153118537f2SMike Smith */ 154118537f2SMike Smith again: c = *fmt++; 155118537f2SMike Smith switch (c) { 156118537f2SMike Smith case '%': 157118537f2SMike Smith literal: 158118537f2SMike Smith if (inr <= 0) 159118537f2SMike Smith goto input_failure; 160118537f2SMike Smith if (*inp != c) 161118537f2SMike Smith goto match_failure; 162118537f2SMike Smith inr--, inp++; 163118537f2SMike Smith nread++; 164118537f2SMike Smith continue; 165118537f2SMike Smith 166118537f2SMike Smith case '*': 167118537f2SMike Smith flags |= SUPPRESS; 168118537f2SMike Smith goto again; 169*3a60f3daSAlexander Motin case 'j': 170*3a60f3daSAlexander Motin flags |= INTMAXT; 171*3a60f3daSAlexander Motin goto again; 172118537f2SMike Smith case 'l': 1737e949c46SKenneth D. Merry if (flags & LONG){ 1747e949c46SKenneth D. Merry flags &= ~LONG; 1757e949c46SKenneth D. Merry flags |= QUAD; 1767e949c46SKenneth D. Merry } else { 177118537f2SMike Smith flags |= LONG; 1787e949c46SKenneth D. Merry } 179118537f2SMike Smith goto again; 180118537f2SMike Smith case 'q': 181118537f2SMike Smith flags |= QUAD; 182118537f2SMike Smith goto again; 183*3a60f3daSAlexander Motin case 't': 184*3a60f3daSAlexander Motin flags |= PTRDIFFT; 185*3a60f3daSAlexander Motin goto again; 186*3a60f3daSAlexander Motin case 'z': 187*3a60f3daSAlexander Motin flags |= SIZET; 188*3a60f3daSAlexander Motin goto again; 189118537f2SMike Smith case 'h': 1907e949c46SKenneth D. Merry if (flags & SHORT){ 1917e949c46SKenneth D. Merry flags &= ~SHORT; 1927e949c46SKenneth D. Merry flags |= SHORTSHORT; 1937e949c46SKenneth D. Merry } else { 194118537f2SMike Smith flags |= SHORT; 1957e949c46SKenneth D. Merry } 196118537f2SMike Smith goto again; 197118537f2SMike Smith 198118537f2SMike Smith case '0': case '1': case '2': case '3': case '4': 199118537f2SMike Smith case '5': case '6': case '7': case '8': case '9': 200118537f2SMike Smith width = width * 10 + c - '0'; 201118537f2SMike Smith goto again; 202118537f2SMike Smith 203118537f2SMike Smith /* 204118537f2SMike Smith * Conversions. 205118537f2SMike Smith * 206118537f2SMike Smith */ 207118537f2SMike Smith case 'd': 208118537f2SMike Smith c = CT_INT; 209118537f2SMike Smith ccfn = (ccfntype)strtoq; 210118537f2SMike Smith base = 10; 211118537f2SMike Smith break; 212118537f2SMike Smith 213118537f2SMike Smith case 'i': 214118537f2SMike Smith c = CT_INT; 215118537f2SMike Smith ccfn = (ccfntype)strtoq; 216118537f2SMike Smith base = 0; 217118537f2SMike Smith break; 218118537f2SMike Smith 219118537f2SMike Smith case 'o': 220118537f2SMike Smith c = CT_INT; 221118537f2SMike Smith ccfn = strtouq; 222118537f2SMike Smith base = 8; 223118537f2SMike Smith break; 224118537f2SMike Smith 225118537f2SMike Smith case 'u': 226118537f2SMike Smith c = CT_INT; 227118537f2SMike Smith ccfn = strtouq; 228118537f2SMike Smith base = 10; 229118537f2SMike Smith break; 230118537f2SMike Smith 231118537f2SMike Smith case 'x': 232118537f2SMike Smith flags |= PFXOK; /* enable 0x prefixing */ 233118537f2SMike Smith c = CT_INT; 234118537f2SMike Smith ccfn = strtouq; 235118537f2SMike Smith base = 16; 236118537f2SMike Smith break; 237118537f2SMike Smith 238118537f2SMike Smith case 's': 239118537f2SMike Smith c = CT_STRING; 240118537f2SMike Smith break; 241118537f2SMike Smith 242118537f2SMike Smith case '[': 243118537f2SMike Smith fmt = __sccl(ccltab, fmt); 244118537f2SMike Smith flags |= NOSKIP; 245118537f2SMike Smith c = CT_CCL; 246118537f2SMike Smith break; 247118537f2SMike Smith 248118537f2SMike Smith case 'c': 249118537f2SMike Smith flags |= NOSKIP; 250118537f2SMike Smith c = CT_CHAR; 251118537f2SMike Smith break; 252118537f2SMike Smith 253118537f2SMike Smith case 'p': /* pointer format is like hex */ 254118537f2SMike Smith flags |= POINTER | PFXOK; 255118537f2SMike Smith c = CT_INT; 256118537f2SMike Smith ccfn = strtouq; 257118537f2SMike Smith base = 16; 258118537f2SMike Smith break; 259118537f2SMike Smith 260118537f2SMike Smith case 'n': 261118537f2SMike Smith nconversions++; 262118537f2SMike Smith if (flags & SUPPRESS) /* ??? */ 263118537f2SMike Smith continue; 2647e949c46SKenneth D. Merry if (flags & SHORTSHORT) 2657e949c46SKenneth D. Merry *va_arg(ap, char *) = nread; 2667e949c46SKenneth D. Merry else if (flags & SHORT) 267118537f2SMike Smith *va_arg(ap, short *) = nread; 268118537f2SMike Smith else if (flags & LONG) 269118537f2SMike Smith *va_arg(ap, long *) = nread; 270118537f2SMike Smith else if (flags & QUAD) 271118537f2SMike Smith *va_arg(ap, quad_t *) = nread; 272*3a60f3daSAlexander Motin else if (flags & INTMAXT) 273*3a60f3daSAlexander Motin *va_arg(ap, intmax_t *) = nread; 274*3a60f3daSAlexander Motin else if (flags & SIZET) 275*3a60f3daSAlexander Motin *va_arg(ap, size_t *) = nread; 276*3a60f3daSAlexander Motin else if (flags & PTRDIFFT) 277*3a60f3daSAlexander Motin *va_arg(ap, ptrdiff_t *) = nread; 278118537f2SMike Smith else 279118537f2SMike Smith *va_arg(ap, int *) = nread; 280118537f2SMike Smith continue; 281118537f2SMike Smith } 282118537f2SMike Smith 283118537f2SMike Smith /* 284118537f2SMike Smith * We have a conversion that requires input. 285118537f2SMike Smith */ 286118537f2SMike Smith if (inr <= 0) 287118537f2SMike Smith goto input_failure; 288118537f2SMike Smith 289118537f2SMike Smith /* 290118537f2SMike Smith * Consume leading white space, except for formats 291118537f2SMike Smith * that suppress this. 292118537f2SMike Smith */ 293118537f2SMike Smith if ((flags & NOSKIP) == 0) { 294118537f2SMike Smith while (isspace(*inp)) { 295118537f2SMike Smith nread++; 296118537f2SMike Smith if (--inr > 0) 297118537f2SMike Smith inp++; 298118537f2SMike Smith else 299118537f2SMike Smith goto input_failure; 300118537f2SMike Smith } 301118537f2SMike Smith /* 302118537f2SMike Smith * Note that there is at least one character in 303118537f2SMike Smith * the buffer, so conversions that do not set NOSKIP 304118537f2SMike Smith * can no longer result in an input failure. 305118537f2SMike Smith */ 306118537f2SMike Smith } 307118537f2SMike Smith 308118537f2SMike Smith /* 309118537f2SMike Smith * Do the conversion. 310118537f2SMike Smith */ 311118537f2SMike Smith switch (c) { 312118537f2SMike Smith 313118537f2SMike Smith case CT_CHAR: 314118537f2SMike Smith /* scan arbitrary characters (sets NOSKIP) */ 315118537f2SMike Smith if (width == 0) 316118537f2SMike Smith width = 1; 317118537f2SMike Smith if (flags & SUPPRESS) { 318118537f2SMike Smith size_t sum = 0; 319118537f2SMike Smith for (;;) { 320118537f2SMike Smith if ((n = inr) < width) { 321118537f2SMike Smith sum += n; 322118537f2SMike Smith width -= n; 323118537f2SMike Smith inp += n; 324118537f2SMike Smith if (sum == 0) 325118537f2SMike Smith goto input_failure; 326118537f2SMike Smith break; 327118537f2SMike Smith } else { 328118537f2SMike Smith sum += width; 329118537f2SMike Smith inr -= width; 330118537f2SMike Smith inp += width; 331118537f2SMike Smith break; 332118537f2SMike Smith } 333118537f2SMike Smith } 334118537f2SMike Smith nread += sum; 335118537f2SMike Smith } else { 336118537f2SMike Smith bcopy(inp, va_arg(ap, char *), width); 337118537f2SMike Smith inr -= width; 338118537f2SMike Smith inp += width; 339118537f2SMike Smith nread += width; 340118537f2SMike Smith nassigned++; 341118537f2SMike Smith } 342118537f2SMike Smith nconversions++; 343118537f2SMike Smith break; 344118537f2SMike Smith 345118537f2SMike Smith case CT_CCL: 346118537f2SMike Smith /* scan a (nonempty) character class (sets NOSKIP) */ 347118537f2SMike Smith if (width == 0) 348118537f2SMike Smith width = (size_t)~0; /* `infinity' */ 349118537f2SMike Smith /* take only those things in the class */ 350118537f2SMike Smith if (flags & SUPPRESS) { 351118537f2SMike Smith n = 0; 352ef528b29SMatthew Dillon while (ccltab[(unsigned char)*inp]) { 353118537f2SMike Smith n++, inr--, inp++; 354118537f2SMike Smith if (--width == 0) 355118537f2SMike Smith break; 356118537f2SMike Smith if (inr <= 0) { 357118537f2SMike Smith if (n == 0) 358118537f2SMike Smith goto input_failure; 359118537f2SMike Smith break; 360118537f2SMike Smith } 361118537f2SMike Smith } 362118537f2SMike Smith if (n == 0) 363118537f2SMike Smith goto match_failure; 364118537f2SMike Smith } else { 365118537f2SMike Smith p0 = p = va_arg(ap, char *); 366ef528b29SMatthew Dillon while (ccltab[(unsigned char)*inp]) { 367118537f2SMike Smith inr--; 368118537f2SMike Smith *p++ = *inp++; 369118537f2SMike Smith if (--width == 0) 370118537f2SMike Smith break; 371118537f2SMike Smith if (inr <= 0) { 372118537f2SMike Smith if (p == p0) 373118537f2SMike Smith goto input_failure; 374118537f2SMike Smith break; 375118537f2SMike Smith } 376118537f2SMike Smith } 377118537f2SMike Smith n = p - p0; 378118537f2SMike Smith if (n == 0) 379118537f2SMike Smith goto match_failure; 380118537f2SMike Smith *p = 0; 381118537f2SMike Smith nassigned++; 382118537f2SMike Smith } 383118537f2SMike Smith nread += n; 384118537f2SMike Smith nconversions++; 385118537f2SMike Smith break; 386118537f2SMike Smith 387118537f2SMike Smith case CT_STRING: 388118537f2SMike Smith /* like CCL, but zero-length string OK, & no NOSKIP */ 389118537f2SMike Smith if (width == 0) 390118537f2SMike Smith width = (size_t)~0; 391118537f2SMike Smith if (flags & SUPPRESS) { 392118537f2SMike Smith n = 0; 393118537f2SMike Smith while (!isspace(*inp)) { 394118537f2SMike Smith n++, inr--, inp++; 395118537f2SMike Smith if (--width == 0) 396118537f2SMike Smith break; 397118537f2SMike Smith if (inr <= 0) 398118537f2SMike Smith break; 399118537f2SMike Smith } 400118537f2SMike Smith nread += n; 401118537f2SMike Smith } else { 402118537f2SMike Smith p0 = p = va_arg(ap, char *); 403118537f2SMike Smith while (!isspace(*inp)) { 404118537f2SMike Smith inr--; 405118537f2SMike Smith *p++ = *inp++; 406118537f2SMike Smith if (--width == 0) 407118537f2SMike Smith break; 408118537f2SMike Smith if (inr <= 0) 409118537f2SMike Smith break; 410118537f2SMike Smith } 411118537f2SMike Smith *p = 0; 412118537f2SMike Smith nread += p - p0; 413118537f2SMike Smith nassigned++; 414118537f2SMike Smith } 415118537f2SMike Smith nconversions++; 416118537f2SMike Smith continue; 417118537f2SMike Smith 418118537f2SMike Smith case CT_INT: 419118537f2SMike Smith /* scan an integer as if by strtoq/strtouq */ 420118537f2SMike Smith #ifdef hardway 421118537f2SMike Smith if (width == 0 || width > sizeof(buf) - 1) 422118537f2SMike Smith width = sizeof(buf) - 1; 423118537f2SMike Smith #else 424118537f2SMike Smith /* size_t is unsigned, hence this optimisation */ 425118537f2SMike Smith if (--width > sizeof(buf) - 2) 426118537f2SMike Smith width = sizeof(buf) - 2; 427118537f2SMike Smith width++; 428118537f2SMike Smith #endif 429118537f2SMike Smith flags |= SIGNOK | NDIGITS | NZDIGITS; 430118537f2SMike Smith for (p = buf; width; width--) { 431118537f2SMike Smith c = *inp; 432118537f2SMike Smith /* 433118537f2SMike Smith * Switch on the character; `goto ok' 434118537f2SMike Smith * if we accept it as a part of number. 435118537f2SMike Smith */ 436118537f2SMike Smith switch (c) { 437118537f2SMike Smith 438118537f2SMike Smith /* 439118537f2SMike Smith * The digit 0 is always legal, but is 440118537f2SMike Smith * special. For %i conversions, if no 441118537f2SMike Smith * digits (zero or nonzero) have been 442118537f2SMike Smith * scanned (only signs), we will have 443118537f2SMike Smith * base==0. In that case, we should set 444118537f2SMike Smith * it to 8 and enable 0x prefixing. 445118537f2SMike Smith * Also, if we have not scanned zero digits 446118537f2SMike Smith * before this, do not turn off prefixing 447118537f2SMike Smith * (someone else will turn it off if we 448118537f2SMike Smith * have scanned any nonzero digits). 449118537f2SMike Smith */ 450118537f2SMike Smith case '0': 451118537f2SMike Smith if (base == 0) { 452118537f2SMike Smith base = 8; 453118537f2SMike Smith flags |= PFXOK; 454118537f2SMike Smith } 455118537f2SMike Smith if (flags & NZDIGITS) 456118537f2SMike Smith flags &= ~(SIGNOK|NZDIGITS|NDIGITS); 457118537f2SMike Smith else 458118537f2SMike Smith flags &= ~(SIGNOK|PFXOK|NDIGITS); 459118537f2SMike Smith goto ok; 460118537f2SMike Smith 461118537f2SMike Smith /* 1 through 7 always legal */ 462118537f2SMike Smith case '1': case '2': case '3': 463118537f2SMike Smith case '4': case '5': case '6': case '7': 464118537f2SMike Smith base = basefix[base]; 465118537f2SMike Smith flags &= ~(SIGNOK | PFXOK | NDIGITS); 466118537f2SMike Smith goto ok; 467118537f2SMike Smith 468118537f2SMike Smith /* digits 8 and 9 ok iff decimal or hex */ 469118537f2SMike Smith case '8': case '9': 470118537f2SMike Smith base = basefix[base]; 471118537f2SMike Smith if (base <= 8) 472118537f2SMike Smith break; /* not legal here */ 473118537f2SMike Smith flags &= ~(SIGNOK | PFXOK | NDIGITS); 474118537f2SMike Smith goto ok; 475118537f2SMike Smith 476118537f2SMike Smith /* letters ok iff hex */ 477118537f2SMike Smith case 'A': case 'B': case 'C': 478118537f2SMike Smith case 'D': case 'E': case 'F': 479118537f2SMike Smith case 'a': case 'b': case 'c': 480118537f2SMike Smith case 'd': case 'e': case 'f': 481118537f2SMike Smith /* no need to fix base here */ 482118537f2SMike Smith if (base <= 10) 483118537f2SMike Smith break; /* not legal here */ 484118537f2SMike Smith flags &= ~(SIGNOK | PFXOK | NDIGITS); 485118537f2SMike Smith goto ok; 486118537f2SMike Smith 487118537f2SMike Smith /* sign ok only as first character */ 488118537f2SMike Smith case '+': case '-': 489118537f2SMike Smith if (flags & SIGNOK) { 490118537f2SMike Smith flags &= ~SIGNOK; 491118537f2SMike Smith goto ok; 492118537f2SMike Smith } 493118537f2SMike Smith break; 494118537f2SMike Smith 495118537f2SMike Smith /* x ok iff flag still set & 2nd char */ 496118537f2SMike Smith case 'x': case 'X': 497118537f2SMike Smith if (flags & PFXOK && p == buf + 1) { 498118537f2SMike Smith base = 16; /* if %i */ 499118537f2SMike Smith flags &= ~PFXOK; 500118537f2SMike Smith goto ok; 501118537f2SMike Smith } 502118537f2SMike Smith break; 503118537f2SMike Smith } 504118537f2SMike Smith 505118537f2SMike Smith /* 506118537f2SMike Smith * If we got here, c is not a legal character 507118537f2SMike Smith * for a number. Stop accumulating digits. 508118537f2SMike Smith */ 509118537f2SMike Smith break; 510118537f2SMike Smith ok: 511118537f2SMike Smith /* 512118537f2SMike Smith * c is legal: store it and look at the next. 513118537f2SMike Smith */ 514118537f2SMike Smith *p++ = c; 515118537f2SMike Smith if (--inr > 0) 516118537f2SMike Smith inp++; 517118537f2SMike Smith else 518118537f2SMike Smith break; /* end of input */ 519118537f2SMike Smith } 520118537f2SMike Smith /* 521118537f2SMike Smith * If we had only a sign, it is no good; push 522118537f2SMike Smith * back the sign. If the number ends in `x', 523118537f2SMike Smith * it was [sign] '0' 'x', so push back the x 524118537f2SMike Smith * and treat it as [sign] '0'. 525118537f2SMike Smith */ 526118537f2SMike Smith if (flags & NDIGITS) { 527118537f2SMike Smith if (p > buf) { 528118537f2SMike Smith inp--; 529118537f2SMike Smith inr++; 530118537f2SMike Smith } 531118537f2SMike Smith goto match_failure; 532118537f2SMike Smith } 533118537f2SMike Smith c = ((u_char *)p)[-1]; 534118537f2SMike Smith if (c == 'x' || c == 'X') { 535118537f2SMike Smith --p; 536118537f2SMike Smith inp--; 537118537f2SMike Smith inr++; 538118537f2SMike Smith } 539118537f2SMike Smith if ((flags & SUPPRESS) == 0) { 540118537f2SMike Smith u_quad_t res; 541118537f2SMike Smith 542118537f2SMike Smith *p = 0; 54325792ef3SArchie Cobbs res = (*ccfn)(buf, (char **)NULL, base); 544118537f2SMike Smith if (flags & POINTER) 545118537f2SMike Smith *va_arg(ap, void **) = 546d009ccfaSBruce Evans (void *)(uintptr_t)res; 5477e949c46SKenneth D. Merry else if (flags & SHORTSHORT) 5487e949c46SKenneth D. Merry *va_arg(ap, char *) = res; 549118537f2SMike Smith else if (flags & SHORT) 550118537f2SMike Smith *va_arg(ap, short *) = res; 551118537f2SMike Smith else if (flags & LONG) 552118537f2SMike Smith *va_arg(ap, long *) = res; 553118537f2SMike Smith else if (flags & QUAD) 554118537f2SMike Smith *va_arg(ap, quad_t *) = res; 555*3a60f3daSAlexander Motin else if (flags & INTMAXT) 556*3a60f3daSAlexander Motin *va_arg(ap, intmax_t *) = res; 557*3a60f3daSAlexander Motin else if (flags & PTRDIFFT) 558*3a60f3daSAlexander Motin *va_arg(ap, ptrdiff_t *) = res; 559*3a60f3daSAlexander Motin else if (flags & SIZET) 560*3a60f3daSAlexander Motin *va_arg(ap, size_t *) = res; 561118537f2SMike Smith else 562118537f2SMike Smith *va_arg(ap, int *) = res; 563118537f2SMike Smith nassigned++; 564118537f2SMike Smith } 565118537f2SMike Smith nread += p - buf; 566118537f2SMike Smith nconversions++; 567118537f2SMike Smith break; 568118537f2SMike Smith 569118537f2SMike Smith } 570118537f2SMike Smith } 571118537f2SMike Smith input_failure: 572118537f2SMike Smith return (nconversions != 0 ? nassigned : -1); 573118537f2SMike Smith match_failure: 574118537f2SMike Smith return (nassigned); 575118537f2SMike Smith } 576118537f2SMike Smith 577118537f2SMike Smith /* 578118537f2SMike Smith * Fill in the given table from the scanset at the given format 579118537f2SMike Smith * (just after `['). Return a pointer to the character past the 580118537f2SMike Smith * closing `]'. The table has a 1 wherever characters should be 581118537f2SMike Smith * considered part of the scanset. 582118537f2SMike Smith */ 583598217c4SMatthew Dillon static const u_char * 584598217c4SMatthew Dillon __sccl(char *tab, const u_char *fmt) 585118537f2SMike Smith { 586118537f2SMike Smith int c, n, v; 587118537f2SMike Smith 588118537f2SMike Smith /* first `clear' the whole table */ 589118537f2SMike Smith c = *fmt++; /* first char hat => negated scanset */ 590118537f2SMike Smith if (c == '^') { 591118537f2SMike Smith v = 1; /* default => accept */ 592118537f2SMike Smith c = *fmt++; /* get new first char */ 593118537f2SMike Smith } else 594118537f2SMike Smith v = 0; /* default => reject */ 595118537f2SMike Smith 596118537f2SMike Smith /* XXX: Will not work if sizeof(tab*) > sizeof(char) */ 597118537f2SMike Smith for (n = 0; n < 256; n++) 598118537f2SMike Smith tab[n] = v; /* memset(tab, v, 256) */ 599118537f2SMike Smith 600118537f2SMike Smith if (c == 0) 601118537f2SMike Smith return (fmt - 1);/* format ended before closing ] */ 602118537f2SMike Smith 603118537f2SMike Smith /* 604118537f2SMike Smith * Now set the entries corresponding to the actual scanset 605118537f2SMike Smith * to the opposite of the above. 606118537f2SMike Smith * 607118537f2SMike Smith * The first character may be ']' (or '-') without being special; 608118537f2SMike Smith * the last character may be '-'. 609118537f2SMike Smith */ 610118537f2SMike Smith v = 1 - v; 611118537f2SMike Smith for (;;) { 612118537f2SMike Smith tab[c] = v; /* take character c */ 613118537f2SMike Smith doswitch: 614118537f2SMike Smith n = *fmt++; /* and examine the next */ 615118537f2SMike Smith switch (n) { 616118537f2SMike Smith 617118537f2SMike Smith case 0: /* format ended too soon */ 618118537f2SMike Smith return (fmt - 1); 619118537f2SMike Smith 620118537f2SMike Smith case '-': 621118537f2SMike Smith /* 622118537f2SMike Smith * A scanset of the form 623118537f2SMike Smith * [01+-] 624118537f2SMike Smith * is defined as `the digit 0, the digit 1, 625118537f2SMike Smith * the character +, the character -', but 626118537f2SMike Smith * the effect of a scanset such as 627118537f2SMike Smith * [a-zA-Z0-9] 628118537f2SMike Smith * is implementation defined. The V7 Unix 629118537f2SMike Smith * scanf treats `a-z' as `the letters a through 630118537f2SMike Smith * z', but treats `a-a' as `the letter a, the 631118537f2SMike Smith * character -, and the letter a'. 632118537f2SMike Smith * 633e3043798SPedro F. Giffuni * For compatibility, the `-' is not considered 634118537f2SMike Smith * to define a range if the character following 635118537f2SMike Smith * it is either a close bracket (required by ANSI) 636118537f2SMike Smith * or is not numerically greater than the character 637118537f2SMike Smith * we just stored in the table (c). 638118537f2SMike Smith */ 639118537f2SMike Smith n = *fmt; 640118537f2SMike Smith if (n == ']' || n < c) { 641118537f2SMike Smith c = '-'; 642118537f2SMike Smith break; /* resume the for(;;) */ 643118537f2SMike Smith } 644118537f2SMike Smith fmt++; 645118537f2SMike Smith /* fill in the range */ 646118537f2SMike Smith do { 647118537f2SMike Smith tab[++c] = v; 648118537f2SMike Smith } while (c < n); 649118537f2SMike Smith c = n; 650118537f2SMike Smith /* 651118537f2SMike Smith * Alas, the V7 Unix scanf also treats formats 652118537f2SMike Smith * such as [a-c-e] as `the letters a through e'. 653118537f2SMike Smith * This too is permitted by the standard.... 654118537f2SMike Smith */ 655118537f2SMike Smith goto doswitch; 656118537f2SMike Smith break; 657118537f2SMike Smith 658118537f2SMike Smith case ']': /* end of scanset */ 659118537f2SMike Smith return (fmt); 660118537f2SMike Smith 661118537f2SMike Smith default: /* just another character */ 662118537f2SMike Smith c = n; 663118537f2SMike Smith break; 664118537f2SMike Smith } 665118537f2SMike Smith } 666118537f2SMike Smith /* NOTREACHED */ 667118537f2SMike Smith } 668118537f2SMike Smith 669