/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright 2009 Sun Microsystems, Inc. All rights reserved.
 * Use is subject to license terms.
 *
 * sgsmsg generates several message files from an input template file. Messages
 * are constructed for use with gettext(3i) - the default - or catgets(3c). The
 * files generated are:
 *
 * msg.h	a header file containing definitions for each message. The -h
 *		option triggers the creation of these definitions and specifies
 *		the name to use.
 *
 * msg.c	a data array of message strings. The msg.h definitions are
 *		offsets into this array. The -d option triggers the creation of
 *		these definitions and specifies the name to use.
 *
 * messages	a message file suitable for catgets(3c) or gettext(3i) use. The
 *		-m option triggers this output and specifies the filename to be
 *		used.
 *
 * The template file is processed based on the first character of each line:
 *
 * # or $	entries are copied (as is) to the message file (messages).
 *
 * @ token(s)	entries are translated.
Two translations are possible dependent
 *		on whether one or more tokens are supplied:
 *
 *		A single token is interpreted as one of two reserved message
 *		output indicators, or a message identifier. The reserved output
 *		indicator _START_ enables output to the message file - Note that
 *		the occurrence of any other @ token will also enable message
 *		output. The reserved output indicator _END_ disables output to
 *		the message file. The use of these two indicators provides for
 *		only those message strings that require translation to be output
 *		to the message file.
 *
 *		Besides the reserved output indicators, a single token is taken
 *		to be a message identifier which will be substituted for a
 *		`setid' for catgets(3c) output, or a `domain' name for
 *		gettext(3i) output. This value is determined by substituting the
 *		token for the associated definition found in the message
 *		identifier file (specified with the -i option).
 *
 *		Multiple tokens are taken to be a message definition followed by
 *		the associated message string. The message string is copied to
 *		the data array being built in msg.c. The index into this array
 *		becomes the `message' identifier created in the msg.h file.
 */

#include <fcntl.h>
#include <stdlib.h>
#include <stdio.h>
#include <unistd.h>
#include <limits.h>
#include <string.h>
#include <ctype.h>
#include <errno.h>
#include <sys/param.h>

#include <sgs.h>
#include <_string_table.h>

/*
 * Define any error message strings.
85 */ 86 static const char 87 * Errmsg_malt = "sgsmsg: file %s: line %d: malformed input " 88 "at line\n", 89 * Errmsg_nmem = "sgsmsg: memory allocation failed: %s\n", 90 * Errmsg_opne = "sgsmsg: file %s: open failed: %s\n", 91 * Errmsg_wrte = "sgsmsg: file %s: write failed: %s\n", 92 * Errmsg_read = "sgsmsg: file %s: read failed %s\n", 93 * Errmsg_stnw = "sgsmsg: st_new(): failed: %s\n", 94 * Errmsg_stin = "sgsmsg: Str_tbl insert failed: %s\n", 95 * Errmsg_mnfn = "sgsmsg: message not found in Str_tbl: %s\n", 96 * Errmsg_use = "usage: sgsmsg [-clv] [-d mesgdata] [-h mesgdefs] " 97 "[-m messages] [-n name] [-i mesgident] file ...\n"; 98 99 /* 100 * Define all output filenames and associated descriptors. 101 */ 102 static FILE *fddefs, *fddata, *fdmsgs, *fdmids, *fddesc; 103 static char *fldefs, *fldata, *flmsgs, *flmids, *fldesc; 104 static FILE *fdlint; 105 static char fllint[MAXPATHLEN]; 106 107 static uint_t vflag; /* verbose flag */ 108 static Str_tbl *stp; /* string table */ 109 110 /* 111 * Define any default strings. 112 */ 113 static const char 114 *nmlint = "/tmp/sgsmsg.lint", 115 *interface = "sgs_msg", 116 *start = "_START_", 117 *end = "_END_"; 118 119 /* 120 * Define any default flags and data items. 121 */ 122 static int cflag = 0, lflag = 0, prtmsgs = 0, line, ptr = 1, msgid = 0; 123 static char *mesgid = 0, *setid = 0, *domain = 0; 124 125 typedef struct msg_string { 126 char *ms_defn; 127 char *ms_message; 128 struct msg_string *ms_next; 129 } msg_string; 130 131 static msg_string *msg_head; 132 static msg_string *msg_tail; 133 134 /* 135 * message_append() is responsible for both inserting strings into 136 * the master Str_tbl as well as maintaining a list of the 137 * DEFINITIONS associated with each string. 138 * 139 * The list of strings is traversed at the end once the full 140 * Str_tbl has been constructed - and string offsets can be 141 * assigned. 
142 */ 143 static void 144 message_append(const char *defn, const char *message) 145 { 146 msg_string *msg; 147 if ((msg = calloc(sizeof (msg_string), 1)) == 0) { 148 (void) fprintf(stderr, Errmsg_nmem, strerror(errno)); 149 exit(1); 150 } 151 152 /* 153 * Initialize the string table. 154 */ 155 if ((stp == 0) && ((stp = st_new(FLG_STNEW_COMPRESS)) == NULL)) { 156 (void) fprintf(stderr, Errmsg_stnw, strerror(errno)); 157 exit(1); 158 } 159 160 161 if ((msg->ms_defn = strdup(defn)) == 0) { 162 (void) fprintf(stderr, Errmsg_nmem, strerror(errno)); 163 exit(1); 164 } 165 if ((msg->ms_message = strdup(message)) == 0) { 166 (void) fprintf(stderr, Errmsg_nmem, strerror(errno)); 167 exit(1); 168 } 169 170 if (st_insert(stp, msg->ms_message) == -1) { 171 (void) fprintf(stderr, Errmsg_stin, 172 message); 173 exit(1); 174 } 175 176 if (msg_head == 0) { 177 msg_head = msg_tail = msg; 178 return; 179 } 180 msg_tail->ms_next = msg; 181 msg_tail = msg; 182 } 183 184 /* 185 * Initialize a setid value. Given a setid definition determine its numeric 186 * value from the specified message identifier file (specified with the -i 187 * option). Return a pointer to the numeric string. 188 */ 189 static int 190 getmesgid(char *id) 191 { 192 char *buffer, *token, *_mesgid = 0, *_setid = 0, *_domain = 0; 193 194 /* 195 * If we're being asked to interpret a message id but the user didn't 196 * provide the required message identifier file (-i option) we're in 197 * trouble. 198 */ 199 if (flmids == 0) { 200 (void) fprintf(stderr, "sgsmsg: file %s: line %d: mesgid %s: " 201 "unable to process mesgid\n\t" 202 "no message identifier file specified " 203 "(see -i option)\n", fldesc, line, id); 204 return (1); 205 } 206 207 if ((buffer = malloc(LINE_MAX)) == 0) { 208 (void) fprintf(stderr, Errmsg_nmem, strerror(errno)); 209 return (1); 210 } 211 212 /* 213 * Read the message identifier file and locate the required mesgid. 
214 */ 215 rewind(fdmids); 216 while (fgets(buffer, LINE_MAX, fdmids) != NULL) { 217 if ((token = strstr(buffer, id)) == NULL) 218 continue; 219 220 /* 221 * Establish individual strings for the mesgid, setid and domain 222 * values. 223 */ 224 _mesgid = token; 225 while (!(isspace(*token))) 226 token++; 227 *token++ = 0; 228 229 while (isspace(*token)) 230 token++; 231 _setid = token; 232 while (!(isspace(*token))) 233 token++; 234 *token++ = 0; 235 236 while (isspace(*token)) 237 token++; 238 _domain = token; 239 while (!(isspace(*token))) 240 token++; 241 *token = 0; 242 break; 243 } 244 245 /* 246 * Did we find a match? 247 */ 248 if ((_mesgid == 0) || (_setid == 0) || (_domain == 0)) { 249 (void) fprintf(stderr, "sgsmsg: file %s: line %d: mesgid %s: " 250 "unable to process mesgid\n\t" 251 "identifier does not exist in file %s\n", 252 fldesc, line, id, flmids); 253 return (1); 254 } 255 256 /* 257 * Have we been here before? 258 */ 259 if (mesgid) { 260 if (cflag == 1) { 261 /* 262 * If we're being asked to process more than one mesgid 263 * warn the user that only one mesgid can be used for 264 * the catgets(3c) call. 265 */ 266 (void) fprintf(stderr, "sgsmsg: file %s: line %d: " 267 "setid %s: warning: multiple mesgids " 268 "encountered\n\t" 269 "last setting used in messaging code\n", 270 fldesc, line, id); 271 } 272 } 273 274 mesgid = _mesgid; 275 setid = _setid; 276 domain = _domain; 277 278 /* 279 * Generate the message file output (insure output flag is enabled). 
280 */ 281 if (prtmsgs != -1) 282 prtmsgs = 1; 283 if (fdmsgs && (prtmsgs == 1)) { 284 if (cflag == 1) { 285 if (fprintf(fdmsgs, "$quote \"\n$set %s\n", 286 setid) < 0) { 287 (void) fprintf(stderr, Errmsg_wrte, flmsgs, 288 strerror(errno)); 289 return (1); 290 } 291 } else { 292 if (fprintf(fdmsgs, "domain\t\"%s\"\n", domain) < 0) { 293 (void) fprintf(stderr, Errmsg_wrte, flmsgs, 294 strerror(errno)); 295 return (1); 296 } 297 } 298 } 299 300 /* 301 * For catgets(3c) output generate a setid definition in the message 302 * definition file. 303 */ 304 if (fddefs && (cflag == 1) && 305 (fprintf(fddefs, "#define\t%s\t%s\n\n", mesgid, setid) < 0)) { 306 (void) fprintf(stderr, Errmsg_wrte, fldefs, strerror(errno)); 307 return (1); 308 } 309 310 return (0); 311 } 312 313 /* 314 * Dump contents of String Table to standard out 315 */ 316 static void 317 dump_stringtab(Str_tbl *stp) 318 { 319 uint_t cnt; 320 321 if ((stp->st_flags & FLG_STTAB_COMPRESS) == 0) { 322 (void) printf("string table full size: %ld: uncompressed\n", 323 stp->st_fullstrsize); 324 return; 325 } 326 327 (void) printf("string table full size: %ld compressed down to: %ld\n\n", 328 stp->st_fullstrsize, stp->st_strsize); 329 (void) printf("string table compression information [%d buckets]:\n", 330 stp->st_hbckcnt); 331 332 for (cnt = 0; cnt < stp->st_hbckcnt; cnt++) { 333 Str_hash *sthash = stp->st_hashbcks[cnt]; 334 335 if (sthash == 0) 336 continue; 337 338 (void) printf(" bucket: [%d]\n", cnt); 339 340 while (sthash) { 341 size_t stroff = sthash->hi_mstr->sm_strlen - 342 sthash->hi_strlen; 343 344 if (stroff == 0) { 345 (void) printf(" [%ld]: '%s' <master>\n", 346 sthash->hi_refcnt, sthash->hi_mstr->sm_str); 347 } else { 348 (void) printf(" [%ld]: '%s' <suffix of: " 349 "'%s'>\n", sthash->hi_refcnt, 350 &sthash->hi_mstr->sm_str[stroff], 351 sthash->hi_mstr->sm_str); 352 } 353 sthash = sthash->hi_next; 354 } 355 } 356 } 357 358 /* 359 * Initialize the message definition header file stream. 
360 */ 361 static int 362 init_defs(void) 363 { 364 static char guard[FILENAME_MAX + 6]; 365 char *optr; 366 const char *iptr, *_ptr; 367 368 /* 369 * Establish a header guard name using the files basename. 370 */ 371 for (iptr = 0, _ptr = fldefs; _ptr && (*_ptr != '\0'); _ptr++) { 372 if (*_ptr == '/') 373 iptr = _ptr + 1; 374 } 375 if (iptr == 0) 376 iptr = fldefs; 377 378 optr = guard; 379 for (*optr++ = '_'; iptr && (*iptr != '\0'); iptr++, optr++) { 380 if (*iptr == '.') { 381 *optr++ = '_'; 382 *optr++ = 'D'; 383 *optr++ = 'O'; 384 *optr++ = 'T'; 385 *optr = '_'; 386 } else 387 *optr = toupper(*iptr); 388 } 389 390 if (fprintf(fddefs, "#ifndef\t%s\n#define\t%s\n\n", guard, guard) < 0) { 391 (void) fprintf(stderr, Errmsg_wrte, fldefs, strerror(errno)); 392 return (1); 393 } 394 395 if (fprintf(fddefs, "#include <sgsmsg.h>\t/* Msg typedef */\n\n") < 0) { 396 (void) fprintf(stderr, Errmsg_wrte, fldefs, strerror(errno)); 397 return (1); 398 } 399 400 if (fprintf(fddefs, "#ifndef\t__lint\n\n") < 0) { 401 (void) fprintf(stderr, Errmsg_wrte, fldefs, strerror(errno)); 402 return (1); 403 } 404 405 /* 406 * The MSG_SGS_ARRAY_NAME macro supplies a generic way to 407 * reference the string table regardless of its name. 408 */ 409 if (fprintf(fddefs, "#define\tMSG_SGS_LOCAL_ARRAY\t__%s\n\n", 410 interface) < 0) { 411 (void) fprintf(stderr, Errmsg_wrte, fldefs, strerror(errno)); 412 return (1); 413 } 414 415 /* 416 * If the associated data array is global define a prototype. 417 * Define a macro to access the array elements. 
418 */ 419 if (lflag == 0) { 420 if (fprintf(fddefs, "extern\tconst char\t__%s[];\n\n", 421 interface) < 0) { 422 (void) fprintf(stderr, Errmsg_wrte, fldefs, 423 strerror(errno)); 424 return (1); 425 } 426 } 427 if (fprintf(fddefs, 428 "#define\tMSG_ORIG_STRTAB(_x, _s)\t&_s[_x]\n\n") < 0) { 429 (void) fprintf(stderr, Errmsg_wrte, fldefs, strerror(errno)); 430 return (1); 431 } 432 if (fprintf(fddefs, 433 "#define\tMSG_ORIG(x)\tMSG_ORIG_STRTAB(x, __%s)\n\n", 434 interface) < 0) { 435 (void) fprintf(stderr, Errmsg_wrte, fldefs, strerror(errno)); 436 return (1); 437 } 438 439 /* 440 * Generate a prototype to access the associated data array. 441 */ 442 if (fprintf(fddefs, "extern\tconst char *\t_%s(Msg);\n\n", 443 interface) < 0) { 444 (void) fprintf(stderr, Errmsg_wrte, fldefs, strerror(errno)); 445 return (1); 446 } 447 if (fprintf(fddefs, "#define\tMSG_INTL(x)\t_%s(x)\n\n", 448 interface) < 0) { 449 (void) fprintf(stderr, Errmsg_wrte, fldefs, strerror(errno)); 450 return (1); 451 } 452 453 return (0); 454 } 455 456 457 /* 458 * Finish the message definition header file. 
459 */ 460 static int 461 fini_defs(void) 462 { 463 if (fprintf(fddefs, "\n#else\t/* __lint */\n\n") < 0) { 464 (void) fprintf(stderr, Errmsg_wrte, fldefs, strerror(errno)); 465 return (1); 466 } 467 468 if (fprintf(fddefs, "extern\tconst char *\t_%s(Msg);\n\n", 469 interface) < 0) { 470 (void) fprintf(stderr, Errmsg_wrte, fldefs, strerror(errno)); 471 return (1); 472 } 473 474 if (fprintf(fddefs, "#ifndef MSG_SGS_LOCAL_ARRAY\n" 475 "#define\tMSG_SGS_LOCAL_ARRAY\t\"\"\n#endif\n\n") < 0) { 476 (void) fprintf(stderr, Errmsg_wrte, fldefs, strerror(errno)); 477 return (1); 478 } 479 480 if (lflag == 0) { 481 if (fprintf(fddefs, "extern\tconst char\t__%s[];\n\n", 482 interface) < 0) { 483 (void) fprintf(stderr, Errmsg_wrte, fldefs, 484 strerror(errno)); 485 return (1); 486 } 487 } 488 489 if (fprintf(fddefs, 490 "#define MSG_ORIG_STRTAB(_x, _s)\t_x\n" 491 "#define MSG_ORIG(x)\tx\n#define MSG_INTL(x)\tx\n") < 0) { 492 (void) fprintf(stderr, Errmsg_wrte, fldefs, strerror(errno)); 493 return (1); 494 } 495 496 /* 497 * Provide a way to get the array and function declarations above 498 * without also getting the actual messages. This is useful in 499 * our lintsup.c files that include more than one message header. 500 * lintsup doesn't need the actual messages, and this prevents 501 * macro name collisions. 502 */ 503 if (fprintf(fddefs, "\n#ifndef LINTSUP_SUPPRESS_STRINGS\n") < 0) { 504 (void) fprintf(stderr, Errmsg_wrte, fldefs, strerror(errno)); 505 return (1); 506 } 507 508 /* 509 * Copy the temporary lint defs file into the new header. 
510 */ 511 if (fdlint) { 512 long size; 513 char *buf; 514 515 size = ftell(fdlint); 516 (void) rewind(fdlint); 517 518 if ((buf = malloc(size)) == 0) { 519 (void) fprintf(stderr, Errmsg_nmem, strerror(errno)); 520 return (1); 521 } 522 if (fread(buf, size, 1, fdlint) == 0) { 523 (void) fprintf(stderr, Errmsg_read, fllint, 524 strerror(errno)); 525 return (1); 526 } 527 if (fwrite(buf, size, 1, fddefs) == 0) { 528 (void) fprintf(stderr, Errmsg_wrte, fldefs, 529 strerror(errno)); 530 return (1); 531 } 532 (void) free(buf); 533 } 534 535 if (fprintf(fddefs, "\n#endif\t/* LINTSUP_SUPPRESS_STRINGS */\n") < 0) { 536 (void) fprintf(stderr, Errmsg_wrte, fldefs, strerror(errno)); 537 return (1); 538 } 539 540 if (fprintf(fddefs, "\n#endif\t/* __lint */\n") < 0) { 541 (void) fprintf(stderr, Errmsg_wrte, fldefs, strerror(errno)); 542 return (1); 543 } 544 545 if (fprintf(fddefs, "\n#endif\n") < 0) { 546 (void) fprintf(stderr, Errmsg_wrte, fldefs, strerror(errno)); 547 return (1); 548 } 549 550 return (0); 551 } 552 553 /* 554 * The entire messaging file has been scanned - and all strings have been 555 * inserted into the string_table. We can now walk the message queue 556 * and create the '#define <DEFN>' for each string - with the strings 557 * assigned offset into the string_table. 
558 */ 559 static int 560 output_defs(void) 561 { 562 msg_string *msg; 563 size_t stbufsize; 564 char *stbuf; 565 566 stbufsize = st_getstrtab_sz(stp); 567 if ((stbuf = malloc(stbufsize)) == 0) { 568 (void) fprintf(stderr, Errmsg_nmem, strerror(errno)); 569 exit(1); 570 } 571 (void) st_setstrbuf(stp, stbuf, stbufsize); 572 for (msg = msg_head; msg; msg = msg->ms_next) { 573 size_t stoff; 574 if ((st_setstring(stp, msg->ms_message, &stoff)) == -1) { 575 (void) fprintf(stderr, Errmsg_mnfn, msg->ms_message); 576 return (1); 577 } 578 if (fprintf(fddefs, "\n#define\t%s\t%ld\n", 579 msg->ms_defn, stoff) < 0) { 580 (void) fprintf(stderr, Errmsg_wrte, 581 fldefs, strerror(errno)); 582 return (1); 583 } 584 if (fddefs && fprintf(fddefs, "#define\t%s_SIZE\t%d\n", 585 msg->ms_defn, strlen(msg->ms_message)) < 0) { 586 (void) fprintf(stderr, Errmsg_wrte, 587 fldefs, strerror(errno)); 588 return (1); 589 } 590 } 591 return (0); 592 } 593 594 595 /* 596 * Finish off the data structure definition. 597 */ 598 static int 599 output_data(void) 600 { 601 size_t stbufsize; 602 size_t ndx; 603 size_t column = 1; 604 const char *stbuf; 605 const char *fmtstr; 606 607 stbufsize = st_getstrtab_sz(stp); 608 stbuf = st_getstrbuf(stp); 609 610 assert(stbuf); 611 612 /* 613 * Determine from the local flag whether the data declaration should 614 * be static. 
615 */ 616 if (lflag) 617 fmtstr = (const char *)"static const"; 618 else 619 fmtstr = (const char *)"const"; 620 621 if (fprintf(fddata, "\n%s char __%s[%ld] = { ", 622 fmtstr, interface, stbufsize) < 0) { 623 (void) fprintf(stderr, Errmsg_wrte, fldata, strerror(errno)); 624 return (1); 625 } 626 627 for (ndx = 0; ndx < (stbufsize - 1); ndx++) { 628 if (column == 1) { 629 if (fddata && fprintf(fddata, 630 "\n/* %4ld */ 0x%.2x,", ndx, 631 (unsigned char)stbuf[ndx]) < 0) { 632 (void) fprintf(stderr, Errmsg_wrte, 633 fldata, strerror(errno)); 634 return (1); 635 } 636 } else { 637 if (fddata && fprintf(fddata, " 0x%.2x,", 638 (unsigned char)stbuf[ndx]) < 0) { 639 (void) fprintf(stderr, Errmsg_wrte, 640 fldata, strerror(errno)); 641 return (1); 642 } 643 } 644 645 if (column++ == 10) 646 column = 1; 647 } 648 649 if (column == 1) 650 fmtstr = "\n\t0x%.2x };\n"; 651 else 652 fmtstr = " 0x%.2x };\n"; 653 654 if (fprintf(fddata, fmtstr, (unsigned char)stbuf[stbufsize - 1]) < 0) { 655 (void) fprintf(stderr, Errmsg_wrte, fldata, strerror(errno)); 656 return (1); 657 } 658 659 return (0); 660 } 661 662 static int 663 file() 664 { 665 char buffer[LINE_MAX], * token; 666 uint_t bufsize; 667 char *token_buffer; 668 int escape = 0; 669 670 if ((token_buffer = malloc(LINE_MAX)) == 0) { 671 (void) fprintf(stderr, Errmsg_nmem, strerror(errno)); 672 return (1); 673 } 674 bufsize = LINE_MAX; 675 676 line = 1; 677 678 while ((token = fgets(buffer, LINE_MAX, fddesc)) != NULL) { 679 char defn[PATH_MAX], * _defn, * str; 680 int len; 681 682 switch (*token) { 683 case '#': 684 case '$': 685 if (escape) { 686 (void) fprintf(stderr, Errmsg_malt, fldesc, 687 line); 688 return (1); 689 } 690 691 /* 692 * If a msgid has been output a msgstr must follow 693 * before we digest the new token. A msgid is only set 694 * if fdmsgs is in use. 
695 */ 696 if (msgid) { 697 msgid = 0; 698 if (fprintf(fdmsgs, "msgstr\t\"\"\n") < 0) { 699 (void) fprintf(stderr, Errmsg_wrte, 700 flmsgs, strerror(errno)); 701 return (1); 702 } 703 } 704 705 /* 706 * Pass lines directly through to the output message 707 * file. 708 */ 709 if (fdmsgs && (prtmsgs == 1)) { 710 char comment; 711 712 if (cflag == 0) 713 comment = '#'; 714 else 715 comment = '$'; 716 717 if (fprintf(fdmsgs, "%c%s", comment, 718 ++token) < 0) { 719 (void) fprintf(stderr, Errmsg_wrte, 720 flmsgs, strerror(errno)); 721 return (1); 722 } 723 } 724 break; 725 726 case '@': 727 if (escape) { 728 (void) fprintf(stderr, Errmsg_malt, fldesc, 729 line); 730 return (1); 731 } 732 733 /* 734 * If a msgid has been output a msgstr must follow 735 * before we digest the new token. 736 */ 737 if (msgid) { 738 msgid = 0; 739 if (fprintf(fdmsgs, "msgstr\t\"\"\n") < 0) { 740 (void) fprintf(stderr, Errmsg_wrte, 741 flmsgs, strerror(errno)); 742 return (1); 743 } 744 } 745 746 /* 747 * Determine whether we have one or more tokens. 748 */ 749 token++; 750 while (isspace(*token)) /* rid any whitespace */ 751 token++; 752 _defn = token; /* definition start */ 753 while (!(isspace(*token))) 754 token++; 755 *token++ = 0; 756 757 while (isspace(*token)) /* rid any whitespace */ 758 token++; 759 760 /* 761 * Determine whether the single token is one of the 762 * reserved message output delimiters otherwise 763 * translate it as a message identifier. 764 */ 765 if (*token == 0) { 766 if (strcmp(_defn, start) == 0) 767 prtmsgs = 1; 768 else if (strcmp(_defn, end) == 0) 769 prtmsgs = -1; 770 else if (getmesgid(_defn) == 1) 771 return (1); 772 break; 773 } 774 775 /* 776 * Multiple tokens are translated by taking the first 777 * token as the message definition, and the rest of the 778 * line as the message itself. A message line ending 779 * with an escape ('\') is expected to be continued on 780 * the next line. 
781 */ 782 if (prtmsgs != -1) 783 prtmsgs = 1; 784 if (fdmsgs && (prtmsgs == 1)) { 785 /* 786 * For catgets(3c) make sure a message 787 * identifier has been established (this is 788 * normally a domain for gettext(3i), but for 789 * sgsmsg use this could be argued as being 790 * redundent). Also make sure that the message 791 * definitions haven't exceeeded the maximum 792 * value allowed by gencat(1) before generating 793 * any message file entries. 794 */ 795 if (cflag == 1) { 796 if (setid == 0) { 797 (void) fprintf(stderr, "file " 798 "%s: no message identifier " 799 "has been established\n", 800 fldesc); 801 return (1); 802 } 803 if (ptr > NL_MSGMAX) { 804 (void) fprintf(stderr, "file " 805 "%s: message definition " 806 "(%d) exceeds allowable " 807 "limit (NL_MSGMAX)\n", 808 fldesc, ptr); 809 return (1); 810 } 811 } 812 813 /* 814 * For catgets(3c) write the definition and the 815 * message string to the message file. For 816 * gettext(3i) write the message string as a 817 * mesgid - indicate a mesgid has been output 818 * so that a msgstr can follow. 819 */ 820 if (cflag == 1) { 821 if (fprintf(fdmsgs, "%d\t%s", ptr, 822 token) < 0) { 823 (void) fprintf(stderr, 824 Errmsg_wrte, flmsgs, 825 strerror(errno)); 826 return (1); 827 } 828 } else { 829 if (fprintf(fdmsgs, "msgid\t\"") < 0) { 830 (void) fprintf(stderr, 831 Errmsg_wrte, flmsgs, 832 strerror(errno)); 833 return (1); 834 } 835 msgid = 1; 836 } 837 } 838 839 /* 840 * The message itself is a quoted string as this makes 841 * embedding spaces at the start (or the end) of the 842 * string very easy. 843 */ 844 if (*token != '"') { 845 (void) fprintf(stderr, Errmsg_malt, fldesc, 846 line); 847 return (1); 848 } 849 850 (void) strcpy(defn, _defn); 851 852 /* 853 * Write the tag to the lint definitions. 
854 */ 855 if (fdlint) { 856 if (fprintf(fdlint, "\n#define\t%s\t", 857 _defn) < 0) { 858 (void) fprintf(stderr, Errmsg_wrte, 859 fllint, strerror(errno)); 860 return (1); 861 } 862 } 863 864 len = 0; 865 866 /* 867 * Write each character of the message string to the 868 * data array. Translate any escaped characters - use 869 * the same specially recognized characters as defined 870 * by gencat(1). 871 */ 872 message: 873 if (*token == '"') { 874 if (fdlint && 875 (fprintf(fdlint, "%c", *token) < 0)) { 876 (void) fprintf(stderr, Errmsg_wrte, 877 fllint, strerror(errno)); 878 return (1); 879 } 880 token++; 881 } 882 while (*token) { 883 char _token; 884 885 if ((*token == '\\') && (escape == 0)) { 886 escape = 1; 887 if (fdlint && (*(token + 1) != '\n') && 888 fprintf(fdlint, "%c", *token) < 0) { 889 (void) fprintf(stderr, 890 Errmsg_wrte, fllint, 891 strerror(errno)); 892 return (1); 893 } 894 token++; 895 continue; 896 } 897 if (escape) { 898 if (*token == 'n') 899 _token = '\n'; 900 else if (*token == 't') 901 _token = '\t'; 902 else if (*token == 'v') 903 _token = '\v'; 904 else if (*token == 'b') 905 _token = '\b'; 906 else if (*token == 'f') 907 _token = '\f'; 908 else if (*token == '\\') 909 _token = '\\'; 910 else if (*token == '"') 911 _token = '"'; 912 else if (*token == '\n') 913 break; 914 else 915 _token = *token; 916 917 if (fdmsgs && (prtmsgs == 1) && 918 (fprintf(fdmsgs, "\\") < 0)) { 919 (void) fprintf(stderr, 920 Errmsg_wrte, flmsgs, 921 strerror(errno)); 922 return (1); 923 } 924 } else { 925 /* 926 * If this is the trailing quote then 927 * thats the last of the message string. 928 * Eat up any remaining white space and 929 * unless an escape character is found 930 * terminate the data string with a 0. 
931 */ 932 /* BEGIN CSTYLED */ 933 if (*token == '"') { 934 if (fdlint && (fprintf(fdlint, 935 "%c", *token) < 0)) { 936 (void) fprintf(stderr, 937 Errmsg_wrte, fllint, 938 strerror(errno)); 939 return (1); 940 } 941 942 if (fdmsgs && (prtmsgs == 1) && 943 (fprintf(fdmsgs, "%c", 944 *token) < 0)) { 945 (void) fprintf(stderr, 946 Errmsg_wrte, flmsgs, 947 strerror(errno)); 948 return (1); 949 } 950 951 while (*++token) { 952 if (*token == '\n') 953 break; 954 } 955 _token = '\0'; 956 } else 957 _token = *token; 958 /* END CSTYLED */ 959 } 960 961 if (fdmsgs && (prtmsgs == 1) && 962 (fprintf(fdmsgs, "%c", *token) < 0)) { 963 (void) fprintf(stderr, Errmsg_wrte, 964 flmsgs, strerror(errno)); 965 return (1); 966 } 967 968 if (fdlint && fprintf(fdlint, 969 "%c", *token) < 0) { 970 (void) fprintf(stderr, Errmsg_wrte, 971 fllint, strerror(errno)); 972 return (1); 973 } 974 975 if (len >= bufsize) { 976 bufsize += LINE_MAX; 977 if ((token_buffer = realloc( 978 token_buffer, bufsize)) == 0) { 979 (void) fprintf(stderr, 980 Errmsg_nmem, 981 strerror(errno)); 982 return (1); 983 } 984 } 985 token_buffer[len] = _token; 986 ptr++, token++, len++; 987 escape = 0; 988 989 if (_token == '\0') 990 break; 991 } 992 993 /* 994 * After the complete message string has been processed 995 * (including its continuation beyond one line), create 996 * a string size definition. 997 */ 998 if (escape == 0) { 999 const char *form = "#define\t%s_SIZE\t%d\n"; 1000 1001 token_buffer[len] = '\0'; 1002 1003 message_append(defn, token_buffer); 1004 1005 if (fdlint && fprintf(fdlint, form, defn, 1006 (len - 1)) < 0) { 1007 (void) fprintf(stderr, Errmsg_wrte, 1008 fllint, strerror(errno)); 1009 return (1); 1010 } 1011 } 1012 break; 1013 1014 default: 1015 /* 1016 * Empty lines are passed through to the message file. 
1017 */ 1018 while (isspace(*token)) 1019 token++; 1020 1021 if (*token == 0) { 1022 if (msgid || (fdmsgs && (prtmsgs == 1))) { 1023 /* 1024 * If a msgid has been output a msgstr 1025 * must follow before we digest the new 1026 * token. 1027 */ 1028 if (msgid) { 1029 msgid = 0; 1030 str = "msgstr\t\"\"\n\n"; 1031 } else 1032 str = "\n"; 1033 1034 if (fprintf(fdmsgs, str) < 0) { 1035 (void) fprintf(stderr, 1036 Errmsg_wrte, flmsgs, 1037 strerror(errno)); 1038 return (1); 1039 } 1040 } 1041 break; 1042 } 1043 1044 /* 1045 * If an escape is in effect then any tokens are taken 1046 * to be message continuations. 1047 */ 1048 if (escape) { 1049 escape = 0; 1050 goto message; 1051 } 1052 1053 (void) fprintf(stderr, "file %s: line %d: invalid " 1054 "input does not start with #, $ or @\n", fldesc, 1055 line); 1056 return (1); 1057 } 1058 line++; 1059 } 1060 1061 free(token_buffer); 1062 1063 return (0); 1064 } 1065 1066 int 1067 main(int argc, char ** argv) 1068 { 1069 opterr = 0; 1070 while ((line = getopt(argc, argv, "cd:h:lm:n:i:v")) != EOF) { 1071 switch (line) { 1072 case 'c': /* catgets instead of gettext */ 1073 cflag = 1; 1074 break; 1075 case 'd': /* new message data filename */ 1076 fldata = optarg; /* (msg.c is default) */ 1077 break; 1078 case 'h': /* new message defs filename */ 1079 fldefs = optarg; /* (msg.h is default) */ 1080 break; 1081 case 'i': /* input message ids from */ 1082 flmids = optarg; /* from this file */ 1083 break; 1084 case 'l': /* define message data arrays */ 1085 lflag = 1; /* to be local (static) */ 1086 break; 1087 case 'm': /* generate message database */ 1088 flmsgs = optarg; /* to this file */ 1089 break; 1090 case 'n': /* new data array and func */ 1091 interface = optarg; /* name (msg is default) */ 1092 break; 1093 case 'v': 1094 vflag = 1; /* set verbose flag */ 1095 break; 1096 case '?': 1097 (void) fprintf(stderr, Errmsg_use, argv[0]); 1098 exit(1); 1099 default: 1100 break; 1101 } 1102 } 1103 1104 /* 1105 * Validate the we 
have been given at least one input file. 1106 */ 1107 if ((argc - optind) < 1) { 1108 (void) fprintf(stderr, Errmsg_use); 1109 exit(1); 1110 } 1111 1112 /* 1113 * Open all the required output files. 1114 */ 1115 if (fldefs) { 1116 if ((fddefs = fopen(fldefs, "w+")) == NULL) { 1117 (void) fprintf(stderr, Errmsg_opne, fldefs, 1118 strerror(errno)); 1119 return (1); 1120 } 1121 } 1122 if (fldata) { 1123 if (fldefs && (strcmp(fldefs, fldata) == 0)) 1124 fddata = fddefs; 1125 else if ((fddata = fopen(fldata, "w+")) == NULL) { 1126 (void) fprintf(stderr, Errmsg_opne, fldata, 1127 strerror(errno)); 1128 return (1); 1129 } 1130 } 1131 if (fddefs && fddata) { 1132 (void) sprintf(fllint, "%s.%d", nmlint, (int)getpid()); 1133 if ((fdlint = fopen(fllint, "w+")) == NULL) { 1134 (void) fprintf(stderr, Errmsg_opne, fllint, 1135 strerror(errno)); 1136 return (1); 1137 } 1138 } 1139 if (flmsgs) { 1140 if ((fdmsgs = fopen(flmsgs, "w+")) == NULL) { 1141 (void) fprintf(stderr, Errmsg_opne, flmsgs, 1142 strerror(errno)); 1143 return (1); 1144 } 1145 } 1146 if (flmids) { 1147 if ((fdmids = fopen(flmids, "r")) == NULL) { 1148 (void) fprintf(stderr, Errmsg_opne, flmids, 1149 strerror(errno)); 1150 return (1); 1151 } 1152 } 1153 1154 1155 /* 1156 * Initialize the message definition and message data streams. 1157 */ 1158 if (fddefs) { 1159 if (init_defs()) 1160 return (1); 1161 } 1162 1163 /* 1164 * Read the input message file, and for each line process accordingly. 1165 */ 1166 for (; optind < argc; optind++) { 1167 int err; 1168 1169 fldesc = argv[optind]; 1170 1171 if ((fddesc = fopen(fldesc, "r")) == NULL) { 1172 (void) fprintf(stderr, Errmsg_opne, fldesc, 1173 strerror(errno)); 1174 return (1); 1175 } 1176 err = file(); 1177 (void) fclose(fddesc); 1178 1179 if (err != 0) 1180 return (1); 1181 } 1182 1183 /* 1184 * If a msgid has been output a msgstr must follow before we end the 1185 * file. 
1186 */ 1187 if (msgid) { 1188 msgid = 0; 1189 if (fprintf(fdmsgs, "msgstr\t\"\"\n") < 0) { 1190 (void) fprintf(stderr, Errmsg_wrte, flmsgs, 1191 strerror(errno)); 1192 return (1); 1193 } 1194 } 1195 1196 if (fdmids) 1197 (void) fclose(fdmids); 1198 if (fdmsgs) 1199 (void) fclose(fdmsgs); 1200 1201 if (fddefs) { 1202 if (output_defs()) 1203 return (1); 1204 } 1205 1206 /* 1207 * Finish off any generated data and header file. 1208 */ 1209 if (fldata) { 1210 if (output_data()) 1211 return (1); 1212 } 1213 if (fddefs) { 1214 if (fini_defs()) 1215 return (1); 1216 } 1217 1218 if (vflag) 1219 dump_stringtab(stp); 1220 1221 /* 1222 * Close up everything and go home. 1223 */ 1224 if (fddata) 1225 (void) fclose(fddata); 1226 if (fddefs && (fddefs != fddata)) 1227 (void) fclose(fddefs); 1228 if (fddefs && fddata) { 1229 (void) fclose(fdlint); 1230 (void) unlink(fllint); 1231 } 1232 1233 if (stp) 1234 st_destroy(stp); 1235 1236 return (0); 1237 } 1238