17c478bd9Sstevel@tonic-gate /* 27c478bd9Sstevel@tonic-gate * CDDL HEADER START 37c478bd9Sstevel@tonic-gate * 47c478bd9Sstevel@tonic-gate * The contents of this file are subject to the terms of the 57c478bd9Sstevel@tonic-gate * Common Development and Distribution License, Version 1.0 only 67c478bd9Sstevel@tonic-gate * (the "License"). You may not use this file except in compliance 77c478bd9Sstevel@tonic-gate * with the License. 87c478bd9Sstevel@tonic-gate * 97c478bd9Sstevel@tonic-gate * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 107c478bd9Sstevel@tonic-gate * or http://www.opensolaris.org/os/licensing. 117c478bd9Sstevel@tonic-gate * See the License for the specific language governing permissions 127c478bd9Sstevel@tonic-gate * and limitations under the License. 137c478bd9Sstevel@tonic-gate * 147c478bd9Sstevel@tonic-gate * When distributing Covered Code, include this CDDL HEADER in each 157c478bd9Sstevel@tonic-gate * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 167c478bd9Sstevel@tonic-gate * If applicable, add the following below this CDDL HEADER, with the 177c478bd9Sstevel@tonic-gate * fields enclosed by brackets "[]" replaced with your own identifying 187c478bd9Sstevel@tonic-gate * information: Portions Copyright [yyyy] [name of copyright owner] 197c478bd9Sstevel@tonic-gate * 207c478bd9Sstevel@tonic-gate * CDDL HEADER END 217c478bd9Sstevel@tonic-gate */ 22*0d8b5334Sceastha /* 23*0d8b5334Sceastha * Copyright 2005 Sun Microsystems, Inc. All rights reserved. 24*0d8b5334Sceastha * Use is subject to license terms. 25*0d8b5334Sceastha */ 26*0d8b5334Sceastha 277c478bd9Sstevel@tonic-gate /* Copyright (c) 1984, 1986, 1987, 1988, 1989 AT&T */ 287c478bd9Sstevel@tonic-gate /* All Rights Reserved */ 297c478bd9Sstevel@tonic-gate 307c478bd9Sstevel@tonic-gate 31*0d8b5334Sceastha #pragma ident "%Z%%M% %I% %E% SMI" 32*0d8b5334Sceastha 337c478bd9Sstevel@tonic-gate #include <unistd.h> 347c478bd9Sstevel@tonic-gate #include <stdlib.h> 357c478bd9Sstevel@tonic-gate #include <stdio.h> 367c478bd9Sstevel@tonic-gate #include <locale.h> 377c478bd9Sstevel@tonic-gate #include "hash.h" 387c478bd9Sstevel@tonic-gate #include "huff.h" 397c478bd9Sstevel@tonic-gate 407c478bd9Sstevel@tonic-gate int encode(long, long *); 417c478bd9Sstevel@tonic-gate 427c478bd9Sstevel@tonic-gate #define S (BYTE * sizeof (long)) 437c478bd9Sstevel@tonic-gate #define B (BYTE * sizeof (unsigned)) 447c478bd9Sstevel@tonic-gate unsigned *table; 457c478bd9Sstevel@tonic-gate int hindex[NI]; 467c478bd9Sstevel@tonic-gate unsigned wp; /* word pointer */ 477c478bd9Sstevel@tonic-gate int bp = B; /* bit pointer */ 487c478bd9Sstevel@tonic-gate static int ignore; 497c478bd9Sstevel@tonic-gate static int extra; 507c478bd9Sstevel@tonic-gate 517c478bd9Sstevel@tonic-gate static int 527c478bd9Sstevel@tonic-gate append(register unsigned w1, register int i) 537c478bd9Sstevel@tonic-gate { 547c478bd9Sstevel@tonic-gate while (wp < ND - 1) { 557c478bd9Sstevel@tonic-gate table[wp] |= w1>>(B-bp); 567c478bd9Sstevel@tonic-gate i -= bp; 577c478bd9Sstevel@tonic-gate if (i < 0) { 587c478bd9Sstevel@tonic-gate bp = -i; 597c478bd9Sstevel@tonic-gate return (1); 607c478bd9Sstevel@tonic-gate } 617c478bd9Sstevel@tonic-gate w1 <<= bp; 627c478bd9Sstevel@tonic-gate bp = B; 637c478bd9Sstevel@tonic-gate wp++; 647c478bd9Sstevel@tonic-gate } 657c478bd9Sstevel@tonic-gate return (0); 667c478bd9Sstevel@tonic-gate } 677c478bd9Sstevel@tonic-gate 687c478bd9Sstevel@tonic-gate 697c478bd9Sstevel@tonic-gate /* 707c478bd9Sstevel@tonic-gate * usage: hashin N 717c478bd9Sstevel@tonic-gate * where N is number of words in dictionary 727c478bd9Sstevel@tonic-gate * and standard input contains sorted, unique 737c478bd9Sstevel@tonic-gate * hashed words in octal 747c478bd9Sstevel@tonic-gate */ 757c478bd9Sstevel@tonic-gate 76*0d8b5334Sceastha int 777c478bd9Sstevel@tonic-gate main(int argc, char **argv) 787c478bd9Sstevel@tonic-gate { 797c478bd9Sstevel@tonic-gate long h, k, d; 807c478bd9Sstevel@tonic-gate int i; 817c478bd9Sstevel@tonic-gate long count; 827c478bd9Sstevel@tonic-gate long w1; 837c478bd9Sstevel@tonic-gate long x; 847c478bd9Sstevel@tonic-gate int t, u; 857c478bd9Sstevel@tonic-gate double z; 867c478bd9Sstevel@tonic-gate 877c478bd9Sstevel@tonic-gate /* Set locale environment variables local definitions */ 887c478bd9Sstevel@tonic-gate (void) setlocale(LC_ALL, ""); 897c478bd9Sstevel@tonic-gate #if !defined(TEXT_DOMAIN) /* Should be defined by cc -D */ 907c478bd9Sstevel@tonic-gate #define TEXT_DOMAIN "SYS_TEST" /* Use this only if it wasn't */ 917c478bd9Sstevel@tonic-gate #endif 927c478bd9Sstevel@tonic-gate (void) textdomain(TEXT_DOMAIN); 937c478bd9Sstevel@tonic-gate 947c478bd9Sstevel@tonic-gate k = 0; 957c478bd9Sstevel@tonic-gate u = 0; 967c478bd9Sstevel@tonic-gate if (argc != 2) { 977c478bd9Sstevel@tonic-gate (void) fprintf(stderr, gettext("%s: arg count\n"), argv[0]); 987c478bd9Sstevel@tonic-gate exit(1); 997c478bd9Sstevel@tonic-gate } 1007c478bd9Sstevel@tonic-gate table = (unsigned *)malloc(ND * sizeof (*table)); 1017c478bd9Sstevel@tonic-gate if (table == 0) { 1027c478bd9Sstevel@tonic-gate (void) fprintf(stderr, gettext("%s: no space for table\n"), 1037c478bd9Sstevel@tonic-gate argv[0]); 1047c478bd9Sstevel@tonic-gate exit(1); 1057c478bd9Sstevel@tonic-gate } 1067c478bd9Sstevel@tonic-gate if ((atof(argv[1])) == 0.0) { 1077c478bd9Sstevel@tonic-gate (void) fprintf(stderr, gettext("%s: illegal count"), argv[0]); 1087c478bd9Sstevel@tonic-gate exit(1); 1097c478bd9Sstevel@tonic-gate } 1107c478bd9Sstevel@tonic-gate 1117c478bd9Sstevel@tonic-gate z = huff((1L<<HASHWIDTH)/atof(argv[1])); 1127c478bd9Sstevel@tonic-gate (void) fprintf(stderr, gettext("%s: expected code widths = %f\n"), 1137c478bd9Sstevel@tonic-gate argv[0], z); 1147c478bd9Sstevel@tonic-gate for (count = 0; scanf("%lo", (unsigned long *)&h) == 1; ++count) { 1157c478bd9Sstevel@tonic-gate if ((t = h >> (HASHWIDTH - INDEXWIDTH)) != u) { 1167c478bd9Sstevel@tonic-gate if (bp != B) 1177c478bd9Sstevel@tonic-gate wp++; 1187c478bd9Sstevel@tonic-gate bp = B; 1197c478bd9Sstevel@tonic-gate while (u < t) 1207c478bd9Sstevel@tonic-gate hindex[++u] = wp; 1217c478bd9Sstevel@tonic-gate k = (long)t<<(HASHWIDTH-INDEXWIDTH); 1227c478bd9Sstevel@tonic-gate } 1237c478bd9Sstevel@tonic-gate d = h-k; 1247c478bd9Sstevel@tonic-gate k = h; 1257c478bd9Sstevel@tonic-gate for (;;) { 1267c478bd9Sstevel@tonic-gate for (x = d; ; x /= 2) { 1277c478bd9Sstevel@tonic-gate i = encode(x, &w1); 1287c478bd9Sstevel@tonic-gate if (i > 0) 1297c478bd9Sstevel@tonic-gate break; 1307c478bd9Sstevel@tonic-gate } 1317c478bd9Sstevel@tonic-gate if (i > B) { 1327c478bd9Sstevel@tonic-gate if (!(append((unsigned)(w1>>(long) (i-B)), B) && 1337c478bd9Sstevel@tonic-gate append((unsigned)(w1<<(long) (B+B-i)), 1347c478bd9Sstevel@tonic-gate i-B))) 1357c478bd9Sstevel@tonic-gate ignore++; 1367c478bd9Sstevel@tonic-gate } else 1377c478bd9Sstevel@tonic-gate if (!append((unsigned)(w1<<(long)(B-i)), i)) 1387c478bd9Sstevel@tonic-gate ignore++; 1397c478bd9Sstevel@tonic-gate d -= x; 1407c478bd9Sstevel@tonic-gate if (d > 0) 1417c478bd9Sstevel@tonic-gate extra++; 1427c478bd9Sstevel@tonic-gate else 1437c478bd9Sstevel@tonic-gate break; 1447c478bd9Sstevel@tonic-gate } 1457c478bd9Sstevel@tonic-gate } 1467c478bd9Sstevel@tonic-gate if (bp != B) 1477c478bd9Sstevel@tonic-gate wp++; 1487c478bd9Sstevel@tonic-gate while (++u < NI) 1497c478bd9Sstevel@tonic-gate hindex[u] = wp; 1507c478bd9Sstevel@tonic-gate whuff(); 1517c478bd9Sstevel@tonic-gate (void) fwrite((char *)hindex, sizeof (*hindex), NI, stdout); 1527c478bd9Sstevel@tonic-gate (void) fwrite((char *)table, sizeof (*table), wp, stdout); 1537c478bd9Sstevel@tonic-gate (void) fprintf(stderr, 1547c478bd9Sstevel@tonic-gate gettext("%s: %ld items, %d ignored, %d extra, %u words occupied\n"), 1557c478bd9Sstevel@tonic-gate argv[0], count, ignore, extra, wp); 1567c478bd9Sstevel@tonic-gate count -= ignore; 1577c478bd9Sstevel@tonic-gate (void) fprintf(stderr, "%s: %f table bits/item, %f table+index bits\n", 1587c478bd9Sstevel@tonic-gate argv[0], (((float)BYTE * wp) * sizeof (*table) / count), 1597c478bd9Sstevel@tonic-gate (BYTE * ((float)wp * sizeof (*table) + sizeof (hindex)) / count)); 160*0d8b5334Sceastha return (0); 1617c478bd9Sstevel@tonic-gate } 162