/*
 * Copyright (c) 1989, 1993
 *	The Regents of the University of California.  All rights reserved.
 *
 * This code is derived from software contributed to Berkeley by
 * James A. Woods.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. All advertising materials mentioning features or use of this software
 *    must display the following acknowledgement:
 *	This product includes software developed by the University of
 *	California, Berkeley and its contributors.
 * 4. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 * $Id: locate.bigram.c,v 1.1 1996/09/13 13:23:48 wosch Exp wosch $
 */

/*
 * Identification strings embedded in the object file.  They are read-only
 * data, hence const.  Both are compiled out when `lint' is defined.
 */
#ifndef lint
static const char copyright[] =
"@(#) Copyright (c) 1989, 1993\n\
	The Regents of the University of California. All rights reserved.\n";
#endif /* not lint */

#ifndef lint
static const char sccsid[] = "@(#)locate.bigram.c 8.1 (Berkeley) 6/6/93";
#endif /* not lint */

/*
 * Usage:
 *
 *	bigram < sorted_file_names | sort -nr |
 *		awk 'NR <= 128 { printf $2 }' > bigrams
 *
 * List bigrams for 'updatedb' script.
 * Use 'code' to encode a file using this output.
 */
Grimes 579b50d902SRodney W. Grimes #include <stdio.h> 589b50d902SRodney W. Grimes #include <sys/param.h> /* for MAXPATHLEN */ 5937002181SWolfram Schneider #include "locate.h" 609b50d902SRodney W. Grimes 6137002181SWolfram Schneider u_char buf1[MAXPATHLEN] = " "; 6237002181SWolfram Schneider u_char buf2[MAXPATHLEN]; 637ec1929dSWolfram Schneider u_int bigram[UCHAR_MAX][UCHAR_MAX]; 649b50d902SRodney W. Grimes 657ec1929dSWolfram Schneider int 667ec1929dSWolfram Schneider main(void) 679b50d902SRodney W. Grimes { 6837002181SWolfram Schneider register u_char *cp; 6937002181SWolfram Schneider register u_char *oldpath = buf1, *path = buf2; 707ec1929dSWolfram Schneider register u_int i, j; 719b50d902SRodney W. Grimes 729b50d902SRodney W. Grimes while (fgets(path, sizeof(buf2), stdin) != NULL) { 739b50d902SRodney W. Grimes 74df62e52bSWolfram Schneider /* 75df62e52bSWolfram Schneider * We don't need remove newline character '\n'. 76df62e52bSWolfram Schneider * '\n' is less than ASCII_MIN and will be later 77df62e52bSWolfram Schneider * ignored at output. 78df62e52bSWolfram Schneider */ 7937002181SWolfram Schneider 8037002181SWolfram Schneider 819b50d902SRodney W. Grimes /* skip longest common prefix */ 82df62e52bSWolfram Schneider for (cp = path; *cp == *oldpath; cp++, oldpath++) 83df62e52bSWolfram Schneider if (*cp == '\0') 84df62e52bSWolfram Schneider break; 8537002181SWolfram Schneider 861a1ee31fSWolfram Schneider while (*cp != '\0' && *(cp + 1) != '\0') { 87df62e52bSWolfram Schneider bigram[(u_int)*cp][(u_int)*(cp + 1)]++; 8837002181SWolfram Schneider cp += 2; 899b50d902SRodney W. Grimes } 9037002181SWolfram Schneider 917ec1929dSWolfram Schneider /* swap pointers */ 927ec1929dSWolfram Schneider if (path == buf1) { 937ec1929dSWolfram Schneider path = buf2; 947ec1929dSWolfram Schneider oldpath = buf1; 957ec1929dSWolfram Schneider } else { 967ec1929dSWolfram Schneider path = buf1; 977ec1929dSWolfram Schneider oldpath = buf2; 987ec1929dSWolfram Schneider } 999b50d902SRodney W. 
Grimes } 10037002181SWolfram Schneider 101df62e52bSWolfram Schneider /* output, boundary check */ 10237002181SWolfram Schneider for (i = ASCII_MIN; i <= ASCII_MAX; i++) 10337002181SWolfram Schneider for (j = ASCII_MIN; j <= ASCII_MAX; j++) 10437002181SWolfram Schneider if (bigram[i][j] != 0) 105df62e52bSWolfram Schneider (void)printf("%4u %c%c\n", bigram[i][j], i, j); 1067ec1929dSWolfram Schneider 1077ec1929dSWolfram Schneider exit(0); 1089b50d902SRodney W. Grimes } 109