19b50d902SRodney W. Grimes /* 29b50d902SRodney W. Grimes * Copyright (c) 1989, 1993 39b50d902SRodney W. Grimes * The Regents of the University of California. All rights reserved. 49b50d902SRodney W. Grimes * 59b50d902SRodney W. Grimes * This code is derived from software contributed to Berkeley by 69b50d902SRodney W. Grimes * James A. Woods. 79b50d902SRodney W. Grimes * 89b50d902SRodney W. Grimes * Redistribution and use in source and binary forms, with or without 99b50d902SRodney W. Grimes * modification, are permitted provided that the following conditions 109b50d902SRodney W. Grimes * are met: 119b50d902SRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 129b50d902SRodney W. Grimes * notice, this list of conditions and the following disclaimer. 139b50d902SRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 149b50d902SRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 159b50d902SRodney W. Grimes * documentation and/or other materials provided with the distribution. 169b50d902SRodney W. Grimes * 3. All advertising materials mentioning features or use of this software 179b50d902SRodney W. Grimes * must display the following acknowledgement: 189b50d902SRodney W. Grimes * This product includes software developed by the University of 199b50d902SRodney W. Grimes * California, Berkeley and its contributors. 209b50d902SRodney W. Grimes * 4. Neither the name of the University nor the names of its contributors 219b50d902SRodney W. Grimes * may be used to endorse or promote products derived from this software 229b50d902SRodney W. Grimes * without specific prior written permission. 239b50d902SRodney W. Grimes * 249b50d902SRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 259b50d902SRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 269b50d902SRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 279b50d902SRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 289b50d902SRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 299b50d902SRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 309b50d902SRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 319b50d902SRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 329b50d902SRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 339b50d902SRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 349b50d902SRodney W. Grimes * SUCH DAMAGE. 357ec1929dSWolfram Schneider * 367ec1929dSWolfram Schneider * $Id$ 379b50d902SRodney W. Grimes */ 389b50d902SRodney W. Grimes 399b50d902SRodney W. Grimes #ifndef lint 409b50d902SRodney W. Grimes static char copyright[] = 419b50d902SRodney W. Grimes "@(#) Copyright (c) 1989, 1993\n\ 429b50d902SRodney W. Grimes The Regents of the University of California. All rights reserved.\n"; 439b50d902SRodney W. Grimes #endif /* not lint */ 449b50d902SRodney W. Grimes 459b50d902SRodney W. Grimes #ifndef lint 469b50d902SRodney W. Grimes static char sccsid[] = "@(#)locate.bigram.c 8.1 (Berkeley) 6/6/93"; 479b50d902SRodney W. Grimes #endif /* not lint */ 489b50d902SRodney W. Grimes 499b50d902SRodney W. Grimes /* 507ec1929dSWolfram Schneider * bigram < sorted_file_names | sort -nr | 517ec1929dSWolfram Schneider * awk 'NR <= 128 { printf $2 }' > bigrams 529b50d902SRodney W. Grimes * 539b50d902SRodney W. Grimes * List bigrams for 'updatedb' script. 549b50d902SRodney W. Grimes * Use 'code' to encode a file using this output. 559b50d902SRodney W. Grimes */ 569b50d902SRodney W. Grimes 579b50d902SRodney W. Grimes #include <stdio.h> 589b50d902SRodney W. Grimes #include <sys/param.h> /* for MAXPATHLEN */ 5937002181SWolfram Schneider #include <string.h> /* memchr */ 6037002181SWolfram Schneider #include "locate.h" 619b50d902SRodney W. Grimes 6237002181SWolfram Schneider u_char buf1[MAXPATHLEN] = " "; 6337002181SWolfram Schneider u_char buf2[MAXPATHLEN]; 647ec1929dSWolfram Schneider u_int bigram[UCHAR_MAX][UCHAR_MAX]; 659b50d902SRodney W. Grimes 667ec1929dSWolfram Schneider int 677ec1929dSWolfram Schneider main(void) 689b50d902SRodney W. Grimes { 6937002181SWolfram Schneider register u_char *cp; 7037002181SWolfram Schneider register u_char *oldpath = buf1, *path = buf2; 717ec1929dSWolfram Schneider register u_int i, j; 729b50d902SRodney W. Grimes 739b50d902SRodney W. Grimes while (fgets(path, sizeof(buf2), stdin) != NULL) { 749b50d902SRodney W. Grimes 7537002181SWolfram Schneider /* skip empty lines */ 7637002181SWolfram Schneider if (*path == '\n') 7737002181SWolfram Schneider continue; 7837002181SWolfram Schneider 7937002181SWolfram Schneider /* Squelch characters that would botch the decoding. */ 8037002181SWolfram Schneider for (cp = path; *cp != NULL; cp++) { 8137002181SWolfram Schneider /* chop newline */ 8237002181SWolfram Schneider if (*cp == '\n') 8337002181SWolfram Schneider *cp = NULL; 8437002181SWolfram Schneider /* range */ 8537002181SWolfram Schneider else if (*cp < ASCII_MIN || *cp > ASCII_MAX) 8637002181SWolfram Schneider *cp = '?'; 8737002181SWolfram Schneider } 8837002181SWolfram Schneider 899b50d902SRodney W. Grimes /* skip longest common prefix */ 907ec1929dSWolfram Schneider for (cp = path; *cp == *oldpath && *cp != NULL; cp++, oldpath++); 9137002181SWolfram Schneider 929b50d902SRodney W. Grimes while (*cp != NULL && *(cp+1) != NULL) { 9337002181SWolfram Schneider bigram[*cp][*(cp+1)]++; 9437002181SWolfram Schneider cp += 2; 959b50d902SRodney W. Grimes } 9637002181SWolfram Schneider 977ec1929dSWolfram Schneider /* swap pointers */ 987ec1929dSWolfram Schneider if (path == buf1) { 997ec1929dSWolfram Schneider path = buf2; 1007ec1929dSWolfram Schneider oldpath = buf1; 1017ec1929dSWolfram Schneider } else { 1027ec1929dSWolfram Schneider path = buf1; 1037ec1929dSWolfram Schneider oldpath = buf2; 1047ec1929dSWolfram Schneider } 1059b50d902SRodney W. Grimes } 10637002181SWolfram Schneider 1077ec1929dSWolfram Schneider /* output, (paranoid) boundary check */ 10837002181SWolfram Schneider for (i = ASCII_MIN; i <= ASCII_MAX; i++) 10937002181SWolfram Schneider for (j = ASCII_MIN; j <= ASCII_MAX; j++) 11037002181SWolfram Schneider if (bigram[i][j] != 0) 1117ec1929dSWolfram Schneider printf("%4u %c%c\n", bigram[i][j], i, j); 1127ec1929dSWolfram Schneider 1137ec1929dSWolfram Schneider exit(0); 1149b50d902SRodney W. Grimes } 115