19b50d902SRodney W. Grimes /* 2139764e8SWolfram Schneider * Copyright (c) 1995 Wolfram Schneider <wosch@FreeBSD.org>. Berlin. 39b50d902SRodney W. Grimes * Copyright (c) 1989, 1993 49b50d902SRodney W. Grimes * The Regents of the University of California. All rights reserved. 59b50d902SRodney W. Grimes * 69b50d902SRodney W. Grimes * This code is derived from software contributed to Berkeley by 79b50d902SRodney W. Grimes * James A. Woods. 89b50d902SRodney W. Grimes * 99b50d902SRodney W. Grimes * Redistribution and use in source and binary forms, with or without 109b50d902SRodney W. Grimes * modification, are permitted provided that the following conditions 119b50d902SRodney W. Grimes * are met: 129b50d902SRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 139b50d902SRodney W. Grimes * notice, this list of conditions and the following disclaimer. 149b50d902SRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 159b50d902SRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 169b50d902SRodney W. Grimes * documentation and/or other materials provided with the distribution. 179b50d902SRodney W. Grimes * 3. All advertising materials mentioning features or use of this software 189b50d902SRodney W. Grimes * must display the following acknowledgement: 199b50d902SRodney W. Grimes * This product includes software developed by the University of 209b50d902SRodney W. Grimes * California, Berkeley and its contributors. 219b50d902SRodney W. Grimes * 4. Neither the name of the University nor the names of its contributors 229b50d902SRodney W. Grimes * may be used to endorse or promote products derived from this software 239b50d902SRodney W. Grimes * without specific prior written permission. 249b50d902SRodney W. Grimes * 259b50d902SRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 269b50d902SRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 279b50d902SRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 289b50d902SRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 299b50d902SRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 309b50d902SRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 319b50d902SRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 329b50d902SRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 339b50d902SRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 349b50d902SRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 359b50d902SRodney W. Grimes * SUCH DAMAGE. 367ec1929dSWolfram Schneider * 37c3aac50fSPeter Wemm * $FreeBSD$ 389b50d902SRodney W. Grimes */ 399b50d902SRodney W. Grimes 40*31fa4102SGavin Atkinson #if 0 419b50d902SRodney W. Grimes #ifndef lint 429b50d902SRodney W. Grimes static char copyright[] = 439b50d902SRodney W. Grimes "@(#) Copyright (c) 1989, 1993\n\ 449b50d902SRodney W. Grimes The Regents of the University of California. All rights reserved.\n"; 459b50d902SRodney W. Grimes #endif /* not lint */ 469b50d902SRodney W. Grimes 479b50d902SRodney W. Grimes #ifndef lint 489b50d902SRodney W. Grimes static char sccsid[] = "@(#)locate.bigram.c 8.1 (Berkeley) 6/6/93"; 499b50d902SRodney W. Grimes #endif /* not lint */ 50*31fa4102SGavin Atkinson #endif 519b50d902SRodney W. Grimes 529b50d902SRodney W. Grimes /* 537ec1929dSWolfram Schneider * bigram < sorted_file_names | sort -nr | 547ec1929dSWolfram Schneider * awk 'NR <= 128 { printf $2 }' > bigrams 559b50d902SRodney W. Grimes * 569b50d902SRodney W. Grimes * List bigrams for 'updatedb' script. 579b50d902SRodney W. Grimes * Use 'code' to encode a file using this output. 589b50d902SRodney W. Grimes */ 599b50d902SRodney W. Grimes 609b50d902SRodney W. Grimes #include <stdio.h> 61a3eb24c6SStefan Farfeleder #include <stdlib.h> 629b50d902SRodney W. Grimes #include <sys/param.h> /* for MAXPATHLEN */ 6337002181SWolfram Schneider #include "locate.h" 649b50d902SRodney W. Grimes 6537002181SWolfram Schneider u_char buf1[MAXPATHLEN] = " "; 6637002181SWolfram Schneider u_char buf2[MAXPATHLEN]; 67139764e8SWolfram Schneider u_int bigram[UCHAR_MAX + 1][UCHAR_MAX + 1]; 689b50d902SRodney W. Grimes 697ec1929dSWolfram Schneider int 707ec1929dSWolfram Schneider main(void) 719b50d902SRodney W. Grimes { 72*31fa4102SGavin Atkinson u_char *cp; 73*31fa4102SGavin Atkinson u_char *oldpath = buf1, *path = buf2; 74*31fa4102SGavin Atkinson u_int i, j; 759b50d902SRodney W. Grimes 769b50d902SRodney W. Grimes while (fgets(path, sizeof(buf2), stdin) != NULL) { 779b50d902SRodney W. Grimes 78df62e52bSWolfram Schneider /* 79df62e52bSWolfram Schneider * We don't need remove newline character '\n'. 80df62e52bSWolfram Schneider * '\n' is less than ASCII_MIN and will be later 81df62e52bSWolfram Schneider * ignored at output. 82df62e52bSWolfram Schneider */ 8337002181SWolfram Schneider 8437002181SWolfram Schneider 859b50d902SRodney W. Grimes /* skip longest common prefix */ 86df62e52bSWolfram Schneider for (cp = path; *cp == *oldpath; cp++, oldpath++) 87df62e52bSWolfram Schneider if (*cp == '\0') 88df62e52bSWolfram Schneider break; 8937002181SWolfram Schneider 901a1ee31fSWolfram Schneider while (*cp != '\0' && *(cp + 1) != '\0') { 91139764e8SWolfram Schneider bigram[(u_char)*cp][(u_char)*(cp + 1)]++; 9237002181SWolfram Schneider cp += 2; 939b50d902SRodney W. Grimes } 9437002181SWolfram Schneider 957ec1929dSWolfram Schneider /* swap pointers */ 967ec1929dSWolfram Schneider if (path == buf1) { 977ec1929dSWolfram Schneider path = buf2; 987ec1929dSWolfram Schneider oldpath = buf1; 997ec1929dSWolfram Schneider } else { 1007ec1929dSWolfram Schneider path = buf1; 1017ec1929dSWolfram Schneider oldpath = buf2; 1027ec1929dSWolfram Schneider } 1039b50d902SRodney W. Grimes } 10437002181SWolfram Schneider 105df62e52bSWolfram Schneider /* output, boundary check */ 10637002181SWolfram Schneider for (i = ASCII_MIN; i <= ASCII_MAX; i++) 10737002181SWolfram Schneider for (j = ASCII_MIN; j <= ASCII_MAX; j++) 10837002181SWolfram Schneider if (bigram[i][j] != 0) 109df62e52bSWolfram Schneider (void)printf("%4u %c%c\n", bigram[i][j], i, j); 1107ec1929dSWolfram Schneider 1117ec1929dSWolfram Schneider exit(0); 1129b50d902SRodney W. Grimes } 113