xref: /titanic_44/usr/src/lib/libcmd/common/comm.c (revision fcf3ce441efd61da9bb2884968af01cb7c1452cc)
1 /***********************************************************************
2 *                                                                      *
3 *               This software is part of the ast package               *
4 *           Copyright (c) 1992-2007 AT&T Knowledge Ventures            *
5 *                      and is licensed under the                       *
6 *                  Common Public License, Version 1.0                  *
7 *                      by AT&T Knowledge Ventures                      *
8 *                                                                      *
9 *                A copy of the License is available at                 *
10 *            http://www.opensource.org/licenses/cpl1.0.txt             *
11 *         (with md5 checksum 059e8cd6165cb4c31e351f2b69388fd9)         *
12 *                                                                      *
13 *              Information and Software Systems Research               *
14 *                            AT&T Research                             *
15 *                           Florham Park NJ                            *
16 *                                                                      *
17 *                 Glenn Fowler <gsf@research.att.com>                  *
18 *                  David Korn <dgk@research.att.com>                   *
19 *                                                                      *
20 ***********************************************************************/
21 #pragma prototyped
22 /*
23  * David Korn
24  * AT&T Bell Laboratories
25  *
26  * comm
27  */
28 
29 static const char usage[] =
30 "[-?\n@(#)$Id: comm (AT&T Research) 1999-04-28 $\n]"
31 USAGE_LICENSE
32 "[+NAME?comm - select or reject lines common to two files]"
33 "[+DESCRIPTION?\bcomm\b reads two files \afile1\a and \afile2\a "
34 	"which should be ordered in the collating sequence of the "
35 	"current locale, and produces three text columns as output:]{"
36 	"[+1?Lines only in \afile1\a.]"
37 	"[+2?Lines only in \afile2\a.]"
38 	"[+3?Lines in both files.]"
39 	"}"
40 "[+?If lines in either file are not ordered according to the collating "
41 	"sequence of the current locale, the results are not specified.]"
42 "[+?If either \afile1\a or \afile2\a is \b-\b, \bcomm\b "
43         "uses standard input starting at the current location.]"
44 
45 "[1?Suppress the output column of lines unique to \afile1\a.]"
46 "[2?Suppress the output column of lines unique to \afile2\a.]"
47 "[3?Suppress the output column of lines duplicate in \afile1\a and \afile2\a.]"
48 "\n"
49 "\nfile1 file2\n"
50 "\n"
51 "[+EXIT STATUS?]{"
52 	"[+0?Both files processed successfully.]"
53 	"[+>0?An error occurred.]"
54 "}"
55 "[+SEE ALSO?\bcmp\b(1), \bdiff\b(1)]"
56 ;
57 
58 
59 #include <cmd.h>
60 
61 #define C_FILE1		1
62 #define C_FILE2		2
63 #define C_COMMON	4
64 #define C_ALL		(C_FILE1|C_FILE2|C_COMMON)
65 
66 static int comm(Sfio_t *in1, Sfio_t *in2, register Sfio_t *out,register int mode)
67 {
68 	register char *cp1, *cp2;
69 	register int n1, n2, n, comp;
70 	if(cp1 = sfgetr(in1,'\n',0))
71 		n1 = sfvalue(in1);
72 	if(cp2 = sfgetr(in2,'\n',0))
73 		n2 = sfvalue(in2);
74 	while(cp1 && cp2)
75 	{
76 		n=(n1<n2?n1:n2);
77 		if((comp=memcmp(cp1,cp2,n-1))==0 && (comp=n1-n2)==0)
78 		{
79 			if(mode&C_COMMON)
80 			{
81 				if(mode!=C_COMMON)
82 				{
83 					sfputc(out,'\t');
84 					if(mode==C_ALL)
85 						sfputc(out,'\t');
86 				}
87 				if(sfwrite(out,cp1,n) < 0)
88 					return(-1);
89 			}
90 			if(cp1 = sfgetr(in1,'\n',0))
91 				n1 = sfvalue(in1);
92 			if(cp2 = sfgetr(in2,'\n',0))
93 				n2 = sfvalue(in2);
94 		}
95 		else if(comp > 0)
96 		{
97 			if(mode&C_FILE2)
98 			{
99 				if(mode&C_FILE1)
100 					sfputc(out,'\t');
101 				if(sfwrite(out,cp2,n2) < 0)
102 					return(-1);
103 			}
104 			if(cp2 = sfgetr(in2,'\n',0))
105 				n2 = sfvalue(in2);
106 		}
107 		else
108 		{
109 			if((mode&C_FILE1) && sfwrite(out,cp1,n1) < 0)
110 				return(-1);
111 			if(cp1 = sfgetr(in1,'\n',0))
112 				n1 = sfvalue(in1);
113 		}
114 	}
115 	n = 0;
116 	if(cp2)
117 	{
118 		cp1 = cp2;
119 		in1 = in2;
120 		n1 = n2;
121 		if(mode&C_FILE1)
122 			n = 1;
123 		mode &= C_FILE2;
124 	}
125 	else
126 		mode &= C_FILE1;
127 	if(!mode || !cp1)
128 	{
129 		if(cp1 && in1==sfstdin)
130 			sfseek(in1,(Sfoff_t)0,SEEK_END);
131 		return(0);
132 	}
133 	/* process the remaining stream */
134 	while(1)
135 	{
136 		if(n)
137 			sfputc(out,'\t');
138 		if(sfwrite(out,cp1,n1) < 0)
139 			return(-1);
140 		if(!(cp1 = sfgetr(in1,'\n',0)))
141 			return(0);
142 		n1 = sfvalue(in1);
143 	}
144 	/* NOT REACHED */
145 }
146 
147 int
148 b_comm(int argc, char *argv[], void* context)
149 {
150 	register int n;
151 	register int mode = C_FILE1|C_FILE2|C_COMMON;
152 	register char *cp;
153 	Sfio_t *f1, *f2;
154 
155 	cmdinit(argc, argv, context, ERROR_CATALOG, 0);
156 	while (n = optget(argv, usage)) switch (n)
157 	{
158  	    case '1':
159 		mode &= ~C_FILE1;
160 		break;
161 	    case '2':
162 		mode &= ~C_FILE2;
163 		break;
164 	    case '3':
165 		mode &= ~C_COMMON;
166 		break;
167 	    case ':':
168 		error(2, "%s",opt_info.arg);
169 		break;
170 	    case '?':
171 		error(ERROR_usage(2), "%s",opt_info.arg);
172 		break;
173 	}
174 	argv += opt_info.index;
175 	argc -= opt_info.index;
176 	if(error_info.errors || argc!=2)
177 		error(ERROR_usage(2),"%s",optusage(NiL));
178 	cp = *argv++;
179 	if(streq(cp,"-"))
180 		f1 = sfstdin;
181 	else if(!(f1 = sfopen(NiL, cp,"r")))
182 		error(ERROR_system(1),"%s: cannot open",cp);
183 	cp = *argv;
184 	if(streq(cp,"-"))
185 		f2 = sfstdin;
186 	else if(!(f2 = sfopen(NiL, cp,"r")))
187 		error(ERROR_system(1),"%s: cannot open",cp);
188 	if(mode)
189 	{
190 		if(comm(f1,f2,sfstdout,mode) < 0)
191 			error(ERROR_system(1)," write error");
192 	}
193 	else if(f1==sfstdin || f2==sfstdin)
194 		sfseek(sfstdin,(Sfoff_t)0,SEEK_END);
195 	if(f1!=sfstdin)
196 		sfclose(f1);
197 	if(f2!=sfstdin)
198 		sfclose(f2);
199 	return(error_info.errors);
200 }
201 
202