xref: /onnv-gate/usr/src/lib/libcmd/common/comm.c (revision 4887)
1*4887Schin /***********************************************************************
2*4887Schin *                                                                      *
3*4887Schin *               This software is part of the ast package               *
4*4887Schin *           Copyright (c) 1992-2007 AT&T Knowledge Ventures            *
5*4887Schin *                      and is licensed under the                       *
6*4887Schin *                  Common Public License, Version 1.0                  *
7*4887Schin *                      by AT&T Knowledge Ventures                      *
8*4887Schin *                                                                      *
9*4887Schin *                A copy of the License is available at                 *
10*4887Schin *            http://www.opensource.org/licenses/cpl1.0.txt             *
11*4887Schin *         (with md5 checksum 059e8cd6165cb4c31e351f2b69388fd9)         *
12*4887Schin *                                                                      *
13*4887Schin *              Information and Software Systems Research               *
14*4887Schin *                            AT&T Research                             *
15*4887Schin *                           Florham Park NJ                            *
16*4887Schin *                                                                      *
17*4887Schin *                 Glenn Fowler <gsf@research.att.com>                  *
18*4887Schin *                  David Korn <dgk@research.att.com>                   *
19*4887Schin *                                                                      *
20*4887Schin ***********************************************************************/
21*4887Schin #pragma prototyped
22*4887Schin /*
23*4887Schin  * David Korn
24*4887Schin  * AT&T Bell Laboratories
25*4887Schin  *
26*4887Schin  * comm
27*4887Schin  */
28*4887Schin 
29*4887Schin static const char usage[] =
30*4887Schin "[-?\n@(#)$Id: comm (AT&T Research) 1999-04-28 $\n]"
31*4887Schin USAGE_LICENSE
32*4887Schin "[+NAME?comm - select or reject lines common to two files]"
33*4887Schin "[+DESCRIPTION?\bcomm\b reads two files \afile1\a and \afile2\a "
34*4887Schin 	"which should be ordered in the collating sequence of the "
35*4887Schin 	"current locale, and produces three text columns as output:]{"
36*4887Schin 	"[+1?Lines only in \afile1\a.]"
37*4887Schin 	"[+2?Lines only in \afile2\a.]"
38*4887Schin 	"[+3?Lines in both files.]"
39*4887Schin 	"}"
40*4887Schin "[+?If lines in either file are not ordered according to the collating "
41*4887Schin 	"sequence of the current locale, the results are not specified.]"
42*4887Schin "[+?If either \afile1\a or \afile2\a is \b-\b, \bcomm\b "
43*4887Schin         "uses standard input starting at the current location.]"
44*4887Schin 
45*4887Schin "[1?Suppress the output column of lines unique to \afile1\a.]"
46*4887Schin "[2?Suppress the output column of lines unique to \afile2\a.]"
47*4887Schin "[3?Suppress the output column of lines duplicate in \afile1\a and \afile2\a.]"
48*4887Schin "\n"
49*4887Schin "\nfile1 file2\n"
50*4887Schin "\n"
51*4887Schin "[+EXIT STATUS?]{"
52*4887Schin 	"[+0?Both files processed successfully.]"
53*4887Schin 	"[+>0?An error occurred.]"
54*4887Schin "}"
55*4887Schin "[+SEE ALSO?\bcmp\b(1), \bdiff\b(1)]"
56*4887Schin ;
57*4887Schin 
58*4887Schin 
59*4887Schin #include <cmd.h>
60*4887Schin 
61*4887Schin #define C_FILE1		1
62*4887Schin #define C_FILE2		2
63*4887Schin #define C_COMMON	4
64*4887Schin #define C_ALL		(C_FILE1|C_FILE2|C_COMMON)
65*4887Schin 
66*4887Schin static int comm(Sfio_t *in1, Sfio_t *in2, register Sfio_t *out,register int mode)
67*4887Schin {
68*4887Schin 	register char *cp1, *cp2;
69*4887Schin 	register int n1, n2, n, comp;
70*4887Schin 	if(cp1 = sfgetr(in1,'\n',0))
71*4887Schin 		n1 = sfvalue(in1);
72*4887Schin 	if(cp2 = sfgetr(in2,'\n',0))
73*4887Schin 		n2 = sfvalue(in2);
74*4887Schin 	while(cp1 && cp2)
75*4887Schin 	{
76*4887Schin 		n=(n1<n2?n1:n2);
77*4887Schin 		if((comp=memcmp(cp1,cp2,n-1))==0 && (comp=n1-n2)==0)
78*4887Schin 		{
79*4887Schin 			if(mode&C_COMMON)
80*4887Schin 			{
81*4887Schin 				if(mode!=C_COMMON)
82*4887Schin 				{
83*4887Schin 					sfputc(out,'\t');
84*4887Schin 					if(mode==C_ALL)
85*4887Schin 						sfputc(out,'\t');
86*4887Schin 				}
87*4887Schin 				if(sfwrite(out,cp1,n) < 0)
88*4887Schin 					return(-1);
89*4887Schin 			}
90*4887Schin 			if(cp1 = sfgetr(in1,'\n',0))
91*4887Schin 				n1 = sfvalue(in1);
92*4887Schin 			if(cp2 = sfgetr(in2,'\n',0))
93*4887Schin 				n2 = sfvalue(in2);
94*4887Schin 		}
95*4887Schin 		else if(comp > 0)
96*4887Schin 		{
97*4887Schin 			if(mode&C_FILE2)
98*4887Schin 			{
99*4887Schin 				if(mode&C_FILE1)
100*4887Schin 					sfputc(out,'\t');
101*4887Schin 				if(sfwrite(out,cp2,n2) < 0)
102*4887Schin 					return(-1);
103*4887Schin 			}
104*4887Schin 			if(cp2 = sfgetr(in2,'\n',0))
105*4887Schin 				n2 = sfvalue(in2);
106*4887Schin 		}
107*4887Schin 		else
108*4887Schin 		{
109*4887Schin 			if((mode&C_FILE1) && sfwrite(out,cp1,n1) < 0)
110*4887Schin 				return(-1);
111*4887Schin 			if(cp1 = sfgetr(in1,'\n',0))
112*4887Schin 				n1 = sfvalue(in1);
113*4887Schin 		}
114*4887Schin 	}
115*4887Schin 	n = 0;
116*4887Schin 	if(cp2)
117*4887Schin 	{
118*4887Schin 		cp1 = cp2;
119*4887Schin 		in1 = in2;
120*4887Schin 		n1 = n2;
121*4887Schin 		if(mode&C_FILE1)
122*4887Schin 			n = 1;
123*4887Schin 		mode &= C_FILE2;
124*4887Schin 	}
125*4887Schin 	else
126*4887Schin 		mode &= C_FILE1;
127*4887Schin 	if(!mode || !cp1)
128*4887Schin 	{
129*4887Schin 		if(cp1 && in1==sfstdin)
130*4887Schin 			sfseek(in1,(Sfoff_t)0,SEEK_END);
131*4887Schin 		return(0);
132*4887Schin 	}
133*4887Schin 	/* process the remaining stream */
134*4887Schin 	while(1)
135*4887Schin 	{
136*4887Schin 		if(n)
137*4887Schin 			sfputc(out,'\t');
138*4887Schin 		if(sfwrite(out,cp1,n1) < 0)
139*4887Schin 			return(-1);
140*4887Schin 		if(!(cp1 = sfgetr(in1,'\n',0)))
141*4887Schin 			return(0);
142*4887Schin 		n1 = sfvalue(in1);
143*4887Schin 	}
144*4887Schin 	/* NOT REACHED */
145*4887Schin }
146*4887Schin 
147*4887Schin int
148*4887Schin b_comm(int argc, char *argv[], void* context)
149*4887Schin {
150*4887Schin 	register int n;
151*4887Schin 	register int mode = C_FILE1|C_FILE2|C_COMMON;
152*4887Schin 	register char *cp;
153*4887Schin 	Sfio_t *f1, *f2;
154*4887Schin 
155*4887Schin 	cmdinit(argc, argv, context, ERROR_CATALOG, 0);
156*4887Schin 	while (n = optget(argv, usage)) switch (n)
157*4887Schin 	{
158*4887Schin  	    case '1':
159*4887Schin 		mode &= ~C_FILE1;
160*4887Schin 		break;
161*4887Schin 	    case '2':
162*4887Schin 		mode &= ~C_FILE2;
163*4887Schin 		break;
164*4887Schin 	    case '3':
165*4887Schin 		mode &= ~C_COMMON;
166*4887Schin 		break;
167*4887Schin 	    case ':':
168*4887Schin 		error(2, "%s",opt_info.arg);
169*4887Schin 		break;
170*4887Schin 	    case '?':
171*4887Schin 		error(ERROR_usage(2), "%s",opt_info.arg);
172*4887Schin 		break;
173*4887Schin 	}
174*4887Schin 	argv += opt_info.index;
175*4887Schin 	argc -= opt_info.index;
176*4887Schin 	if(error_info.errors || argc!=2)
177*4887Schin 		error(ERROR_usage(2),"%s",optusage(NiL));
178*4887Schin 	cp = *argv++;
179*4887Schin 	if(streq(cp,"-"))
180*4887Schin 		f1 = sfstdin;
181*4887Schin 	else if(!(f1 = sfopen(NiL, cp,"r")))
182*4887Schin 		error(ERROR_system(1),"%s: cannot open",cp);
183*4887Schin 	cp = *argv;
184*4887Schin 	if(streq(cp,"-"))
185*4887Schin 		f2 = sfstdin;
186*4887Schin 	else if(!(f2 = sfopen(NiL, cp,"r")))
187*4887Schin 		error(ERROR_system(1),"%s: cannot open",cp);
188*4887Schin 	if(mode)
189*4887Schin 	{
190*4887Schin 		if(comm(f1,f2,sfstdout,mode) < 0)
191*4887Schin 			error(ERROR_system(1)," write error");
192*4887Schin 	}
193*4887Schin 	else if(f1==sfstdin || f2==sfstdin)
194*4887Schin 		sfseek(sfstdin,(Sfoff_t)0,SEEK_END);
195*4887Schin 	if(f1!=sfstdin)
196*4887Schin 		sfclose(f1);
197*4887Schin 	if(f2!=sfstdin)
198*4887Schin 		sfclose(f2);
199*4887Schin 	return(error_info.errors);
200*4887Schin }
201*4887Schin 
202