1*4887Schin /*********************************************************************** 2*4887Schin * * 3*4887Schin * This software is part of the ast package * 4*4887Schin * Copyright (c) 1992-2007 AT&T Knowledge Ventures * 5*4887Schin * and is licensed under the * 6*4887Schin * Common Public License, Version 1.0 * 7*4887Schin * by AT&T Knowledge Ventures * 8*4887Schin * * 9*4887Schin * A copy of the License is available at * 10*4887Schin * http://www.opensource.org/licenses/cpl1.0.txt * 11*4887Schin * (with md5 checksum 059e8cd6165cb4c31e351f2b69388fd9) * 12*4887Schin * * 13*4887Schin * Information and Software Systems Research * 14*4887Schin * AT&T Research * 15*4887Schin * Florham Park NJ * 16*4887Schin * * 17*4887Schin * Glenn Fowler <gsf@research.att.com> * 18*4887Schin * David Korn <dgk@research.att.com> * 19*4887Schin * * 20*4887Schin ***********************************************************************/ 21*4887Schin #pragma prototyped 22*4887Schin /* 23*4887Schin * David Korn 24*4887Schin * AT&T Bell Laboratories 25*4887Schin * 26*4887Schin * comm 27*4887Schin */ 28*4887Schin 29*4887Schin static const char usage[] = 30*4887Schin "[-?\n@(#)$Id: comm (AT&T Research) 1999-04-28 $\n]" 31*4887Schin USAGE_LICENSE 32*4887Schin "[+NAME?comm - select or reject lines common to two files]" 33*4887Schin "[+DESCRIPTION?\bcomm\b reads two files \afile1\a and \afile2\a " 34*4887Schin "which should be ordered in the collating sequence of the " 35*4887Schin "current locale, and produces three text columns as output:]{" 36*4887Schin "[+1?Lines only in \afile1\a.]" 37*4887Schin "[+2?Lines only in \afile2\a.]" 38*4887Schin "[+3?Lines in both files.]" 39*4887Schin "}" 40*4887Schin "[+?If lines in either file are not ordered according to the collating " 41*4887Schin "sequence of the current locale, the results are not specified.]" 42*4887Schin "[+?If either \afile1\a or \afile2\a is \b-\b, \bcomm\b " 43*4887Schin "uses standard input starting at the current location.]" 44*4887Schin 45*4887Schin "[1?Suppress the output column of lines unique to \afile1\a.]" 46*4887Schin "[2?Suppress the output column of lines unique to \afile2\a.]" 47*4887Schin "[3?Suppress the output column of lines duplicate in \afile1\a and \afile2\a.]" 48*4887Schin "\n" 49*4887Schin "\nfile1 file2\n" 50*4887Schin "\n" 51*4887Schin "[+EXIT STATUS?]{" 52*4887Schin "[+0?Both files processed successfully.]" 53*4887Schin "[+>0?An error occurred.]" 54*4887Schin "}" 55*4887Schin "[+SEE ALSO?\bcmp\b(1), \bdiff\b(1)]" 56*4887Schin ; 57*4887Schin 58*4887Schin 59*4887Schin #include <cmd.h> 60*4887Schin 61*4887Schin #define C_FILE1 1 62*4887Schin #define C_FILE2 2 63*4887Schin #define C_COMMON 4 64*4887Schin #define C_ALL (C_FILE1|C_FILE2|C_COMMON) 65*4887Schin 66*4887Schin static int comm(Sfio_t *in1, Sfio_t *in2, register Sfio_t *out,register int mode) 67*4887Schin { 68*4887Schin register char *cp1, *cp2; 69*4887Schin register int n1, n2, n, comp; 70*4887Schin if(cp1 = sfgetr(in1,'\n',0)) 71*4887Schin n1 = sfvalue(in1); 72*4887Schin if(cp2 = sfgetr(in2,'\n',0)) 73*4887Schin n2 = sfvalue(in2); 74*4887Schin while(cp1 && cp2) 75*4887Schin { 76*4887Schin n=(n1<n2?n1:n2); 77*4887Schin if((comp=memcmp(cp1,cp2,n-1))==0 && (comp=n1-n2)==0) 78*4887Schin { 79*4887Schin if(mode&C_COMMON) 80*4887Schin { 81*4887Schin if(mode!=C_COMMON) 82*4887Schin { 83*4887Schin sfputc(out,'\t'); 84*4887Schin if(mode==C_ALL) 85*4887Schin sfputc(out,'\t'); 86*4887Schin } 87*4887Schin if(sfwrite(out,cp1,n) < 0) 88*4887Schin return(-1); 89*4887Schin } 90*4887Schin if(cp1 = sfgetr(in1,'\n',0)) 91*4887Schin n1 = sfvalue(in1); 92*4887Schin if(cp2 = sfgetr(in2,'\n',0)) 93*4887Schin n2 = sfvalue(in2); 94*4887Schin } 95*4887Schin else if(comp > 0) 96*4887Schin { 97*4887Schin if(mode&C_FILE2) 98*4887Schin { 99*4887Schin if(mode&C_FILE1) 100*4887Schin sfputc(out,'\t'); 101*4887Schin if(sfwrite(out,cp2,n2) < 0) 102*4887Schin return(-1); 103*4887Schin } 104*4887Schin if(cp2 = sfgetr(in2,'\n',0)) 105*4887Schin n2 = sfvalue(in2); 106*4887Schin } 107*4887Schin else 108*4887Schin { 109*4887Schin if((mode&C_FILE1) && sfwrite(out,cp1,n1) < 0) 110*4887Schin return(-1); 111*4887Schin if(cp1 = sfgetr(in1,'\n',0)) 112*4887Schin n1 = sfvalue(in1); 113*4887Schin } 114*4887Schin } 115*4887Schin n = 0; 116*4887Schin if(cp2) 117*4887Schin { 118*4887Schin cp1 = cp2; 119*4887Schin in1 = in2; 120*4887Schin n1 = n2; 121*4887Schin if(mode&C_FILE1) 122*4887Schin n = 1; 123*4887Schin mode &= C_FILE2; 124*4887Schin } 125*4887Schin else 126*4887Schin mode &= C_FILE1; 127*4887Schin if(!mode || !cp1) 128*4887Schin { 129*4887Schin if(cp1 && in1==sfstdin) 130*4887Schin sfseek(in1,(Sfoff_t)0,SEEK_END); 131*4887Schin return(0); 132*4887Schin } 133*4887Schin /* process the remaining stream */ 134*4887Schin while(1) 135*4887Schin { 136*4887Schin if(n) 137*4887Schin sfputc(out,'\t'); 138*4887Schin if(sfwrite(out,cp1,n1) < 0) 139*4887Schin return(-1); 140*4887Schin if(!(cp1 = sfgetr(in1,'\n',0))) 141*4887Schin return(0); 142*4887Schin n1 = sfvalue(in1); 143*4887Schin } 144*4887Schin /* NOT REACHED */ 145*4887Schin } 146*4887Schin 147*4887Schin int 148*4887Schin b_comm(int argc, char *argv[], void* context) 149*4887Schin { 150*4887Schin register int n; 151*4887Schin register int mode = C_FILE1|C_FILE2|C_COMMON; 152*4887Schin register char *cp; 153*4887Schin Sfio_t *f1, *f2; 154*4887Schin 155*4887Schin cmdinit(argc, argv, context, ERROR_CATALOG, 0); 156*4887Schin while (n = optget(argv, usage)) switch (n) 157*4887Schin { 158*4887Schin case '1': 159*4887Schin mode &= ~C_FILE1; 160*4887Schin break; 161*4887Schin case '2': 162*4887Schin mode &= ~C_FILE2; 163*4887Schin break; 164*4887Schin case '3': 165*4887Schin mode &= ~C_COMMON; 166*4887Schin break; 167*4887Schin case ':': 168*4887Schin error(2, "%s",opt_info.arg); 169*4887Schin break; 170*4887Schin case '?': 171*4887Schin error(ERROR_usage(2), "%s",opt_info.arg); 172*4887Schin break; 173*4887Schin } 174*4887Schin argv += opt_info.index; 175*4887Schin argc -= opt_info.index; 176*4887Schin if(error_info.errors || argc!=2) 177*4887Schin error(ERROR_usage(2),"%s",optusage(NiL)); 178*4887Schin cp = *argv++; 179*4887Schin if(streq(cp,"-")) 180*4887Schin f1 = sfstdin; 181*4887Schin else if(!(f1 = sfopen(NiL, cp,"r"))) 182*4887Schin error(ERROR_system(1),"%s: cannot open",cp); 183*4887Schin cp = *argv; 184*4887Schin if(streq(cp,"-")) 185*4887Schin f2 = sfstdin; 186*4887Schin else if(!(f2 = sfopen(NiL, cp,"r"))) 187*4887Schin error(ERROR_system(1),"%s: cannot open",cp); 188*4887Schin if(mode) 189*4887Schin { 190*4887Schin if(comm(f1,f2,sfstdout,mode) < 0) 191*4887Schin error(ERROR_system(1)," write error"); 192*4887Schin } 193*4887Schin else if(f1==sfstdin || f2==sfstdin) 194*4887Schin sfseek(sfstdin,(Sfoff_t)0,SEEK_END); 195*4887Schin if(f1!=sfstdin) 196*4887Schin sfclose(f1); 197*4887Schin if(f2!=sfstdin) 198*4887Schin sfclose(f2); 199*4887Schin return(error_info.errors); 200*4887Schin } 201*4887Schin 202