1da2e3ebdSchin /***********************************************************************
2da2e3ebdSchin *                                                                      *
3da2e3ebdSchin *               This software is part of the ast package               *
4*b30d1939SAndy Fiddaman *          Copyright (c) 1992-2012 AT&T Intellectual Property          *
5da2e3ebdSchin *                      and is licensed under the                       *
6*b30d1939SAndy Fiddaman *                 Eclipse Public License, Version 1.0                  *
77c2fbfb3SApril Chin *                    by AT&T Intellectual Property                     *
8da2e3ebdSchin *                                                                      *
9da2e3ebdSchin *                A copy of the License is available at                 *
10*b30d1939SAndy Fiddaman *          http://www.eclipse.org/org/documents/epl-v10.html           *
11*b30d1939SAndy Fiddaman *         (with md5 checksum b35adb5213ca9657e911e9befb180842)         *
12da2e3ebdSchin *                                                                      *
13da2e3ebdSchin *              Information and Software Systems Research               *
14da2e3ebdSchin *                            AT&T Research                             *
15da2e3ebdSchin *                           Florham Park NJ                            *
16da2e3ebdSchin *                                                                      *
17da2e3ebdSchin *                 Glenn Fowler <gsf@research.att.com>                  *
18da2e3ebdSchin *                  David Korn <dgk@research.att.com>                   *
19da2e3ebdSchin *                                                                      *
20da2e3ebdSchin ***********************************************************************/
21da2e3ebdSchin #pragma prototyped
22da2e3ebdSchin /*
23da2e3ebdSchin  * David Korn
24da2e3ebdSchin  * AT&T Bell Laboratories
25da2e3ebdSchin  *
26da2e3ebdSchin  * comm
27da2e3ebdSchin  */
28da2e3ebdSchin 
29da2e3ebdSchin static const char usage[] =
30da2e3ebdSchin "[-?\n@(#)$Id: comm (AT&T Research) 1999-04-28 $\n]"
31da2e3ebdSchin USAGE_LICENSE
32da2e3ebdSchin "[+NAME?comm - select or reject lines common to two files]"
33da2e3ebdSchin "[+DESCRIPTION?\bcomm\b reads two files \afile1\a and \afile2\a "
34da2e3ebdSchin 	"which should be ordered in the collating sequence of the "
35da2e3ebdSchin 	"current locale, and produces three text columns as output:]{"
36da2e3ebdSchin 	"[+1?Lines only in \afile1\a.]"
37da2e3ebdSchin 	"[+2?Lines only in \afile2\a.]"
38da2e3ebdSchin 	"[+3?Lines in both files.]"
39da2e3ebdSchin 	"}"
40da2e3ebdSchin "[+?If lines in either file are not ordered according to the collating "
41da2e3ebdSchin 	"sequence of the current locale, the results are not specified.]"
42da2e3ebdSchin "[+?If either \afile1\a or \afile2\a is \b-\b, \bcomm\b "
43da2e3ebdSchin         "uses standard input starting at the current location.]"
44da2e3ebdSchin 
45da2e3ebdSchin "[1?Suppress the output column of lines unique to \afile1\a.]"
46da2e3ebdSchin "[2?Suppress the output column of lines unique to \afile2\a.]"
47da2e3ebdSchin "[3?Suppress the output column of lines duplicate in \afile1\a and \afile2\a.]"
48da2e3ebdSchin "\n"
49da2e3ebdSchin "\nfile1 file2\n"
50da2e3ebdSchin "\n"
51da2e3ebdSchin "[+EXIT STATUS?]{"
52da2e3ebdSchin 	"[+0?Both files processed successfully.]"
53da2e3ebdSchin 	"[+>0?An error occurred.]"
54da2e3ebdSchin "}"
55da2e3ebdSchin "[+SEE ALSO?\bcmp\b(1), \bdiff\b(1)]"
56da2e3ebdSchin ;
57da2e3ebdSchin 
58da2e3ebdSchin 
59da2e3ebdSchin #include <cmd.h>
60da2e3ebdSchin 
61da2e3ebdSchin #define C_FILE1		1
62da2e3ebdSchin #define C_FILE2		2
63da2e3ebdSchin #define C_COMMON	4
64da2e3ebdSchin #define C_ALL		(C_FILE1|C_FILE2|C_COMMON)
65da2e3ebdSchin 
comm(Sfio_t * in1,Sfio_t * in2,register Sfio_t * out,register int mode)66da2e3ebdSchin static int comm(Sfio_t *in1, Sfio_t *in2, register Sfio_t *out,register int mode)
67da2e3ebdSchin {
68da2e3ebdSchin 	register char *cp1, *cp2;
69da2e3ebdSchin 	register int n1, n2, n, comp;
70da2e3ebdSchin 	if(cp1 = sfgetr(in1,'\n',0))
71da2e3ebdSchin 		n1 = sfvalue(in1);
72da2e3ebdSchin 	if(cp2 = sfgetr(in2,'\n',0))
73da2e3ebdSchin 		n2 = sfvalue(in2);
74da2e3ebdSchin 	while(cp1 && cp2)
75da2e3ebdSchin 	{
76da2e3ebdSchin 		n=(n1<n2?n1:n2);
77da2e3ebdSchin 		if((comp=memcmp(cp1,cp2,n-1))==0 && (comp=n1-n2)==0)
78da2e3ebdSchin 		{
79da2e3ebdSchin 			if(mode&C_COMMON)
80da2e3ebdSchin 			{
81da2e3ebdSchin 				if(mode!=C_COMMON)
82da2e3ebdSchin 				{
83da2e3ebdSchin 					sfputc(out,'\t');
84da2e3ebdSchin 					if(mode==C_ALL)
85da2e3ebdSchin 						sfputc(out,'\t');
86da2e3ebdSchin 				}
87da2e3ebdSchin 				if(sfwrite(out,cp1,n) < 0)
88da2e3ebdSchin 					return(-1);
89da2e3ebdSchin 			}
90da2e3ebdSchin 			if(cp1 = sfgetr(in1,'\n',0))
91da2e3ebdSchin 				n1 = sfvalue(in1);
92da2e3ebdSchin 			if(cp2 = sfgetr(in2,'\n',0))
93da2e3ebdSchin 				n2 = sfvalue(in2);
94da2e3ebdSchin 		}
95da2e3ebdSchin 		else if(comp > 0)
96da2e3ebdSchin 		{
97da2e3ebdSchin 			if(mode&C_FILE2)
98da2e3ebdSchin 			{
99da2e3ebdSchin 				if(mode&C_FILE1)
100da2e3ebdSchin 					sfputc(out,'\t');
101da2e3ebdSchin 				if(sfwrite(out,cp2,n2) < 0)
102da2e3ebdSchin 					return(-1);
103da2e3ebdSchin 			}
104da2e3ebdSchin 			if(cp2 = sfgetr(in2,'\n',0))
105da2e3ebdSchin 				n2 = sfvalue(in2);
106da2e3ebdSchin 		}
107da2e3ebdSchin 		else
108da2e3ebdSchin 		{
109da2e3ebdSchin 			if((mode&C_FILE1) && sfwrite(out,cp1,n1) < 0)
110da2e3ebdSchin 				return(-1);
111da2e3ebdSchin 			if(cp1 = sfgetr(in1,'\n',0))
112da2e3ebdSchin 				n1 = sfvalue(in1);
113da2e3ebdSchin 		}
114da2e3ebdSchin 	}
115da2e3ebdSchin 	n = 0;
116da2e3ebdSchin 	if(cp2)
117da2e3ebdSchin 	{
118da2e3ebdSchin 		cp1 = cp2;
119da2e3ebdSchin 		in1 = in2;
120da2e3ebdSchin 		n1 = n2;
121da2e3ebdSchin 		if(mode&C_FILE1)
122da2e3ebdSchin 			n = 1;
123da2e3ebdSchin 		mode &= C_FILE2;
124da2e3ebdSchin 	}
125da2e3ebdSchin 	else
126da2e3ebdSchin 		mode &= C_FILE1;
127da2e3ebdSchin 	if(!mode || !cp1)
128da2e3ebdSchin 	{
129da2e3ebdSchin 		if(cp1 && in1==sfstdin)
130da2e3ebdSchin 			sfseek(in1,(Sfoff_t)0,SEEK_END);
131da2e3ebdSchin 		return(0);
132da2e3ebdSchin 	}
133da2e3ebdSchin 	/* process the remaining stream */
134da2e3ebdSchin 	while(1)
135da2e3ebdSchin 	{
136da2e3ebdSchin 		if(n)
137da2e3ebdSchin 			sfputc(out,'\t');
138da2e3ebdSchin 		if(sfwrite(out,cp1,n1) < 0)
139da2e3ebdSchin 			return(-1);
140da2e3ebdSchin 		if(!(cp1 = sfgetr(in1,'\n',0)))
141da2e3ebdSchin 			return(0);
142da2e3ebdSchin 		n1 = sfvalue(in1);
143da2e3ebdSchin 	}
144da2e3ebdSchin 	/* NOT REACHED */
145da2e3ebdSchin }
146da2e3ebdSchin 
147da2e3ebdSchin int
b_comm(int argc,char * argv[],Shbltin_t * context)148*b30d1939SAndy Fiddaman b_comm(int argc, char *argv[], Shbltin_t* context)
149da2e3ebdSchin {
150da2e3ebdSchin 	register int mode = C_FILE1|C_FILE2|C_COMMON;
151da2e3ebdSchin 	register char *cp;
152da2e3ebdSchin 	Sfio_t *f1, *f2;
153da2e3ebdSchin 
154da2e3ebdSchin 	cmdinit(argc, argv, context, ERROR_CATALOG, 0);
155*b30d1939SAndy Fiddaman 	for (;;)
156da2e3ebdSchin 	{
157*b30d1939SAndy Fiddaman 		switch (optget(argv, usage))
158*b30d1939SAndy Fiddaman 		{
159*b30d1939SAndy Fiddaman  		case '1':
160*b30d1939SAndy Fiddaman 			mode &= ~C_FILE1;
161*b30d1939SAndy Fiddaman 			continue;
162*b30d1939SAndy Fiddaman 		case '2':
163*b30d1939SAndy Fiddaman 			mode &= ~C_FILE2;
164*b30d1939SAndy Fiddaman 			continue;
165*b30d1939SAndy Fiddaman 		case '3':
166*b30d1939SAndy Fiddaman 			mode &= ~C_COMMON;
167*b30d1939SAndy Fiddaman 			continue;
168*b30d1939SAndy Fiddaman 		case ':':
169*b30d1939SAndy Fiddaman 			error(2, "%s",opt_info.arg);
170*b30d1939SAndy Fiddaman 			break;
171*b30d1939SAndy Fiddaman 		case '?':
172*b30d1939SAndy Fiddaman 			error(ERROR_usage(2), "%s",opt_info.arg);
173*b30d1939SAndy Fiddaman 			break;
174*b30d1939SAndy Fiddaman 		}
175da2e3ebdSchin 		break;
176da2e3ebdSchin 	}
177da2e3ebdSchin 	argv += opt_info.index;
178da2e3ebdSchin 	argc -= opt_info.index;
179da2e3ebdSchin 	if(error_info.errors || argc!=2)
180da2e3ebdSchin 		error(ERROR_usage(2),"%s",optusage(NiL));
181da2e3ebdSchin 	cp = *argv++;
182da2e3ebdSchin 	if(streq(cp,"-"))
183da2e3ebdSchin 		f1 = sfstdin;
184da2e3ebdSchin 	else if(!(f1 = sfopen(NiL, cp,"r")))
185da2e3ebdSchin 		error(ERROR_system(1),"%s: cannot open",cp);
186da2e3ebdSchin 	cp = *argv;
187da2e3ebdSchin 	if(streq(cp,"-"))
188da2e3ebdSchin 		f2 = sfstdin;
189da2e3ebdSchin 	else if(!(f2 = sfopen(NiL, cp,"r")))
190da2e3ebdSchin 		error(ERROR_system(1),"%s: cannot open",cp);
191da2e3ebdSchin 	if(mode)
192da2e3ebdSchin 	{
193da2e3ebdSchin 		if(comm(f1,f2,sfstdout,mode) < 0)
194da2e3ebdSchin 			error(ERROR_system(1)," write error");
195da2e3ebdSchin 	}
196da2e3ebdSchin 	else if(f1==sfstdin || f2==sfstdin)
197da2e3ebdSchin 		sfseek(sfstdin,(Sfoff_t)0,SEEK_END);
198da2e3ebdSchin 	if(f1!=sfstdin)
199da2e3ebdSchin 		sfclose(f1);
200da2e3ebdSchin 	if(f2!=sfstdin)
201da2e3ebdSchin 		sfclose(f2);
202*b30d1939SAndy Fiddaman 	return error_info.errors;
203da2e3ebdSchin }
204