xref: /plan9/sys/src/ape/cmd/diff/dir.c (revision 0b459c2cb92b7c9d88818e9a2f72e678e5bc4553)
1*0b459c2cSDavid du Colombier /* Read, sort and compare two directories.  Used for GNU DIFF.
2*0b459c2cSDavid du Colombier    Copyright (C) 1988, 1989, 1992, 1993, 1994 Free Software Foundation, Inc.
3*0b459c2cSDavid du Colombier 
4*0b459c2cSDavid du Colombier This file is part of GNU DIFF.
5*0b459c2cSDavid du Colombier 
6*0b459c2cSDavid du Colombier GNU DIFF is free software; you can redistribute it and/or modify
7*0b459c2cSDavid du Colombier it under the terms of the GNU General Public License as published by
8*0b459c2cSDavid du Colombier the Free Software Foundation; either version 2, or (at your option)
9*0b459c2cSDavid du Colombier any later version.
10*0b459c2cSDavid du Colombier 
11*0b459c2cSDavid du Colombier GNU DIFF is distributed in the hope that it will be useful,
12*0b459c2cSDavid du Colombier but WITHOUT ANY WARRANTY; without even the implied warranty of
13*0b459c2cSDavid du Colombier MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
14*0b459c2cSDavid du Colombier GNU General Public License for more details.
15*0b459c2cSDavid du Colombier 
16*0b459c2cSDavid du Colombier You should have received a copy of the GNU General Public License
17*0b459c2cSDavid du Colombier along with GNU DIFF; see the file COPYING.  If not, write to
18*0b459c2cSDavid du Colombier the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA.  */
19*0b459c2cSDavid du Colombier 
20*0b459c2cSDavid du Colombier #include "diff.h"
21*0b459c2cSDavid du Colombier 
22*0b459c2cSDavid du Colombier /* Read the directory named by DIR and store into DIRDATA a sorted vector
23*0b459c2cSDavid du Colombier    of filenames for its contents.  DIR->desc == -1 means this directory is
24*0b459c2cSDavid du Colombier    known to be nonexistent, so set DIRDATA to an empty vector.
25*0b459c2cSDavid du Colombier    Return -1 (setting errno) if error, 0 otherwise.  */
26*0b459c2cSDavid du Colombier 
/* The sorted listing of one directory, as filled in by dir_sort.
   diff_dirs frees both members when it is done with them.  */
struct dirdata
{
  /* Vector of pointers to the file names, terminated by a null
     pointer; dir_sort leaves it sorted.  */
  const char **names;

  /* The block holding the characters of the file names, or null
     if no block was allocated.  */
  char *data;
};
32*0b459c2cSDavid du Colombier 
33*0b459c2cSDavid du Colombier static int compare_names PARAMS((void const *, void const *));
34*0b459c2cSDavid du Colombier static int dir_sort PARAMS((struct file_data const *, struct dirdata *));
35*0b459c2cSDavid du Colombier 
36*0b459c2cSDavid du Colombier static int
dir_sort(dir,dirdata)37*0b459c2cSDavid du Colombier dir_sort (dir, dirdata)
38*0b459c2cSDavid du Colombier      struct file_data const *dir;
39*0b459c2cSDavid du Colombier      struct dirdata *dirdata;
40*0b459c2cSDavid du Colombier {
41*0b459c2cSDavid du Colombier   register struct dirent *next;
42*0b459c2cSDavid du Colombier   register int i;
43*0b459c2cSDavid du Colombier 
44*0b459c2cSDavid du Colombier   /* Address of block containing the files that are described.  */
45*0b459c2cSDavid du Colombier   char const **names;
46*0b459c2cSDavid du Colombier 
47*0b459c2cSDavid du Colombier   /* Number of files in directory.  */
48*0b459c2cSDavid du Colombier   size_t nnames;
49*0b459c2cSDavid du Colombier 
50*0b459c2cSDavid du Colombier   /* Allocated and used storage for file name data.  */
51*0b459c2cSDavid du Colombier   char *data;
52*0b459c2cSDavid du Colombier   size_t data_alloc, data_used;
53*0b459c2cSDavid du Colombier 
54*0b459c2cSDavid du Colombier   dirdata->names = 0;
55*0b459c2cSDavid du Colombier   dirdata->data = 0;
56*0b459c2cSDavid du Colombier   nnames = 0;
57*0b459c2cSDavid du Colombier   data = 0;
58*0b459c2cSDavid du Colombier 
59*0b459c2cSDavid du Colombier   if (dir->desc != -1)
60*0b459c2cSDavid du Colombier     {
61*0b459c2cSDavid du Colombier       /* Open the directory and check for errors.  */
62*0b459c2cSDavid du Colombier       register DIR *reading = opendir (dir->name);
63*0b459c2cSDavid du Colombier       if (!reading)
64*0b459c2cSDavid du Colombier 	return -1;
65*0b459c2cSDavid du Colombier 
66*0b459c2cSDavid du Colombier       /* Initialize the table of filenames.  */
67*0b459c2cSDavid du Colombier 
68*0b459c2cSDavid du Colombier       data_alloc = max (1, (size_t) dir->stat.st_size);
69*0b459c2cSDavid du Colombier       data_used = 0;
70*0b459c2cSDavid du Colombier       dirdata->data = data = xmalloc (data_alloc);
71*0b459c2cSDavid du Colombier 
72*0b459c2cSDavid du Colombier       /* Read the directory entries, and insert the subfiles
73*0b459c2cSDavid du Colombier 	 into the `data' table.  */
74*0b459c2cSDavid du Colombier 
75*0b459c2cSDavid du Colombier       while ((errno = 0, (next = readdir (reading)) != 0))
76*0b459c2cSDavid du Colombier 	{
77*0b459c2cSDavid du Colombier 	  char *d_name = next->d_name;
78*0b459c2cSDavid du Colombier 	  size_t d_size = NAMLEN (next) + 1;
79*0b459c2cSDavid du Colombier 
80*0b459c2cSDavid du Colombier 	  /* Ignore the files `.' and `..' */
81*0b459c2cSDavid du Colombier 	  if (d_name[0] == '.'
82*0b459c2cSDavid du Colombier 	      && (d_name[1] == 0 || (d_name[1] == '.' && d_name[2] == 0)))
83*0b459c2cSDavid du Colombier 	    continue;
84*0b459c2cSDavid du Colombier 
85*0b459c2cSDavid du Colombier 	  if (excluded_filename (d_name))
86*0b459c2cSDavid du Colombier 	    continue;
87*0b459c2cSDavid du Colombier 
88*0b459c2cSDavid du Colombier 	  while (data_alloc < data_used + d_size)
89*0b459c2cSDavid du Colombier 	    dirdata->data = data = xrealloc (data, data_alloc *= 2);
90*0b459c2cSDavid du Colombier 	  memcpy (data + data_used, d_name, d_size);
91*0b459c2cSDavid du Colombier 	  data_used += d_size;
92*0b459c2cSDavid du Colombier 	  nnames++;
93*0b459c2cSDavid du Colombier 	}
94*0b459c2cSDavid du Colombier       if (errno)
95*0b459c2cSDavid du Colombier 	{
96*0b459c2cSDavid du Colombier 	  int e = errno;
97*0b459c2cSDavid du Colombier 	  closedir (reading);
98*0b459c2cSDavid du Colombier 	  errno = e;
99*0b459c2cSDavid du Colombier 	  return -1;
100*0b459c2cSDavid du Colombier 	}
101*0b459c2cSDavid du Colombier #if CLOSEDIR_VOID
102*0b459c2cSDavid du Colombier       closedir (reading);
103*0b459c2cSDavid du Colombier #else
104*0b459c2cSDavid du Colombier       if (closedir (reading) != 0)
105*0b459c2cSDavid du Colombier 	return -1;
106*0b459c2cSDavid du Colombier #endif
107*0b459c2cSDavid du Colombier     }
108*0b459c2cSDavid du Colombier 
109*0b459c2cSDavid du Colombier   /* Create the `names' table from the `data' table.  */
110*0b459c2cSDavid du Colombier   dirdata->names = names = (char const **) xmalloc (sizeof (char *)
111*0b459c2cSDavid du Colombier 						    * (nnames + 1));
112*0b459c2cSDavid du Colombier   for (i = 0;  i < nnames;  i++)
113*0b459c2cSDavid du Colombier     {
114*0b459c2cSDavid du Colombier       names[i] = data;
115*0b459c2cSDavid du Colombier       data += strlen (data) + 1;
116*0b459c2cSDavid du Colombier     }
117*0b459c2cSDavid du Colombier   names[nnames] = 0;
118*0b459c2cSDavid du Colombier 
119*0b459c2cSDavid du Colombier   /* Sort the table.  */
120*0b459c2cSDavid du Colombier   qsort (names, nnames, sizeof (char *), compare_names);
121*0b459c2cSDavid du Colombier 
122*0b459c2cSDavid du Colombier   return 0;
123*0b459c2cSDavid du Colombier }
124*0b459c2cSDavid du Colombier 
/* Comparison function handed to qsort by dir_sort.  FILE1 and FILE2
   each point to an element of the names vector, i.e. to a pointer to
   a file name; the result is whatever filename_cmp gives for the two
   names.  */

static int
compare_names (file1, file2)
     void const *file1, *file2;
{
  char const *const *first = file1;
  char const *const *second = file2;

  return filename_cmp (*first, *second);
}
134*0b459c2cSDavid du Colombier 
135*0b459c2cSDavid du Colombier /* Compare the contents of two directories named in FILEVEC[0] and FILEVEC[1].
136*0b459c2cSDavid du Colombier    This is a top-level routine; it does everything necessary for diff
137*0b459c2cSDavid du Colombier    on two directories.
138*0b459c2cSDavid du Colombier 
139*0b459c2cSDavid du Colombier    FILEVEC[0].desc == -1 says directory FILEVEC[0] doesn't exist,
140*0b459c2cSDavid du Colombier    but pretend it is empty.  Likewise for FILEVEC[1].
141*0b459c2cSDavid du Colombier 
142*0b459c2cSDavid du Colombier    HANDLE_FILE is a caller-provided subroutine called to handle each file.
143*0b459c2cSDavid du Colombier    It gets five operands: dir and name (rel to original working dir) of file
144*0b459c2cSDavid du Colombier    in dir 0, dir and name pathname of file in dir 1, and the recursion depth.
145*0b459c2cSDavid du Colombier 
146*0b459c2cSDavid du Colombier    For a file that appears in only one of the dirs, one of the name-args
147*0b459c2cSDavid du Colombier    to HANDLE_FILE is zero.
148*0b459c2cSDavid du Colombier 
149*0b459c2cSDavid du Colombier    DEPTH is the current depth in recursion, used for skipping top-level
150*0b459c2cSDavid du Colombier    files by the -S option.
151*0b459c2cSDavid du Colombier 
152*0b459c2cSDavid du Colombier    Returns the maximum of all the values returned by HANDLE_FILE,
153*0b459c2cSDavid du Colombier    or 2 if trouble is encountered in opening files.  */
154*0b459c2cSDavid du Colombier 
155*0b459c2cSDavid du Colombier int
diff_dirs(filevec,handle_file,depth)156*0b459c2cSDavid du Colombier diff_dirs (filevec, handle_file, depth)
157*0b459c2cSDavid du Colombier      struct file_data const filevec[];
158*0b459c2cSDavid du Colombier      int (*handle_file) PARAMS((char const *, char const *, char const *, char const *, int));
159*0b459c2cSDavid du Colombier      int depth;
160*0b459c2cSDavid du Colombier {
161*0b459c2cSDavid du Colombier   struct dirdata dirdata[2];
162*0b459c2cSDavid du Colombier   int val = 0;			/* Return value.  */
163*0b459c2cSDavid du Colombier   int i;
164*0b459c2cSDavid du Colombier 
165*0b459c2cSDavid du Colombier   /* Get sorted contents of both dirs.  */
166*0b459c2cSDavid du Colombier   for (i = 0; i < 2; i++)
167*0b459c2cSDavid du Colombier     if (dir_sort (&filevec[i], &dirdata[i]) != 0)
168*0b459c2cSDavid du Colombier       {
169*0b459c2cSDavid du Colombier 	perror_with_name (filevec[i].name);
170*0b459c2cSDavid du Colombier 	val = 2;
171*0b459c2cSDavid du Colombier       }
172*0b459c2cSDavid du Colombier 
173*0b459c2cSDavid du Colombier   if (val == 0)
174*0b459c2cSDavid du Colombier     {
175*0b459c2cSDavid du Colombier       register char const * const *names0 = dirdata[0].names;
176*0b459c2cSDavid du Colombier       register char const * const *names1 = dirdata[1].names;
177*0b459c2cSDavid du Colombier       char const *name0 = filevec[0].name;
178*0b459c2cSDavid du Colombier       char const *name1 = filevec[1].name;
179*0b459c2cSDavid du Colombier 
180*0b459c2cSDavid du Colombier       /* If `-S name' was given, and this is the topmost level of comparison,
181*0b459c2cSDavid du Colombier 	 ignore all file names less than the specified starting name.  */
182*0b459c2cSDavid du Colombier 
183*0b459c2cSDavid du Colombier       if (dir_start_file && depth == 0)
184*0b459c2cSDavid du Colombier 	{
185*0b459c2cSDavid du Colombier 	  while (*names0 && filename_cmp (*names0, dir_start_file) < 0)
186*0b459c2cSDavid du Colombier 	    names0++;
187*0b459c2cSDavid du Colombier 	  while (*names1 && filename_cmp (*names1, dir_start_file) < 0)
188*0b459c2cSDavid du Colombier 	    names1++;
189*0b459c2cSDavid du Colombier 	}
190*0b459c2cSDavid du Colombier 
191*0b459c2cSDavid du Colombier       /* Loop while files remain in one or both dirs.  */
192*0b459c2cSDavid du Colombier       while (*names0 || *names1)
193*0b459c2cSDavid du Colombier 	{
194*0b459c2cSDavid du Colombier 	  /* Compare next name in dir 0 with next name in dir 1.
195*0b459c2cSDavid du Colombier 	     At the end of a dir,
196*0b459c2cSDavid du Colombier 	     pretend the "next name" in that dir is very large.  */
197*0b459c2cSDavid du Colombier 	  int nameorder = (!*names0 ? 1 : !*names1 ? -1
198*0b459c2cSDavid du Colombier 			   : filename_cmp (*names0, *names1));
199*0b459c2cSDavid du Colombier 	  int v1 = (*handle_file) (name0, 0 < nameorder ? 0 : *names0++,
200*0b459c2cSDavid du Colombier 				   name1, nameorder < 0 ? 0 : *names1++,
201*0b459c2cSDavid du Colombier 				   depth + 1);
202*0b459c2cSDavid du Colombier 	  if (v1 > val)
203*0b459c2cSDavid du Colombier 	    val = v1;
204*0b459c2cSDavid du Colombier 	}
205*0b459c2cSDavid du Colombier     }
206*0b459c2cSDavid du Colombier 
207*0b459c2cSDavid du Colombier   for (i = 0; i < 2; i++)
208*0b459c2cSDavid du Colombier     {
209*0b459c2cSDavid du Colombier       if (dirdata[i].names)
210*0b459c2cSDavid du Colombier 	free (dirdata[i].names);
211*0b459c2cSDavid du Colombier       if (dirdata[i].data)
212*0b459c2cSDavid du Colombier 	free (dirdata[i].data);
213*0b459c2cSDavid du Colombier     }
214*0b459c2cSDavid du Colombier 
215*0b459c2cSDavid du Colombier   return val;
216*0b459c2cSDavid du Colombier }
217