/*-
 * %sccs.include.proprietary.c%
 */

#ifndef lint
static char sccsid[] = "@(#)hunt1.c 4.4 (Berkeley) 04/18/91";
#endif /* not lint */

# include <stdio.h>
# include <assert.h>

/* Objects defined in other source files of this program. */
extern char refdir[];
extern int keepold;		/* cleared by the -g option */
extern char *fgnames[];		/* names of files to be searched with fgrep */
extern char **fgnamp;		/* one past the last used slot of fgnames */

FILE *fd = NULL;		/* stream on the ".id" file, opened by main() */
int lmaster = 500;		/* entries allocated for the master list (-l) */
/*
 * hfreq is the second table read from the ".ia" file (nhash ints following
 * the hash table); hfrflg is nonzero when all nhash entries could be read.
 * NOTE(review): presumably per-hash term frequencies -- confirm in users.
 */
int *hfreq, hfrflg;
int colevel = 0;		/* coordination level (-C) */
int measure = 0;		/* -m: call tick()/tock() around each query */
int soutlen = 1000;		/* length that may follow the -s/-o string */
int reached = 0;		/* not referenced in this file */
int iflong = 0;			/* flag read from the ".ia" header; nonzero
				 * selects long-sized master list entries */
int prfreqs = 0;		/* -P: print term freqs */
char usedir[100];		/* directory last entered by todir() */
char * calloc();
char * todir();
char gfile[50];			/* not referenced in this file */
static int full = 1000;		/* -F: put out full text (0 disables) */
static int tags = 0;		/* -T: put out tags (0 disables) */
/* -i query string, -s/-o text output string, -t tag output string */
char *sinput, *soutput, *tagout;
long indexdate = 0, gdate();	/* indexdate is gdate() of the ".ib" stream */

main(argc,argv)3312283Stut main(argc,argv)
3412283Stut char *argv[];
3512283Stut {
3612283Stut /* read query from stdin, expect name of indexes in argv[1] */
3712283Stut static FILE *fa, *fb, *fc;
3813225Sgarrison char nma[100], nmb[100], nmc[100], *qitem[100], *rprog = NULL;
3912283Stut char nmd[100], grepquery[256];
4012283Stut static char oldname[30] ;
4113225Sgarrison static int was =0;
4212283Stut /* these pointers are unions of pointer to int and pointer to long */
4312283Stut long *hpt;
4413225Sgarrison unsigned *master =0;
4512283Stut int falseflg, nhash, nitem, nfound, frtbl, kk;
4612283Stut
4712283Stut /* special wart for refpart: default is tags only */
4812283Stut
4912283Stut while (argv[1][0] == '-')
5012283Stut {
5112283Stut switch(argv[1][1])
5212283Stut {
5312283Stut case 'a': /* all output, incl. false drops */
5412283Stut falseflg = 1;
5512283Stut break;
5612283Stut case 'r':
5712283Stut argc--;
5812283Stut argv++;
5912283Stut rprog = argv[1];
6012283Stut break;
6112283Stut case 'F': /* put out full text */
6212283Stut full = setfrom(argv[1][2]);
6312283Stut break;
6412283Stut case 'T': /* put out tags */
6512283Stut tags = setfrom(argv[1][2]);
6612283Stut break;
6712283Stut case 'i': /* input in argument string */
6812283Stut argc--;
6912283Stut argv++;
7012283Stut sinput = argv[1];
7112283Stut break;
7212283Stut case 's': /*text output to string */
7312283Stut case 'o':
7412283Stut argc--;
7512283Stut argv++;
7612283Stut soutput = argv[1];
7717679Sralph if ((int) argv[2]<16000)
7812283Stut {
7913225Sgarrison soutlen = (int)argv[2];
8012283Stut argc--;
8112283Stut argv++;
8212283Stut }
8312283Stut break;
8412283Stut case 't': /*tag output to string */
8512283Stut argc--;
8612283Stut argv++;
8712283Stut tagout = argv[1];
8812283Stut break;
8912283Stut case 'l': /* length of internal lists */
9012283Stut argc--;
9112283Stut argv++;
9212283Stut lmaster = atoi(argv[1]);
9312283Stut break;
9412283Stut case 'g': /* suppress fgrep search on old files */
9512283Stut keepold = 0;
9612283Stut break;
9712283Stut case 'C': /* coordination level */
9812283Stut colevel = atoi(argv[1]+2);
9912283Stut # if D1
10012283Stut fprintf(stderr, "colevel set to %d\n",colevel);
10112283Stut # endif
10212283Stut break;
10312283Stut case 'P': /* print term freqs */
10412283Stut prfreqs=1;
10512283Stut break;
10613225Sgarrison case 'm':
10713225Sgarrison measure=1;
10813225Sgarrison break;
10912283Stut }
11012283Stut argc--;
11112283Stut argv++;
11212283Stut }
11312283Stut strcpy (nma, todir(argv[1]));
11412283Stut if (was == 0 || strcmp (oldname, nma) !=0)
11512283Stut {
11612283Stut strcpy (oldname,nma);
11712283Stut strcpy (nmb, nma);
11812283Stut strcpy (nmc, nmb);
11912283Stut strcpy(nmd,nma);
12012283Stut strcat (nma, ".ia");
12112283Stut strcat (nmb, ".ib");
12212283Stut strcat (nmc, ".ic");
12312283Stut strcat (nmd, ".id");
12412283Stut if (was)
12512283Stut {
12612283Stut fclose(fa);
12712283Stut fclose(fb);
12812283Stut fclose(fc);
12912283Stut }
13012283Stut
13112283Stut fa = fopen(nma, "r");
13212283Stut if (fa==NULL)
13312283Stut {
13413225Sgarrison strcpy(*fgnamp++ = calloc(strlen(oldname)+2,1), oldname);
13513225Sgarrison fb=NULL;
13613225Sgarrison goto search;
13712283Stut }
13812283Stut fb = fopen(nmb, "r");
13912283Stut fc = fopen(nmc, "r");
14012283Stut was =1;
14112283Stut if (fb== NULL || fc ==NULL)
14212283Stut {
14312283Stut err("Index incomplete %s", nmb);
14412283Stut exit(1);
14512283Stut }
14612283Stut indexdate = gdate(fb);
14712283Stut fd = fopen(nmd, "r");
14812283Stut }
14912283Stut fseek (fa, 0L, 0);
15012283Stut fread (&nhash, sizeof(nhash), 1, fa);
15112283Stut fread (&iflong, sizeof(iflong), 1, fa);
15212283Stut if(master==0)
15317679Sralph master = (unsigned *) calloc (lmaster, iflong? sizeof(long): sizeof(unsigned));
15417679Sralph hpt = (long *) calloc(nhash, sizeof(*hpt));
15512283Stut kk=fread( hpt, sizeof(*hpt), nhash, fa);
15612283Stut # if D1
15712283Stut fprintf(stderr,"read %d hashes, iflong %d, nhash %d\n", kk, iflong, nhash);
15812283Stut # endif
15912283Stut _assert (kk==nhash);
16017679Sralph hfreq = (int *) calloc(nhash, sizeof(*hfreq));
16112283Stut _assert (hfreq != NULL);
16212283Stut frtbl = fread(hfreq, sizeof(*hfreq), nhash, fa);
16312283Stut hfrflg = (frtbl == nhash);
16412283Stut # if D1
16512283Stut fprintf(stderr, "read freqs %d\n", frtbl);
16612283Stut # endif
16712283Stut
16813225Sgarrison search:
16912283Stut while (1)
17012283Stut {
17112283Stut nitem = getq(qitem);
17213225Sgarrison if (measure) tick();
17312283Stut if (nitem==0) continue;
17412283Stut if (nitem < 0) break;
17513225Sgarrison if (tagout) tagout[0]=0;
17613225Sgarrison if (fb!=NULL)
17713225Sgarrison {
17813225Sgarrison nfound = doquery(hpt, nhash, fb, nitem, qitem, master);
17912283Stut # if D1
18013225Sgarrison fprintf(stderr,"after doquery nfound %d\n", nfound);
18112283Stut # endif
18213225Sgarrison fgnamp=fgnames;
18313225Sgarrison if (falseflg == 0)
18413225Sgarrison nfound = baddrop(master, nfound, fc, nitem, qitem, rprog, full);
18512283Stut # if D1
18613225Sgarrison fprintf(stderr,"after baddrop nfound %d\n", nfound);
18712283Stut # endif
18813225Sgarrison }
18912283Stut if (fgnamp>fgnames)
19012283Stut {
19112283Stut char **fgp, tgbuff[100];
19212283Stut int k;
19312283Stut # if D1
19412283Stut fprintf(stderr, "were %d bad files\n", fgnamp-fgnames);
19512283Stut # endif
19612283Stut grepquery[0]=0;
19712283Stut for(k=0; k<nitem; k++)
19812283Stut {
19912283Stut strcat(grepquery, " ");
20012283Stut strcat(grepquery, qitem[k]);
20112283Stut }
20212283Stut # if D1
20312283Stut fprintf(stderr, "grepquery %s\n",grepquery);
20412283Stut # endif
20512283Stut for(fgp=fgnames; fgp<fgnamp; fgp++)
20612283Stut {
20712283Stut # if D1
20812283Stut fprintf(stderr, "Now on %s query /%s/\n", *fgp, grepquery);
20912283Stut # endif
21012283Stut makefgrep(*fgp);
21112283Stut # if D1
21212283Stut fprintf(stderr, "grepmade\n");
21312283Stut # endif
21412283Stut if (tagout==0)
21512283Stut tagout=tgbuff;
21612283Stut grepcall(grepquery, tagout, *fgp);
21712283Stut # if D1
21812283Stut fprintf(stderr, "tagout now /%s/\n", tagout);
21912283Stut # endif
22012283Stut if (full)
22112283Stut {
22212283Stut char bout[1000];
22313225Sgarrison char *tagp;
22413225Sgarrison char *oldtagp;
22513225Sgarrison tagp = tagout;
22613225Sgarrison while (*tagp) {
22713225Sgarrison oldtagp = tagp;
22813225Sgarrison while (*tagp && (*tagp != '\n'))
22913225Sgarrison tagp++;
23013225Sgarrison if (*tagp)
23113225Sgarrison tagp++;
23213225Sgarrison findline(oldtagp, bout, 1000);
23313225Sgarrison fputs(bout,stdout);
23413225Sgarrison }
23512283Stut }
23612283Stut }
23712283Stut }
23812283Stut if (tags)
23912283Stut result (master, nfound >tags ? tags: nfound, fc);
24013225Sgarrison if (measure) tock();
24112283Stut }
24212283Stut }
24312283Stut
24412283Stut char *
todir(t)24512283Stut todir(t)
24612283Stut char *t;
24712283Stut {
24812283Stut char *s;
24912283Stut s=t;
25012283Stut while (*s) s++;
25112283Stut while (s>=t && *s != '/') s--;
25212283Stut if (s<t) return(t);
25312283Stut *s++ = 0;
25412283Stut t = (*t ? t : "/");
25512283Stut chdir (t);
25612283Stut strcpy (usedir,t);
25712283Stut return(s);
25812283Stut }
/*
 * setfrom -- decode the character that follows a -F or -T option letter.
 *
 * 'n' and '0' give 0, the digits '1' through '9' give their numeric
 * value, and every other character -- including 'y' and the NUL found
 * when nothing follows the option letter -- gives 1000.
 */
int
setfrom(int c)
{
	switch (c)
	{
	case 'n':
	case '0':
		return (0);
	case '1':
	case '2':
	case '3':
	case '4':
	case '5':
	case '6':
	case '7':
	case '8':
	case '9':
		return (c - '0');
	default:	/* also covers 'y' and '\0' */
		return (1000);
	}
}