xref: /onnv-gate/usr/src/cmd/spell/spellprog.c (revision 239:22a33675e457)
10Sstevel@tonic-gate /*
20Sstevel@tonic-gate  * CDDL HEADER START
30Sstevel@tonic-gate  *
40Sstevel@tonic-gate  * The contents of this file are subject to the terms of the
50Sstevel@tonic-gate  * Common Development and Distribution License, Version 1.0 only
60Sstevel@tonic-gate  * (the "License").  You may not use this file except in compliance
70Sstevel@tonic-gate  * with the License.
80Sstevel@tonic-gate  *
90Sstevel@tonic-gate  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
100Sstevel@tonic-gate  * or http://www.opensolaris.org/os/licensing.
110Sstevel@tonic-gate  * See the License for the specific language governing permissions
120Sstevel@tonic-gate  * and limitations under the License.
130Sstevel@tonic-gate  *
140Sstevel@tonic-gate  * When distributing Covered Code, include this CDDL HEADER in each
150Sstevel@tonic-gate  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
160Sstevel@tonic-gate  * If applicable, add the following below this CDDL HEADER, with the
170Sstevel@tonic-gate  * fields enclosed by brackets "[]" replaced with your own identifying
180Sstevel@tonic-gate  * information: Portions Copyright [yyyy] [name of copyright owner]
190Sstevel@tonic-gate  *
200Sstevel@tonic-gate  * CDDL HEADER END
210Sstevel@tonic-gate  */
22*239Sceastha /*
23*239Sceastha  * Copyright 2005 Sun Microsystems, Inc.  All rights reserved.
24*239Sceastha  * Use is subject to license terms.
25*239Sceastha  */
26*239Sceastha 
270Sstevel@tonic-gate /*	Copyright (c) 1984, 1986, 1987, 1988, 1989 AT&T	*/
280Sstevel@tonic-gate /*	  All Rights Reserved  	*/
290Sstevel@tonic-gate 
300Sstevel@tonic-gate #pragma ident	"%Z%%M%	%I%	%E% SMI"
310Sstevel@tonic-gate 
320Sstevel@tonic-gate #include <stdlib.h>
330Sstevel@tonic-gate #include <unistd.h>
340Sstevel@tonic-gate #include <limits.h>
350Sstevel@tonic-gate #include <string.h>
360Sstevel@tonic-gate #include <stdio.h>
370Sstevel@tonic-gate #include <ctype.h>
380Sstevel@tonic-gate #include <locale.h>
390Sstevel@tonic-gate #include "hash.h"
400Sstevel@tonic-gate 
/*
 * Tolower(c): lower-case c if it is an upper-case letter, otherwise yield
 * c unchanged.  The argument is evaluated more than once, so it must not
 * have side effects.  The value handed to the <ctype.h> routines is cast to
 * unsigned char because they are only defined for EOF and values
 * representable as unsigned char; a plain (possibly negative) char is not.
 */
#define	Tolower(c) \
	(isupper((unsigned char)(c)) ? tolower((unsigned char)(c)) : (c))

/* amount by which trysuff() advances the derivation level */
#define	DLEV 2
430Sstevel@tonic-gate 
/*
 * Forward declarations.
 *
 * The suffix routines (everything reachable through suftab) take the same
 * four arguments: ep, a pointer into word[] marking the end of the stem
 * being tried; d and a, the two derivation notes from the suftab entry;
 * and lev, the current index into the deriv[] stack.
 */
static int	ily(char *ep, char *d, char *a, int lev);
static int	s(char *ep, char *d, char *a, int lev);
static int	es(char *ep, char *d, char *a, int lev);
static int	subst(char *ep, char *d, char *a, int lev);
static int	nop(void);
static int	bility(char *ep, char *d, char *a, int lev);
static int	i_to_y(char *ep, char *d, char *a, int lev);
static int	CCe(char *ep, char *d, char *a, int lev);
static int	y_to_e(char *ep, char *d, char *a, int lev);
static int	strip(char *ep, char *d, char *a, int lev);
static int	ize(char *ep, char *d, char *a, int lev);
static int	tion(char *ep, char *d, char *a, int lev);
static int	an(char *ep, char *d, char *a, int lev);
int		prime(char *);
static void	ise(void);
static int	tryword(char *bp, char *ep, int lev);
static int	trypref(char *ep, char *a, int lev);
static int	trysuff(char *ep, int lev);
static int	vowel(int c);
static int	dict(char *bp, char *ep);
static int	monosyl(char *bp, char *ep);
static int	VCe(char *ep, char *d, char *a, int lev);
static char	*skipv(char *s);
static void	ztos(char *s);
710Sstevel@tonic-gate 
720Sstevel@tonic-gate static struct suftab {
730Sstevel@tonic-gate 	char *suf;
740Sstevel@tonic-gate 	int (*p1)();
750Sstevel@tonic-gate 	int n1;
760Sstevel@tonic-gate 	char *d1;
770Sstevel@tonic-gate 	char *a1;
780Sstevel@tonic-gate 	int (*p2)();
790Sstevel@tonic-gate 	int n2;
800Sstevel@tonic-gate 	char *d2;
810Sstevel@tonic-gate 	char *a2;
820Sstevel@tonic-gate } suftab[] = {
830Sstevel@tonic-gate 	{"ssen", ily, 4, "-y+iness", "+ness" },
840Sstevel@tonic-gate 	{"ssel", ily, 4, "-y+i+less", "+less" },
850Sstevel@tonic-gate 	{"se", s, 1, "", "+s", 	es, 2, "-y+ies", "+es" },
860Sstevel@tonic-gate 	{"s'", s, 2, "", "+'s"},
870Sstevel@tonic-gate 	{"s", s, 1, "", "+s"},
880Sstevel@tonic-gate 	{"ecn", subst, 1, "-t+ce", ""},
890Sstevel@tonic-gate 	{"ycn", subst, 1, "-t+cy", ""},
900Sstevel@tonic-gate 	{"ytilb", nop, 0, "", ""},
910Sstevel@tonic-gate 	{"ytilib", bility, 5, "-le+ility", ""},
920Sstevel@tonic-gate 	{"elbaif", i_to_y, 4, "-y+iable", ""},
930Sstevel@tonic-gate 	{"elba", CCe, 4, "-e+able", "+able"},
940Sstevel@tonic-gate 	{"yti", CCe, 3, "-e+ity", "+ity"},
950Sstevel@tonic-gate 	{"ylb", y_to_e, 1, "-e+y", ""},
960Sstevel@tonic-gate 	{"yl", ily, 2, "-y+ily", "+ly"},
970Sstevel@tonic-gate 	{"laci", strip, 2, "", "+al"},
980Sstevel@tonic-gate 	{"latnem", strip, 2, "", "+al"},
990Sstevel@tonic-gate 	{"lanoi", strip, 2, "", "+al"},
1000Sstevel@tonic-gate 	{"tnem", strip, 4, "", "+ment"},
1010Sstevel@tonic-gate 	{"gni", CCe, 3, "-e+ing", "+ing"},
1020Sstevel@tonic-gate 	{"reta", nop, 0, "", ""},
1030Sstevel@tonic-gate 	{"retc", nop, 0, "", ""},
1040Sstevel@tonic-gate 	{"re", strip, 1, "", "+r", i_to_y, 2, "-y+ier", "+er"},
1050Sstevel@tonic-gate 	{"de", strip, 1, "", "+d", i_to_y, 2, "-y+ied", "+ed"},
1060Sstevel@tonic-gate 	{"citsi", strip, 2, "", "+ic"},
1070Sstevel@tonic-gate 	{"citi", ize, 1, "-ic+e", ""},
1080Sstevel@tonic-gate 	{"cihparg", i_to_y, 1, "-y+ic", ""},
1090Sstevel@tonic-gate 	{"tse", strip, 2, "", "+st", 	i_to_y, 3, "-y+iest", "+est"},
1100Sstevel@tonic-gate 	{"cirtem", i_to_y, 1, "-y+ic", ""},
1110Sstevel@tonic-gate 	{"yrtem", subst, 0, "-er+ry", ""},
1120Sstevel@tonic-gate 	{"cigol", i_to_y, 1, "-y+ic", ""},
1130Sstevel@tonic-gate 	{"tsigol", i_to_y, 2, "-y+ist", ""},
1140Sstevel@tonic-gate 	{"tsi", CCe, 3, "-e+ist", "+ist"},
1150Sstevel@tonic-gate 	{"msi", CCe, 3, "-e+ism", "+ist"},
1160Sstevel@tonic-gate 	{"noitacifi", i_to_y, 6, "-y+ication", ""},
1170Sstevel@tonic-gate 	{"noitazi", ize, 4, "-e+ation", ""},
1180Sstevel@tonic-gate 	{"rota", tion, 2, "-e+or", ""},
1190Sstevel@tonic-gate 	{"rotc", tion, 2, "", "+or"},
1200Sstevel@tonic-gate 	{"noit", tion, 3, "-e+ion", "+ion"},
1210Sstevel@tonic-gate 	{"naino", an, 3, "", "+ian"},
1220Sstevel@tonic-gate 	{"na", an, 1, "", "+n"},
1230Sstevel@tonic-gate 	{"evi", subst, 0, "-ion+ive", ""},
1240Sstevel@tonic-gate 	{"ezi", CCe, 3, "-e+ize", "+ize"},
1250Sstevel@tonic-gate 	{"pihs", strip, 4, "", "+ship"},
1260Sstevel@tonic-gate 	{"dooh", ily, 4, "-y+ihood", "+hood"},
1270Sstevel@tonic-gate 	{"luf", ily, 3, "-y+iful", "+ful"},
1280Sstevel@tonic-gate 	{"ekil", strip, 4, "", "+like"},
1290Sstevel@tonic-gate 	0
1300Sstevel@tonic-gate };
1310Sstevel@tonic-gate 
/*
 * Prefixes recognised by lookuppref(), tried in the order listed.
 * The list is terminated by a null pointer.
 */
static char *preftab[] = {
	"anti", "auto", "bio", "counter",
	"dis", "electro", "en", "fore",
	"geo", "hyper", "intra", "inter",
	"iso", "kilo", "magneto", "meta",
	"micro", "mid", "milli", "mis",
	"mono", "multi", "non", "out",
	"over", "photo", "poly", "pre",
	"pseudo", "psycho", "re", "semi",
	"stereo", "sub", "super", "tele",
	"thermo", "ultra",
	"under",	/* must precede un */
	"un",
	NULL
};
1750Sstevel@tonic-gate 
1760Sstevel@tonic-gate static int vflag;
1770Sstevel@tonic-gate static int xflag;
1780Sstevel@tonic-gate static char *prog;
1790Sstevel@tonic-gate static char word[LINE_MAX];
1800Sstevel@tonic-gate static char original[LINE_MAX];
1810Sstevel@tonic-gate static char *deriv[LINE_MAX];
1820Sstevel@tonic-gate static char affix[LINE_MAX];
1830Sstevel@tonic-gate static FILE *file, *found;
1840Sstevel@tonic-gate /*
1850Sstevel@tonic-gate  *	deriv is stack of pointers to notes like +micro +ed
1860Sstevel@tonic-gate  *	affix is concatenated string of notes
1870Sstevel@tonic-gate  *	the buffer size 141 stems from the sizes of original and affix.
1880Sstevel@tonic-gate  */
1890Sstevel@tonic-gate 
1900Sstevel@tonic-gate /*
1910Sstevel@tonic-gate  *	in an attempt to defray future maintenance misunderstandings, here is
1920Sstevel@tonic-gate  *	an attempt to describe the input/output expectations of the spell
1930Sstevel@tonic-gate  *	program.
1940Sstevel@tonic-gate  *
1950Sstevel@tonic-gate  *	spellprog is intended to be called from the shell file spell.
1960Sstevel@tonic-gate  *	because of this, there is little error checking (this is historical, not
1970Sstevel@tonic-gate  *	necessarily advisable).
1980Sstevel@tonic-gate  *
1990Sstevel@tonic-gate  *	spellprog options hashed-list pass
2000Sstevel@tonic-gate  *
2010Sstevel@tonic-gate  *	the hashed-list is a list of the form made by spellin.
2020Sstevel@tonic-gate  *	there are 2 types of hashed lists:
2030Sstevel@tonic-gate  *		1. a stop list: this specifies words that by the rules embodied
2040Sstevel@tonic-gate  *		   in spellprog would be recognized as correct, BUT are really
2050Sstevel@tonic-gate  *		   errors.
2060Sstevel@tonic-gate  *		2. a dictionary of correctly spelled words.
2070Sstevel@tonic-gate  *	the pass number determines how the words found in the specified
2080Sstevel@tonic-gate  *	hashed-list are treated. If the pass number is 1, the hashed-list is
2090Sstevel@tonic-gate  *	treated as the stop-list, otherwise, it is treated as the regular
2100Sstevel@tonic-gate  *	dictionary list. in this case, the value of "pass" is a filename. Found
2110Sstevel@tonic-gate  *	words are written to this file.
2120Sstevel@tonic-gate  *
2130Sstevel@tonic-gate  *	In the normal case, the filename = /dev/null. However, if the v option
2140Sstevel@tonic-gate  *	is specified, the derivations are written to this file.
2150Sstevel@tonic-gate  *	The spellprog looks up words in the hashed-list; if a word is found, it
2160Sstevel@tonic-gate  *	is printed to the stdout. If the hashed-list was the stop-list, the
2170Sstevel@tonic-gate  *	words found are presumed to be misspellings. in this case,
2180Sstevel@tonic-gate  *	a control character is printed ( a "-" is appended to the word.
2190Sstevel@tonic-gate  *	a hyphen will never occur naturally in the input list because deroff
2200Sstevel@tonic-gate  *	is used in the shell file before calling spellprog.)
2210Sstevel@tonic-gate  *	If the regular spelling list was used (hlista or hlistb), the words
2220Sstevel@tonic-gate  *	are correct, and may be ditched. (unless the -v option was used -
2230Sstevel@tonic-gate  *	see the manual page).
2240Sstevel@tonic-gate  *
2250Sstevel@tonic-gate  *	spellprog should be called twice : first with the stop-list, to flag all
2260Sstevel@tonic-gate  *	a priori incorrectly spelled words; second with the dictionary.
2270Sstevel@tonic-gate  *
2280Sstevel@tonic-gate  *	spellprog hstop 1 |\
2290Sstevel@tonic-gate  *	spellprog hlista /dev/null
2300Sstevel@tonic-gate  *
2310Sstevel@tonic-gate  *	for a complete scenario, see the shell file: spell.
2320Sstevel@tonic-gate  *
2330Sstevel@tonic-gate  */
2340Sstevel@tonic-gate 
235*239Sceastha int
main(int argc,char ** argv)2360Sstevel@tonic-gate main(int argc, char **argv)
2370Sstevel@tonic-gate {
238*239Sceastha 	char *ep, *cp;
239*239Sceastha 	char *dp;
2400Sstevel@tonic-gate 	int fold;
2410Sstevel@tonic-gate 	int c, j;
2420Sstevel@tonic-gate 	int pass;
2430Sstevel@tonic-gate 
2440Sstevel@tonic-gate 	/* Set locale environment variables local definitions */
2450Sstevel@tonic-gate 	(void) setlocale(LC_ALL, "");
2460Sstevel@tonic-gate #if !defined(TEXT_DOMAIN)	/* Should be defined by cc -D */
2470Sstevel@tonic-gate #define	TEXT_DOMAIN "SYS_TEST"	/* Use this only if it wasn't */
2480Sstevel@tonic-gate #endif
2490Sstevel@tonic-gate 	(void) textdomain(TEXT_DOMAIN);
2500Sstevel@tonic-gate 
2510Sstevel@tonic-gate 
2520Sstevel@tonic-gate 	prog = argv[0];
2530Sstevel@tonic-gate 	while ((c = getopt(argc, argv, "bvx")) != EOF) {
2540Sstevel@tonic-gate 		switch (c) {
2550Sstevel@tonic-gate 		case 'b':
2560Sstevel@tonic-gate 			ise();
2570Sstevel@tonic-gate 			break;
2580Sstevel@tonic-gate 		case 'v':
2590Sstevel@tonic-gate 			vflag++;
2600Sstevel@tonic-gate 			break;
2610Sstevel@tonic-gate 		case 'x':
2620Sstevel@tonic-gate 			xflag++;
2630Sstevel@tonic-gate 			break;
2640Sstevel@tonic-gate 		}
2650Sstevel@tonic-gate 	}
2660Sstevel@tonic-gate 
2670Sstevel@tonic-gate 	argc -= optind;
2680Sstevel@tonic-gate 	argv = &argv[optind];
2690Sstevel@tonic-gate 
2700Sstevel@tonic-gate 	if ((argc < 2) || !prime(*argv)) {
2710Sstevel@tonic-gate 		(void) fprintf(stderr,
2720Sstevel@tonic-gate 		    gettext("%s: cannot initialize hash table\n"), prog);
2730Sstevel@tonic-gate 		exit(1);
2740Sstevel@tonic-gate 	}
2750Sstevel@tonic-gate 	argc--;
2760Sstevel@tonic-gate 	argv++;
2770Sstevel@tonic-gate 
2780Sstevel@tonic-gate /*
2790Sstevel@tonic-gate  *	if pass is not 1, it is assumed to be a filename.
2800Sstevel@tonic-gate  *	found words are written to this file.
2810Sstevel@tonic-gate  */
2820Sstevel@tonic-gate 	pass = **argv;
2830Sstevel@tonic-gate 	if (pass != '1')
2840Sstevel@tonic-gate 		found = fopen(*argv, "w");
2850Sstevel@tonic-gate 
2860Sstevel@tonic-gate 	for (;;) {
2870Sstevel@tonic-gate 		affix[0] = 0;
2880Sstevel@tonic-gate 		file = stdout;
2890Sstevel@tonic-gate 		for (ep = word; (*ep = j = getchar()) != '\n'; ep++)
2900Sstevel@tonic-gate 			if (j == EOF)
2910Sstevel@tonic-gate 				exit(0);
2920Sstevel@tonic-gate /*
2930Sstevel@tonic-gate  *	here is the hyphen processing. these words were found in the stop
2940Sstevel@tonic-gate  *	list. however, if they exist as is, (no derivations tried) in the
2950Sstevel@tonic-gate  *	dictionary, let them through as correct.
2960Sstevel@tonic-gate  *
2970Sstevel@tonic-gate  */
2980Sstevel@tonic-gate 		if (ep[-1] == '-') {
2990Sstevel@tonic-gate 			*--ep = 0;
3000Sstevel@tonic-gate 			if (!tryword(word, ep, 0))
3010Sstevel@tonic-gate 				(void) fprintf(file, "%s\n", word);
3020Sstevel@tonic-gate 			continue;
3030Sstevel@tonic-gate 		}
3040Sstevel@tonic-gate 		for (cp = word, dp = original; cp < ep; )
3050Sstevel@tonic-gate 			*dp++ = *cp++;
3060Sstevel@tonic-gate 		*dp = 0;
3070Sstevel@tonic-gate 		fold = 0;
3080Sstevel@tonic-gate 		for (cp = word; cp < ep; cp++)
3090Sstevel@tonic-gate 			if (islower(*cp))
3100Sstevel@tonic-gate 				goto lcase;
3110Sstevel@tonic-gate 		if (((ep - word) == 1) &&
3120Sstevel@tonic-gate 		    ((word[0] == 'A') || (word[0] == 'I')))
3130Sstevel@tonic-gate 			continue;
3140Sstevel@tonic-gate 		if (trypref(ep, ".", 0))
3150Sstevel@tonic-gate 			goto foundit;
3160Sstevel@tonic-gate 		++fold;
3170Sstevel@tonic-gate 		for (cp = original+1, dp = word+1; dp < ep; dp++, cp++)
3180Sstevel@tonic-gate 			*dp = Tolower(*cp);
3190Sstevel@tonic-gate lcase:
3200Sstevel@tonic-gate 		if (((ep - word) == 1) && (word[0] == 'a'))
3210Sstevel@tonic-gate 			continue;
3220Sstevel@tonic-gate 		if (trypref(ep, ".", 0)||trysuff(ep, 0))
3230Sstevel@tonic-gate 			goto foundit;
3240Sstevel@tonic-gate 		if (isupper(word[0])) {
3250Sstevel@tonic-gate 			for (cp = original, dp = word; *dp = *cp++; dp++)
3260Sstevel@tonic-gate 				if (fold) *dp = Tolower(*dp);
3270Sstevel@tonic-gate 			word[0] = Tolower(word[0]);
3280Sstevel@tonic-gate 			goto lcase;
3290Sstevel@tonic-gate 		}
3300Sstevel@tonic-gate 		(void) fprintf(file, "%s\n", original);
3310Sstevel@tonic-gate 		continue;
3320Sstevel@tonic-gate 
3330Sstevel@tonic-gate foundit:
3340Sstevel@tonic-gate 		if (pass == '1')
3350Sstevel@tonic-gate 			(void) fprintf(file, "%s-\n", original);
3360Sstevel@tonic-gate 		else if (affix[0] != 0 && affix[0] != '.') {
3370Sstevel@tonic-gate 			file = found;
3380Sstevel@tonic-gate 			(void) fprintf(file, "%s\t%s\n", affix,
3390Sstevel@tonic-gate 			    original);
3400Sstevel@tonic-gate 		}
3410Sstevel@tonic-gate 	}
3420Sstevel@tonic-gate }
3430Sstevel@tonic-gate 
3440Sstevel@tonic-gate /*
3450Sstevel@tonic-gate  *	strip exactly one suffix and do
3460Sstevel@tonic-gate  *	indicated routine(s), which may recursively
3470Sstevel@tonic-gate  *	strip suffixes
3480Sstevel@tonic-gate  */
3490Sstevel@tonic-gate 
3500Sstevel@tonic-gate static int
trysuff(char * ep,int lev)3510Sstevel@tonic-gate trysuff(char *ep, int lev)
3520Sstevel@tonic-gate {
353*239Sceastha 	struct suftab	*t;
354*239Sceastha 	char *cp, *sp;
3550Sstevel@tonic-gate 
3560Sstevel@tonic-gate 	lev += DLEV;
3570Sstevel@tonic-gate 	deriv[lev] = deriv[lev-1] = 0;
3580Sstevel@tonic-gate 	for (t = &suftab[0]; (sp = t->suf) != 0; t++) {
3590Sstevel@tonic-gate 		cp = ep;
3600Sstevel@tonic-gate 		while (*sp)
3610Sstevel@tonic-gate 			if (*--cp != *sp++)
3620Sstevel@tonic-gate 				goto next;
3630Sstevel@tonic-gate 		for (sp = cp; --sp >= word && !vowel(*sp); );
3640Sstevel@tonic-gate 		if (sp < word)
3650Sstevel@tonic-gate 			return (0);
3660Sstevel@tonic-gate 		if ((*t->p1)(ep-t->n1, t->d1, t->a1, lev+1))
3670Sstevel@tonic-gate 			return (1);
3680Sstevel@tonic-gate 		if (t->p2 != 0) {
3690Sstevel@tonic-gate 			deriv[lev] = deriv[lev+1] = 0;
3700Sstevel@tonic-gate 			return ((*t->p2)(ep-t->n2, t->d2, t->a2, lev));
3710Sstevel@tonic-gate 		}
3720Sstevel@tonic-gate 		return (0);
3730Sstevel@tonic-gate next:;
3740Sstevel@tonic-gate 	}
3750Sstevel@tonic-gate 	return (0);
3760Sstevel@tonic-gate }
3770Sstevel@tonic-gate 
/* Suffix routine that always fails; used for suffixes that must not strip. */
static int
nop(void)
{
	int rejected = 0;

	return (rejected);
}
3830Sstevel@tonic-gate 
/*
 * Accept the stem ending at ep if trypref() finds it (recording note a),
 * or else if a further suffix can be stripped by trysuff().
 * Returns 1 on success, 0 otherwise.  d is unused.
 */
/* ARGSUSED */
static int
strip(char *ep, char *d, char *a, int lev)
{
	if (trypref(ep, a, lev))
		return (1);
	return (trysuff(ep, lev) != 0);
}
3900Sstevel@tonic-gate 
3910Sstevel@tonic-gate static int
s(char * ep,char * d,char * a,int lev)3920Sstevel@tonic-gate s(char *ep, char *d, char *a, int lev)
3930Sstevel@tonic-gate {
3940Sstevel@tonic-gate 	if (lev > DLEV+1)
3950Sstevel@tonic-gate 		return (0);
3960Sstevel@tonic-gate 	if (*ep == 's' && ep[-1] == 's')
3970Sstevel@tonic-gate 		return (0);
3980Sstevel@tonic-gate 	return (strip(ep, d, a, lev));
3990Sstevel@tonic-gate }
4000Sstevel@tonic-gate 
4010Sstevel@tonic-gate /* ARGSUSED */
4020Sstevel@tonic-gate static int
an(char * ep,char * d,char * a,int lev)4030Sstevel@tonic-gate an(char *ep, char *d, char *a, int lev)
4040Sstevel@tonic-gate {
4050Sstevel@tonic-gate 	if (!isupper(*word))	/* must be proper name */
4060Sstevel@tonic-gate 		return (0);
4070Sstevel@tonic-gate 	return (trypref(ep, a, lev));
4080Sstevel@tonic-gate }
4090Sstevel@tonic-gate 
/*
 * Overwrite the character just before ep with 'e', then strip() with d
 * as the derivation note.  a is unused.
 */
/* ARGSUSED */
static int
ize(char *ep, char *d, char *a, int lev)
{
	char *last = ep - 1;

	*last = 'e';
	return (strip(ep, "", d, lev));
}
4170Sstevel@tonic-gate 
/*
 * Store an 'e' at ep and strip() the stem that now ends one character
 * later, with d as the derivation note.  a is unused.
 */
/* ARGSUSED */
static int
y_to_e(char *ep, char *d, char *a, int lev)
{
	ep[0] = 'e';
	return (strip(ep + 1, "", d, lev));
}
4250Sstevel@tonic-gate 
/*
 * Stems ending in 'i' are handed to i_to_y(); all others go straight
 * to strip().
 */
static int
ily(char *ep, char *d, char *a, int lev)
{
	return ((ep[-1] == 'i') ?
	    i_to_y(ep, d, a, lev) : strip(ep, d, a, lev));
}
4340Sstevel@tonic-gate 
/*
 * Store an 'l' at ep and let y_to_e() append the 'e' after it.
 */
static int
bility(char *ep, char *d, char *a, int lev)
{
	ep[0] = 'l';
	return (y_to_e(ep + 1, d, a, lev));
}
4410Sstevel@tonic-gate 
/*
 * If the stem ends in 'i', change that letter to 'y' and use note d;
 * otherwise leave the stem alone and use note a.  Either way the result
 * is handed to strip().
 */
static int
i_to_y(char *ep, char *d, char *a, int lev)
{
	char *note = a;

	if (ep[-1] == 'i') {
		ep[-1] = 'y';
		note = d;
	}
	return (strip(ep, "", note, lev));
}
4510Sstevel@tonic-gate 
4520Sstevel@tonic-gate static int
es(char * ep,char * d,char * a,int lev)4530Sstevel@tonic-gate es(char *ep, char *d, char *a, int lev)
4540Sstevel@tonic-gate {
4550Sstevel@tonic-gate 	if (lev > DLEV)
4560Sstevel@tonic-gate 		return (0);
4570Sstevel@tonic-gate 	switch (ep[-1]) {
4580Sstevel@tonic-gate 	default:
4590Sstevel@tonic-gate 		return (0);
4600Sstevel@tonic-gate 	case 'i':
4610Sstevel@tonic-gate 		return (i_to_y(ep, d, a, lev));
4620Sstevel@tonic-gate 	case 's':
4630Sstevel@tonic-gate 	case 'h':
4640Sstevel@tonic-gate 	case 'z':
4650Sstevel@tonic-gate 	case 'x':
4660Sstevel@tonic-gate 		return (strip(ep, d, a, lev));
4670Sstevel@tonic-gate 	}
4680Sstevel@tonic-gate }
4690Sstevel@tonic-gate 
4700Sstevel@tonic-gate /* ARGSUSED */
4710Sstevel@tonic-gate static int
subst(char * ep,char * d,char * a,int lev)4720Sstevel@tonic-gate subst(char *ep, char *d, char *a, int lev)
4730Sstevel@tonic-gate {
4740Sstevel@tonic-gate 	char *u, *t;
4750Sstevel@tonic-gate 
4760Sstevel@tonic-gate 	if (skipv(skipv(ep-1)) < word)
4770Sstevel@tonic-gate 		return (0);
4780Sstevel@tonic-gate 	for (t = d; *t != '+'; t++)
4790Sstevel@tonic-gate 		continue;
4800Sstevel@tonic-gate 	for (u = ep; *--t != '-'; )
4810Sstevel@tonic-gate 		*--u = *t;
4820Sstevel@tonic-gate 	return (strip(ep, "", d, lev));
4830Sstevel@tonic-gate }
4840Sstevel@tonic-gate 
4850Sstevel@tonic-gate 
/*
 * Dispatch on the character two places before ep: 'c' or 'r' looks the
 * stem up with trypref(), 'a' tries y_to_e(), anything else fails.
 */
static int
tion(char *ep, char *d, char *a, int lev)
{
	char key = ep[-2];

	if (key == 'c' || key == 'r')
		return (trypref(ep, a, lev));
	if (key == 'a')
		return (y_to_e(ep, d, a, lev));
	return (0);
}
4980Sstevel@tonic-gate 
/*
 *	possible consonant-consonant-e ending
 *
 *	Depending on the last two characters of the stem, either try the
 *	stem with an 'e' restored (y_to_e) or fall back to VCe().
 */
static int
CCe(char *ep, char *d, char *a, int lev)
{
	switch (ep[-1]) {
	case 'r':
		if (ep[-2] == 't')
			return (y_to_e(ep, d, a, lev));
		break;
	case 'l':
		if (!vowel(ep[-2]) && ep[-2] != 'l' && ep[-2] != 'r' &&
		    ep[-2] != 'w')
			return (y_to_e(ep, d, a, lev));
		break;
	case 's':
		if (ep[-2] == 's')
			break;
		/* FALLTHROUGH */
	case 'c':
	case 'g':
		if (*ep == 'a')
			return (0);
		/* FALLTHROUGH */
	case 'v':
	case 'z':
		if (vowel(ep[-2]))
			break;
		/* FALLTHROUGH */
	case 'u':
		if (y_to_e(ep, d, a, lev))
			return (1);
		/* only an "ng" stem gets a second chance through VCe() */
		if (!(ep[-2] == 'n' && ep[-1] == 'g'))
			return (0);
		break;
	}
	return (VCe(ep, d, a, lev));
}
5610Sstevel@tonic-gate 
/*
 *	possible consonant-vowel-consonant-e ending
 *
 *	A stem ending in 'e' fails outright.  When the stem ends in a
 *	vowel followed by a non-vowel, it is first tried with an 'e' added
 *	(note d); if that fails the overwritten character is put back and
 *	the bare stem is tried with strip().
 */
static int
VCe(char *ep, char *d, char *a, int lev)
{
	char last = ep[-1];
	char saved;

	if (last == 'e')
		return (0);
	if (!vowel(last) && vowel(ep[-2])) {
		saved = *ep;
		*ep = 'e';
		if (trypref(ep + 1, d, lev) || trysuff(ep + 1, lev))
			return (1);
		*ep = saved;
	}
	return (strip(ep, d, a, lev));
}
5800Sstevel@tonic-gate 
5810Sstevel@tonic-gate static char *
lookuppref(char ** wp,char * ep)5820Sstevel@tonic-gate lookuppref(char **wp, char *ep)
5830Sstevel@tonic-gate {
584*239Sceastha 	char **sp;
585*239Sceastha 	char *bp, *cp;
5860Sstevel@tonic-gate 
5870Sstevel@tonic-gate 	for (sp = preftab; *sp; sp++) {
5880Sstevel@tonic-gate 		bp = *wp;
5890Sstevel@tonic-gate 		for (cp = *sp; *cp; cp++, bp++)
5900Sstevel@tonic-gate 			if (Tolower(*bp) != *cp)
5910Sstevel@tonic-gate 				goto next;
5920Sstevel@tonic-gate 		for (cp = bp; cp < ep; cp++)
5930Sstevel@tonic-gate 			if (vowel(*cp)) {
5940Sstevel@tonic-gate 				*wp = bp;
5950Sstevel@tonic-gate 				return (*sp);
5960Sstevel@tonic-gate 			}
5970Sstevel@tonic-gate next:;
5980Sstevel@tonic-gate 	}
5990Sstevel@tonic-gate 	return (0);
6000Sstevel@tonic-gate }
6010Sstevel@tonic-gate 
6020Sstevel@tonic-gate /*
6030Sstevel@tonic-gate  *	while word is not in dictionary try stripping
6040Sstevel@tonic-gate  *	prefixes. Fail if no more prefixes.
6050Sstevel@tonic-gate  */
6060Sstevel@tonic-gate static int
trypref(char * ep,char * a,int lev)6070Sstevel@tonic-gate trypref(char *ep, char *a, int lev)
6080Sstevel@tonic-gate {
609*239Sceastha 	char *cp;
6100Sstevel@tonic-gate 	char *bp;
611*239Sceastha 	char *pp;
6120Sstevel@tonic-gate 	int val = 0;
6130Sstevel@tonic-gate 	char space[LINE_MAX * 2];
6140Sstevel@tonic-gate 	deriv[lev] = a;
6150Sstevel@tonic-gate 	if (tryword(word, ep, lev))
6160Sstevel@tonic-gate 		return (1);
6170Sstevel@tonic-gate 	bp = word;
6180Sstevel@tonic-gate 	pp = space;
6190Sstevel@tonic-gate 	deriv[lev+1] = pp;
6200Sstevel@tonic-gate 	while (cp = lookuppref(&bp, ep)) {
6210Sstevel@tonic-gate 		*pp++ = '+';
6220Sstevel@tonic-gate 		while (*pp = *cp++)
6230Sstevel@tonic-gate 			pp++;
6240Sstevel@tonic-gate 		if (tryword(bp, ep, lev+1)) {
6250Sstevel@tonic-gate 			val = 1;
6260Sstevel@tonic-gate 			break;
6270Sstevel@tonic-gate 		}
6280Sstevel@tonic-gate 	}
6290Sstevel@tonic-gate 	deriv[lev+1] = deriv[lev+2] = 0;
6300Sstevel@tonic-gate 	return (val);
6310Sstevel@tonic-gate }
6320Sstevel@tonic-gate 
6330Sstevel@tonic-gate static int
tryword(char * bp,char * ep,int lev)6340Sstevel@tonic-gate tryword(char *bp, char *ep, int lev)
6350Sstevel@tonic-gate {
636*239Sceastha 	int i, j;
6370Sstevel@tonic-gate 	char duple[3];
6380Sstevel@tonic-gate 	if (ep-bp <= 1)
6390Sstevel@tonic-gate 		return (0);
6400Sstevel@tonic-gate 	if (vowel(*ep)) {
6410Sstevel@tonic-gate 		if (monosyl(bp, ep))
6420Sstevel@tonic-gate 			return (0);
6430Sstevel@tonic-gate 	}
6440Sstevel@tonic-gate 	i = dict(bp, ep);
6450Sstevel@tonic-gate 	if (i == 0 && vowel(*ep) && ep[-1] == ep[-2] && monosyl(bp, ep-1)) {
6460Sstevel@tonic-gate 		ep--;
6470Sstevel@tonic-gate 		deriv[++lev] = duple;
6480Sstevel@tonic-gate 		duple[0] = '+';
6490Sstevel@tonic-gate 		duple[1] = *ep;
6500Sstevel@tonic-gate 		duple[2] = 0;
6510Sstevel@tonic-gate 		i = dict(bp, ep);
6520Sstevel@tonic-gate 	}
6530Sstevel@tonic-gate 	if (vflag == 0 || i == 0)
6540Sstevel@tonic-gate 		return (i);
6550Sstevel@tonic-gate 	/*
6560Sstevel@tonic-gate 	 *	when derivations are wanted, collect them
6570Sstevel@tonic-gate 	 *	for printing
6580Sstevel@tonic-gate 	 */
6590Sstevel@tonic-gate 	j = lev;
6600Sstevel@tonic-gate 	do {
6610Sstevel@tonic-gate 		if (deriv[j])
6620Sstevel@tonic-gate 			(void) strcat(affix, deriv[j]);
6630Sstevel@tonic-gate 	} while (--j > 0);
6640Sstevel@tonic-gate 	return (i);
6650Sstevel@tonic-gate }
6660Sstevel@tonic-gate 
6670Sstevel@tonic-gate 
/*
 * Return 1 when the text from bp up to ep has the shape
 * <non-vowels> <vowel> <non-vowel>, where the final character is neither
 * 'x' nor 'w'; return 0 otherwise, including for text shorter than two
 * characters.
 */
static int
monosyl(char *bp, char *ep)
{
	char *p;

	if (ep - bp < 2)
		return (0);
	if (vowel(ep[-1]) || !vowel(ep[-2]))
		return (0);
	if (ep[-1] == 'x' || ep[-1] == 'w')
		return (0);
	/* everything ahead of the final vowel must be a non-vowel */
	for (p = bp; p < ep - 2; p++) {
		if (vowel(*p))
			return (0);
	}
	return (1);
}
6800Sstevel@tonic-gate 
6810Sstevel@tonic-gate static char *
skipv(char * s)6820Sstevel@tonic-gate skipv(char *s)
6830Sstevel@tonic-gate {
6840Sstevel@tonic-gate 	if (s >= word&&vowel(*s))
6850Sstevel@tonic-gate 		s--;
6860Sstevel@tonic-gate 	while (s >= word && !vowel(*s))
6870Sstevel@tonic-gate 		s--;
6880Sstevel@tonic-gate 	return (s);
6890Sstevel@tonic-gate }
6900Sstevel@tonic-gate 
/*
 * Return 1 if c is one of a, e, i, o, u or y in either case, else 0.
 */
static int
vowel(int c)
{
	int lc = isupper(c) ? tolower(c) : c;

	if (lc == 'a' || lc == 'e' || lc == 'i' ||
	    lc == 'o' || lc == 'u' || lc == 'y')
		return (1);
	return (0);
}
7050Sstevel@tonic-gate 
7060Sstevel@tonic-gate /* crummy way to Britishise */
7070Sstevel@tonic-gate static void
ise(void)7080Sstevel@tonic-gate ise(void)
7090Sstevel@tonic-gate {
710*239Sceastha 	struct suftab *p;
7110Sstevel@tonic-gate 
7120Sstevel@tonic-gate 	for (p = suftab; p->suf; p++) {
7130Sstevel@tonic-gate 		ztos(p->suf);
7140Sstevel@tonic-gate 		ztos(p->d1);
7150Sstevel@tonic-gate 		ztos(p->a1);
7160Sstevel@tonic-gate 	}
7170Sstevel@tonic-gate }
7180Sstevel@tonic-gate 
/*
 * Replace every 'z' in the writable, NUL-terminated string s with 's',
 * in place.
 */
static void
ztos(char *s)
{
	char *p = s;

	while (*p != '\0') {
		if (*p == 'z')
			*p = 's';
		p++;
	}
}
7260Sstevel@tonic-gate 
7270Sstevel@tonic-gate static int
dict(char * bp,char * ep)7280Sstevel@tonic-gate dict(char *bp, char *ep)
7290Sstevel@tonic-gate {
730*239Sceastha 	int temp, result;
7310Sstevel@tonic-gate 	if (xflag)
7320Sstevel@tonic-gate 		(void) fprintf(stdout, "=%.*s\n", ep-bp, bp);
7330Sstevel@tonic-gate 	temp = *ep;
7340Sstevel@tonic-gate 	*ep = 0;
7350Sstevel@tonic-gate 	result = hashlook(bp);
7360Sstevel@tonic-gate 	*ep = temp;
7370Sstevel@tonic-gate 	return (result);
7380Sstevel@tonic-gate }
739