13e12c5d1SDavid du Colombier #include <u.h> 23e12c5d1SDavid du Colombier #include <libc.h> 33e12c5d1SDavid du Colombier #include <bio.h> 43e12c5d1SDavid du Colombier #include <ctype.h> 53e12c5d1SDavid du Colombier #include "code.h" 63e12c5d1SDavid du Colombier 7*219b2ee8SDavid du Colombier /* fig leaves for possibly signed char quantities */ 8*219b2ee8SDavid du Colombier #define ISUPPER(c) isupper((c)&0xff) 9*219b2ee8SDavid du Colombier #define ISLOWER(c) islower((c)&0xff) 10*219b2ee8SDavid du Colombier #define ISALPHA(c) isalpha((c)&0xff) 11*219b2ee8SDavid du Colombier #define ISDIGIT(c) isdigit((c)&0xff) 12*219b2ee8SDavid du Colombier #define ISVOWEL(c) voweltab[(c)&0xff] 13*219b2ee8SDavid du Colombier #define Tolower(c) (ISUPPER(c)? (c)-'A'+'a': (c)) 143e12c5d1SDavid du Colombier #define pair(a,b) (((a)<<8) | (b)) 153e12c5d1SDavid du Colombier #define DLEV 2 16*219b2ee8SDavid du Colombier #define DSIZ 40 173e12c5d1SDavid du Colombier 183e12c5d1SDavid du Colombier typedef long Bits; 193e12c5d1SDavid du Colombier #define Set(h, f) ((long)(h) & (f)) 203e12c5d1SDavid du Colombier 213e12c5d1SDavid du Colombier Bits nop(char*, char*, char*, int, int); 223e12c5d1SDavid du Colombier Bits strip(char*, char*, char*, int, int); 233e12c5d1SDavid du Colombier Bits ize(char*, char*, char*, int, int); 243e12c5d1SDavid du Colombier Bits i_to_y(char*, char*, char*, int, int); 253e12c5d1SDavid du Colombier Bits ily(char*, char*, char*, int, int); 263e12c5d1SDavid du Colombier Bits subst(char*, char*, char*, int, int); 273e12c5d1SDavid du Colombier Bits CCe(char*, char*, char*, int, int); 283e12c5d1SDavid du Colombier Bits tion(char*, char*, char*, int, int); 293e12c5d1SDavid du Colombier Bits an(char*, char*, char*, int, int); 303e12c5d1SDavid du Colombier Bits s(char*, char*, char*, int, int); 313e12c5d1SDavid du Colombier Bits es(char*, char*, char*, int, int); 323e12c5d1SDavid du Colombier Bits bility(char*, char*, char*, int, int); 333e12c5d1SDavid du Colombier Bits y_to_e(char*, char*, char*, int, int); 343e12c5d1SDavid du Colombier Bits VCe(char*, char*, char*, int, int); 353e12c5d1SDavid du Colombier 363e12c5d1SDavid du Colombier Bits trypref(char*, char*, int, int); 373e12c5d1SDavid du Colombier Bits tryword(char*, char*, int, int); 383e12c5d1SDavid du Colombier Bits trysuff(char*, int, int); 393e12c5d1SDavid du Colombier Bits dict(char*, char*); 403e12c5d1SDavid du Colombier void typeprint(Bits); 413e12c5d1SDavid du Colombier void pcomma(char*); 423e12c5d1SDavid du Colombier 433e12c5d1SDavid du Colombier void ise(void); 443e12c5d1SDavid du Colombier int ordinal(void); 453e12c5d1SDavid du Colombier char* skipv(char*); 463e12c5d1SDavid du Colombier int inun(char*, Bits); 473e12c5d1SDavid du Colombier char* ztos(char*); 483e12c5d1SDavid du Colombier void readdict(char*); 493e12c5d1SDavid du Colombier 503e12c5d1SDavid du Colombier typedef struct Ptab Ptab; 513e12c5d1SDavid du Colombier struct Ptab 523e12c5d1SDavid du Colombier { 533e12c5d1SDavid du Colombier char* s; 543e12c5d1SDavid du Colombier int flag; 553e12c5d1SDavid du Colombier }; 563e12c5d1SDavid du Colombier 573e12c5d1SDavid du Colombier typedef struct Suftab Suftab; 583e12c5d1SDavid du Colombier struct Suftab 593e12c5d1SDavid du Colombier { 603e12c5d1SDavid du Colombier char *suf; 613e12c5d1SDavid du Colombier Bits (*p1)(char*, char*, char*, int, int); 623e12c5d1SDavid du Colombier int n1; 633e12c5d1SDavid du Colombier char *d1; 643e12c5d1SDavid du Colombier char *a1; 653e12c5d1SDavid du Colombier int flag; 663e12c5d1SDavid du Colombier int affixable; 673e12c5d1SDavid du Colombier Bits (*p2)(char*, char*, char*, int, int); 683e12c5d1SDavid du Colombier int n2; 693e12c5d1SDavid du Colombier char *d2; 703e12c5d1SDavid du Colombier char *a2; 713e12c5d1SDavid du Colombier }; 723e12c5d1SDavid du Colombier 73*219b2ee8SDavid du Colombier Suftab staba[] = { 74*219b2ee8SDavid du Colombier {"aibohp",subst,1,"-e+ia","",NOUN, NOUN}, 75*219b2ee8SDavid du Colombier 0 76*219b2ee8SDavid du Colombier }; 77*219b2ee8SDavid du Colombier 783e12c5d1SDavid du Colombier Suftab stabc[] = 793e12c5d1SDavid du Colombier { 80*219b2ee8SDavid du Colombier {"cai",strip,1,"","+c",N_AFFIX, ADJ|NOUN}, 813e12c5d1SDavid du Colombier {"citsi",strip,2,"","+ic",N_AFFIX, ADJ | N_AFFIX | NOUN}, 823e12c5d1SDavid du Colombier {"citi",ize,1,"-e+ic","",N_AFFIX, ADJ }, 833e12c5d1SDavid du Colombier {"cihparg",i_to_y,1,"-y+ic","",NOUN, ADJ|NOUN }, 843e12c5d1SDavid du Colombier {"cipocs",ize,1,"-e+ic","",NOUN, ADJ }, 853e12c5d1SDavid du Colombier {"cirtem",i_to_y,1,"-y+ic","",NOUN, ADJ }, 863e12c5d1SDavid du Colombier {"cigol",i_to_y,1,"-y+ic","",NOUN, ADJ }, 873e12c5d1SDavid du Colombier {"cimono",i_to_y,1,"-y+ic","",NOUN, ADJ }, 88*219b2ee8SDavid du Colombier {"cibohp",subst,1,"-e+ic","",NOUN, ADJ }, 893e12c5d1SDavid du Colombier 0 903e12c5d1SDavid du Colombier }; 913e12c5d1SDavid du Colombier Suftab stabd[] = 923e12c5d1SDavid du Colombier { 93*219b2ee8SDavid du Colombier {"de",strip,1,"","+d",ED,ADJ |COMP,i_to_y,2,"-y+ied","+ed"}, 943e12c5d1SDavid du Colombier {"dooh",ily,4,"-y+ihood","+hood",NOUN | ADV, NOUN}, 953e12c5d1SDavid du Colombier 0 963e12c5d1SDavid du Colombier }; 973e12c5d1SDavid du Colombier Suftab stabe[] = 983e12c5d1SDavid du Colombier { 993e12c5d1SDavid du Colombier /* 1003e12c5d1SDavid du Colombier * V_affix for comment ->commence->commentment?? 1013e12c5d1SDavid du Colombier */ 102*219b2ee8SDavid du Colombier {"ecna",subst,1,"-t+ce","",ADJ,N_AFFIX|_Y|NOUN|VERB|ACTOR|V_AFFIX}, 103*219b2ee8SDavid du Colombier {"ecne",subst,1,"-t+ce","",ADJ,N_AFFIX|_Y|NOUN|VERB|ACTOR|V_AFFIX}, 1043e12c5d1SDavid du Colombier {"elbaif",i_to_y,4,"-y+iable","",V_IRREG,ADJ}, 1053e12c5d1SDavid du Colombier {"elba",CCe,4,"-e+able","+able",V_AFFIX,ADJ}, 1063e12c5d1SDavid du Colombier {"evi",subst,0,"-ion+ive","",N_AFFIX | V_AFFIX,NOUN | N_AFFIX| ADJ}, 1073e12c5d1SDavid du Colombier {"ezi",CCe,3,"-e+ize","+ize",N_AFFIX|ADJ ,V_AFFIX | VERB |ION | COMP}, 1083e12c5d1SDavid du Colombier {"ekil",strip,4,"","+like",N_AFFIX ,ADJ}, 1093e12c5d1SDavid du Colombier 0 1103e12c5d1SDavid du Colombier }; 1113e12c5d1SDavid du Colombier Suftab stabg[] = 1123e12c5d1SDavid du Colombier { 113*219b2ee8SDavid du Colombier {"gniee",strip,3,"","+ing",V_IRREG ,ADJ|NOUN}, 114*219b2ee8SDavid du Colombier {"gnikam",strip,6,"","+making",NOUN,NOUN}, 115*219b2ee8SDavid du Colombier {"gnipeek",strip,7,"","+keeping",NOUN,NOUN}, 1163e12c5d1SDavid du Colombier {"gni",CCe,3,"-e+ing","+ing",V_IRREG ,ADJ|ED|NOUN}, 1173e12c5d1SDavid du Colombier 0 1183e12c5d1SDavid du Colombier }; 1193e12c5d1SDavid du Colombier Suftab stabl[] = 1203e12c5d1SDavid du Colombier { 121*219b2ee8SDavid du Colombier {"ladio",strip,2,"","+al",NOUN |ADJ,ADJ}, 1223e12c5d1SDavid du Colombier {"laci",strip,2,"","+al",NOUN |ADJ,ADJ |NOUN|N_AFFIX}, 1233e12c5d1SDavid du Colombier {"latnem",strip,2,"","+al",N_AFFIX,ADJ}, 1243e12c5d1SDavid du Colombier {"lanoi",strip,2,"","+al",N_AFFIX,ADJ|NOUN}, 1253e12c5d1SDavid du Colombier {"luf",ily,3,"-y+iful","+ful",N_AFFIX,ADJ | NOUN}, 1263e12c5d1SDavid du Colombier 0 1273e12c5d1SDavid du Colombier }; 1283e12c5d1SDavid du Colombier Suftab stabm[] = 1293e12c5d1SDavid du Colombier { 1303e12c5d1SDavid du Colombier /* congregational + ism */ 1313e12c5d1SDavid du Colombier {"msi",CCe,3,"-e+ism","ism",N_AFFIX|ADJ,NOUN}, 1323e12c5d1SDavid du Colombier {"margo",subst,-1,"-ph+m","",NOUN,NOUN}, 1333e12c5d1SDavid du Colombier 0 1343e12c5d1SDavid du Colombier }; 1353e12c5d1SDavid du Colombier Suftab stabn[] = 1363e12c5d1SDavid du Colombier { 1373e12c5d1SDavid du Colombier {"noitacifi",i_to_y,6,"-y+ication","",ION,NOUN | N_AFFIX}, 1383e12c5d1SDavid du Colombier {"noitazi",ize,4,"-e+ation","",ION,NOUN| N_AFFIX}, 1393e12c5d1SDavid du Colombier {"noit",tion,3,"-e+ion","+ion",ION,NOUN| N_AFFIX | V_AFFIX |VERB|ACTOR}, 1403e12c5d1SDavid du Colombier {"naino",an,3,"","+ian",NOUN|PROP_COLLECT,NOUN| N_AFFIX}, 1413e12c5d1SDavid du Colombier {"namow",strip,5,"","+woman",MAN,PROP_COLLECT|N_AFFIX}, 1423e12c5d1SDavid du Colombier {"nam",strip,3,"","+man",MAN,PROP_COLLECT | N_AFFIX | VERB}, 1433e12c5d1SDavid du Colombier {"na",an,1,"","+n",NOUN|PROP_COLLECT,NOUN | N_AFFIX}, 1443e12c5d1SDavid du Colombier {"nemow",strip,5,"","+women",MAN,PROP_COLLECT}, 1453e12c5d1SDavid du Colombier {"nem",strip,3,"","+man",MAN,PROP_COLLECT}, 146*219b2ee8SDavid du Colombier {"nosrep",strip,6,"","+person",MAN,PROP_COLLECT}, 1473e12c5d1SDavid du Colombier 0 1483e12c5d1SDavid du Colombier }; 1493e12c5d1SDavid du Colombier Suftab stabp[] = 1503e12c5d1SDavid du Colombier { 1513e12c5d1SDavid du Colombier {"pihs",strip,4,"","+ship",NOUN|PROP_COLLECT,NOUN| N_AFFIX}, 1523e12c5d1SDavid du Colombier 0 1533e12c5d1SDavid du Colombier }; 1543e12c5d1SDavid du Colombier Suftab stabr[] = 1553e12c5d1SDavid du Colombier { 1563e12c5d1SDavid du Colombier {"rehparg",subst,1,"-y+er","",ACTOR,NOUN,strip,2,"","+er"}, 1573e12c5d1SDavid du Colombier {"reyhparg",nop,0,"","",0,NOUN}, 158*219b2ee8SDavid du Colombier {"reyl",nop,0,"","",0,NOUN}, 159*219b2ee8SDavid du Colombier {"rekam",strip,5,"","+maker",NOUN,NOUN}, 160*219b2ee8SDavid du Colombier {"repeek",strip,6,"","+keeper",NOUN,NOUN}, 1613e12c5d1SDavid du Colombier {"re",strip,1,"","+r",ACTOR,NOUN | N_AFFIX|VERB|ADJ, i_to_y,2,"-y+ier","+er"}, 1623e12c5d1SDavid du Colombier {"rota",tion,2,"-e+or","",ION,NOUN| N_AFFIX|_Y}, 1633e12c5d1SDavid du Colombier {"rotc",tion,2,"","+or",ION,NOUN| N_AFFIX}, 1643e12c5d1SDavid du Colombier {"rotp",tion,2,"","+or",ION,NOUN| N_AFFIX}, 1653e12c5d1SDavid du Colombier 0 1663e12c5d1SDavid du Colombier }; 1673e12c5d1SDavid du Colombier Suftab stabs[] = 1683e12c5d1SDavid du Colombier { 1693e12c5d1SDavid du Colombier {"ssen",ily,4,"-y+iness","+ness",ADJ|ADV,NOUN| N_AFFIX}, 170*219b2ee8SDavid du Colombier {"ssel",ily,4,"-y+iless","+less",NOUN | PROP_COLLECT,ADJ }, 1713e12c5d1SDavid du Colombier {"se",s,1,"","+s",NOUN | V_IRREG,DONT_TOUCH , es,2,"-y+ies","+es"}, 1723e12c5d1SDavid du Colombier {"s'",s,2,"","+'s",PROP_COLLECT | NOUN,DONT_TOUCH }, 1733e12c5d1SDavid du Colombier {"s",s,1,"","+s",NOUN | V_IRREG,DONT_TOUCH }, 1743e12c5d1SDavid du Colombier 0 1753e12c5d1SDavid du Colombier }; 1763e12c5d1SDavid du Colombier Suftab stabt[] = 1773e12c5d1SDavid du Colombier { 1783e12c5d1SDavid du Colombier {"tnem",strip,4,"","+ment",V_AFFIX,NOUN | N_AFFIX | ADJ|VERB}, 1793e12c5d1SDavid du Colombier {"tse",strip,2,"","+st",EST,DONT_TOUCH, i_to_y,3,"-y+iest","+est" }, 1803e12c5d1SDavid du Colombier {"tsigol",i_to_y,2,"-y+ist","",N_AFFIX,NOUN | N_AFFIX}, 1813e12c5d1SDavid du Colombier {"tsi",CCe,3,"-e+ist","+ist",N_AFFIX|ADJ,NOUN | N_AFFIX|COMP}, 1823e12c5d1SDavid du Colombier 0 1833e12c5d1SDavid du Colombier }; 1843e12c5d1SDavid du Colombier Suftab staby[] = 1853e12c5d1SDavid du Colombier { 186*219b2ee8SDavid du Colombier {"ycna",subst,1,"-t+cy","",ADJ | N_AFFIX,NOUN | N_AFFIX}, 187*219b2ee8SDavid du Colombier {"ycne",subst,1,"-t+cy","",ADJ | N_AFFIX,NOUN | N_AFFIX}, 1883e12c5d1SDavid du Colombier {"ytilib",bility,5,"-le+ility","",ADJ | V_AFFIX,NOUN | N_AFFIX}, 1893e12c5d1SDavid du Colombier {"ytisuo",nop,0,"","",NOUN}, 190*219b2ee8SDavid du Colombier {"ytilb",nop,0,"","",0,NOUN}, 1913e12c5d1SDavid du Colombier {"yti",CCe,3,"-e+ity","+ity",ADJ ,NOUN | N_AFFIX }, 1923e12c5d1SDavid du Colombier {"ylb",y_to_e,1,"-e+y","",ADJ,ADV}, 1933e12c5d1SDavid du Colombier {"ylc",nop,0,"","",0}, 194*219b2ee8SDavid du Colombier {"ylelb",nop,0,"","",0}, 195*219b2ee8SDavid du Colombier {"ylelp",nop,0,"","",0}, 1963e12c5d1SDavid du Colombier {"yl",ily,2,"-y+ily","+ly",ADJ,ADV|COMP}, 1973e12c5d1SDavid du Colombier {"yrtem",subst,0,"-er+ry","",NOUN,NOUN | N_AFFIX}, 1983e12c5d1SDavid du Colombier {"y",CCe,1,"-e+y","+y",_Y,ADJ|COMP}, 1993e12c5d1SDavid du Colombier 0 2003e12c5d1SDavid du Colombier }; 2013e12c5d1SDavid du Colombier Suftab stabz[] = 2023e12c5d1SDavid du Colombier { 2033e12c5d1SDavid du Colombier 0 2043e12c5d1SDavid du Colombier }; 2053e12c5d1SDavid du Colombier Suftab* suftab[] = 2063e12c5d1SDavid du Colombier { 207*219b2ee8SDavid du Colombier staba, 2083e12c5d1SDavid du Colombier stabz, 2093e12c5d1SDavid du Colombier stabc, 2103e12c5d1SDavid du Colombier stabd, 2113e12c5d1SDavid du Colombier stabe, 2123e12c5d1SDavid du Colombier stabz, 2133e12c5d1SDavid du Colombier stabg, 2143e12c5d1SDavid du Colombier stabz, 2153e12c5d1SDavid du Colombier stabz, 2163e12c5d1SDavid du Colombier stabz, 2173e12c5d1SDavid du Colombier stabz, 2183e12c5d1SDavid du Colombier stabl, 2193e12c5d1SDavid du Colombier stabm, 2203e12c5d1SDavid du Colombier stabn, 2213e12c5d1SDavid du Colombier stabz, 2223e12c5d1SDavid du Colombier stabp, 2233e12c5d1SDavid du Colombier stabz, 2243e12c5d1SDavid du Colombier stabr, 2253e12c5d1SDavid du Colombier stabs, 2263e12c5d1SDavid du Colombier stabt, 2273e12c5d1SDavid du Colombier stabz, 2283e12c5d1SDavid du Colombier stabz, 2293e12c5d1SDavid du Colombier stabz, 2303e12c5d1SDavid du Colombier stabz, 2313e12c5d1SDavid du Colombier staby, 2323e12c5d1SDavid du Colombier stabz, 2333e12c5d1SDavid du Colombier }; 2343e12c5d1SDavid du Colombier 2353e12c5d1SDavid du Colombier Ptab ptaba[] = 2363e12c5d1SDavid du Colombier { 2373e12c5d1SDavid du Colombier "anti", 0, 2383e12c5d1SDavid du Colombier "auto", 0, 2393e12c5d1SDavid du Colombier 0 2403e12c5d1SDavid du Colombier }; 2413e12c5d1SDavid du Colombier Ptab ptabb[] = 2423e12c5d1SDavid du Colombier { 2433e12c5d1SDavid du Colombier "bio", 0, 2443e12c5d1SDavid du Colombier 0 2453e12c5d1SDavid du Colombier }; 2463e12c5d1SDavid du Colombier Ptab ptabc[] = 2473e12c5d1SDavid du Colombier { 2483e12c5d1SDavid du Colombier "counter", 0, 2493e12c5d1SDavid du Colombier 0 2503e12c5d1SDavid du Colombier }; 2513e12c5d1SDavid du Colombier Ptab ptabd[] = 2523e12c5d1SDavid du Colombier { 2533e12c5d1SDavid du Colombier "dis", 0, 2543e12c5d1SDavid du Colombier 0 2553e12c5d1SDavid du Colombier }; 2563e12c5d1SDavid du Colombier Ptab ptabe[] = 2573e12c5d1SDavid du Colombier { 2583e12c5d1SDavid du Colombier "electro", 0, 2593e12c5d1SDavid du Colombier 0 2603e12c5d1SDavid du Colombier }; 2613e12c5d1SDavid du Colombier Ptab ptabf[] = 2623e12c5d1SDavid du Colombier { 2633e12c5d1SDavid du Colombier "femto", 0, 2643e12c5d1SDavid du Colombier 0 2653e12c5d1SDavid du Colombier }; 2663e12c5d1SDavid du Colombier Ptab ptabg[] = 2673e12c5d1SDavid du Colombier { 2683e12c5d1SDavid du Colombier "geo", 0, 2693e12c5d1SDavid du Colombier "giga", 0, 2703e12c5d1SDavid du Colombier 0 2713e12c5d1SDavid du Colombier }; 2723e12c5d1SDavid du Colombier Ptab ptabh[] = 2733e12c5d1SDavid du Colombier { 2743e12c5d1SDavid du Colombier "hyper", 0, 2753e12c5d1SDavid du Colombier 0 2763e12c5d1SDavid du Colombier }; 2773e12c5d1SDavid du Colombier Ptab ptabi[] = 2783e12c5d1SDavid du Colombier { 279*219b2ee8SDavid du Colombier "immuno", 0, 2803e12c5d1SDavid du Colombier "im", IN, 2813e12c5d1SDavid du Colombier "intra", 0, 2823e12c5d1SDavid du Colombier "inter", 0, 2833e12c5d1SDavid du Colombier "in", IN, 2843e12c5d1SDavid du Colombier "ir", IN, 2853e12c5d1SDavid du Colombier "iso", 0, 2863e12c5d1SDavid du Colombier 0 2873e12c5d1SDavid du Colombier }; 2883e12c5d1SDavid du Colombier Ptab ptabj[] = 2893e12c5d1SDavid du Colombier { 2903e12c5d1SDavid du Colombier 0 2913e12c5d1SDavid du Colombier }; 2923e12c5d1SDavid du Colombier Ptab ptabk[] = 2933e12c5d1SDavid du Colombier { 2943e12c5d1SDavid du Colombier "kilo", 0, 2953e12c5d1SDavid du Colombier 0 2963e12c5d1SDavid du Colombier }; 2973e12c5d1SDavid du Colombier Ptab ptabl[] = 2983e12c5d1SDavid du Colombier { 2993e12c5d1SDavid du Colombier 0 3003e12c5d1SDavid du Colombier }; 3013e12c5d1SDavid du Colombier Ptab ptabm[] = 3023e12c5d1SDavid du Colombier { 3033e12c5d1SDavid du Colombier "magneto", 0, 3043e12c5d1SDavid du Colombier "mega", 0, 3053e12c5d1SDavid du Colombier "meta", 0, 3063e12c5d1SDavid du Colombier "micro", 0, 3073e12c5d1SDavid du Colombier "mid", 0, 3083e12c5d1SDavid du Colombier "milli", 0, 309*219b2ee8SDavid du Colombier "mini", 0, 3103e12c5d1SDavid du Colombier "mis", 0, 3113e12c5d1SDavid du Colombier "mono", 0, 3123e12c5d1SDavid du Colombier "multi", 0, 3133e12c5d1SDavid du Colombier 0 3143e12c5d1SDavid du Colombier }; 3153e12c5d1SDavid du Colombier Ptab ptabn[] = 3163e12c5d1SDavid du Colombier { 3173e12c5d1SDavid du Colombier "nano", 0, 318*219b2ee8SDavid du Colombier "neuro", 0, 3193e12c5d1SDavid du Colombier "non", 0, 3203e12c5d1SDavid du Colombier 0 3213e12c5d1SDavid du Colombier }; 3223e12c5d1SDavid du Colombier Ptab ptabo[] = 3233e12c5d1SDavid du Colombier { 3243e12c5d1SDavid du Colombier "out", 0, 3253e12c5d1SDavid du Colombier "over", 0, 3263e12c5d1SDavid du Colombier 0 3273e12c5d1SDavid du Colombier }; 3283e12c5d1SDavid du Colombier Ptab ptabp[] = 3293e12c5d1SDavid du Colombier { 3303e12c5d1SDavid du Colombier "para", 0, 3313e12c5d1SDavid du Colombier "photo", 0, 3323e12c5d1SDavid du Colombier "pico", 0, 3333e12c5d1SDavid du Colombier "poly", 0, 3343e12c5d1SDavid du Colombier "pre", 0, 3353e12c5d1SDavid du Colombier "pseudo", 0, 3363e12c5d1SDavid du Colombier "psycho", 0, 3373e12c5d1SDavid du Colombier 0 3383e12c5d1SDavid du Colombier }; 3393e12c5d1SDavid du Colombier Ptab ptabq[] = 3403e12c5d1SDavid du Colombier { 3413e12c5d1SDavid du Colombier "quasi", 0, 3423e12c5d1SDavid du Colombier 0 3433e12c5d1SDavid du Colombier }; 3443e12c5d1SDavid du Colombier Ptab ptabr[] = 3453e12c5d1SDavid du Colombier { 346*219b2ee8SDavid du Colombier "radio", 0, 3473e12c5d1SDavid du Colombier "re", 0, 3483e12c5d1SDavid du Colombier 0 3493e12c5d1SDavid du Colombier }; 3503e12c5d1SDavid du Colombier Ptab ptabs[] = 3513e12c5d1SDavid du Colombier { 3523e12c5d1SDavid du Colombier "semi", 0, 3533e12c5d1SDavid du Colombier "stereo", 0, 3543e12c5d1SDavid du Colombier "sub", 0, 3553e12c5d1SDavid du Colombier "super", 0, 3563e12c5d1SDavid du Colombier 0 3573e12c5d1SDavid du Colombier }; 3583e12c5d1SDavid du Colombier Ptab ptabt[] = 3593e12c5d1SDavid du Colombier { 3603e12c5d1SDavid du Colombier "tele", 0, 361*219b2ee8SDavid du Colombier "tera", 0, 3623e12c5d1SDavid du Colombier "thermo", 0, 3633e12c5d1SDavid du Colombier 0 3643e12c5d1SDavid du Colombier }; 3653e12c5d1SDavid du Colombier Ptab ptabu[] = 3663e12c5d1SDavid du Colombier { 3673e12c5d1SDavid du Colombier "ultra", 0, 3683e12c5d1SDavid du Colombier "under", 0, /*must precede un*/ 3693e12c5d1SDavid du Colombier "un", IN, 3703e12c5d1SDavid du Colombier 0 3713e12c5d1SDavid du Colombier }; 3723e12c5d1SDavid du Colombier Ptab ptabv[] = 3733e12c5d1SDavid du Colombier { 3743e12c5d1SDavid du Colombier 0 3753e12c5d1SDavid du Colombier }; 3763e12c5d1SDavid du Colombier Ptab ptabw[] = 3773e12c5d1SDavid du Colombier { 3783e12c5d1SDavid du Colombier 0 3793e12c5d1SDavid du Colombier }; 3803e12c5d1SDavid du Colombier Ptab ptabx[] = 3813e12c5d1SDavid du Colombier { 3823e12c5d1SDavid du Colombier 0 3833e12c5d1SDavid du Colombier }; 3843e12c5d1SDavid du Colombier Ptab ptaby[] = 3853e12c5d1SDavid du Colombier { 3863e12c5d1SDavid du Colombier 0 3873e12c5d1SDavid du Colombier }; 3883e12c5d1SDavid du Colombier Ptab ptabz[] = 3893e12c5d1SDavid du Colombier { 3903e12c5d1SDavid du Colombier 0 3913e12c5d1SDavid du Colombier }; 3923e12c5d1SDavid du Colombier 3933e12c5d1SDavid du Colombier Ptab* preftab[] = 3943e12c5d1SDavid du Colombier { 3953e12c5d1SDavid du Colombier ptaba, 3963e12c5d1SDavid du Colombier ptabb, 3973e12c5d1SDavid du Colombier ptabc, 3983e12c5d1SDavid du Colombier ptabd, 3993e12c5d1SDavid du Colombier ptabe, 4003e12c5d1SDavid du Colombier ptabf, 4013e12c5d1SDavid du Colombier ptabg, 4023e12c5d1SDavid du Colombier ptabh, 4033e12c5d1SDavid du Colombier ptabi, 4043e12c5d1SDavid du Colombier ptabj, 4053e12c5d1SDavid du Colombier ptabk, 4063e12c5d1SDavid du Colombier ptabl, 4073e12c5d1SDavid du Colombier ptabm, 4083e12c5d1SDavid du Colombier ptabn, 4093e12c5d1SDavid du Colombier ptabo, 4103e12c5d1SDavid du Colombier ptabp, 4113e12c5d1SDavid du Colombier ptabq, 4123e12c5d1SDavid du Colombier ptabr, 4133e12c5d1SDavid du Colombier ptabs, 4143e12c5d1SDavid du Colombier ptabt, 4153e12c5d1SDavid du Colombier ptabu, 4163e12c5d1SDavid du Colombier ptabv, 4173e12c5d1SDavid du Colombier ptabw, 4183e12c5d1SDavid du Colombier ptabx, 4193e12c5d1SDavid du Colombier ptaby, 4203e12c5d1SDavid du Colombier ptabz, 4213e12c5d1SDavid du Colombier }; 4223e12c5d1SDavid du Colombier 423*219b2ee8SDavid du Colombier typedef struct { 424*219b2ee8SDavid du Colombier char *mesg; 425*219b2ee8SDavid du Colombier enum { NONE, SUFF, PREF} type; 426*219b2ee8SDavid du Colombier } Deriv; 427*219b2ee8SDavid du Colombier 428*219b2ee8SDavid du Colombier int aflag; 4293e12c5d1SDavid du Colombier int cflag; 430*219b2ee8SDavid du Colombier int fflag; 4313e12c5d1SDavid du Colombier int vflag; 4323e12c5d1SDavid du Colombier int xflag; 433*219b2ee8SDavid du Colombier int nflag; 434*219b2ee8SDavid du Colombier char word[500]; 4353e12c5d1SDavid du Colombier char* original; 436*219b2ee8SDavid du Colombier Deriv emptyderiv; 437*219b2ee8SDavid du Colombier Deriv deriv[DSIZ+3]; 438*219b2ee8SDavid du Colombier char affix[DSIZ*10]; /* 10 is longest affix message */ 439*219b2ee8SDavid du Colombier int prefcount; 440*219b2ee8SDavid du Colombier int suffcount; 441*219b2ee8SDavid du Colombier char* acmeid; 4423e12c5d1SDavid du Colombier char space[300000]; /* must be as large as "words"+"space" in pcode run */ 4433e12c5d1SDavid du Colombier Bits encode[2048]; /* must be as long as "codes" in pcode run */ 4443e12c5d1SDavid du Colombier int nencode; 445*219b2ee8SDavid du Colombier char voweltab[256]; 4463e12c5d1SDavid du Colombier char* spacep[128*128+1]; /* pointer to words starting with 'xx' */ 4473e12c5d1SDavid du Colombier Biobuf bin; 448*219b2ee8SDavid du Colombier Biobuf bout; 4493e12c5d1SDavid du Colombier 4503e12c5d1SDavid du Colombier char* codefile = "/sys/lib/amspell"; 4513e12c5d1SDavid du Colombier char* brfile = "/sys/lib/brspell"; 4523e12c5d1SDavid du Colombier char* Usage = "usage"; 4533e12c5d1SDavid du Colombier 4543e12c5d1SDavid du Colombier void 4553e12c5d1SDavid du Colombier main(int argc, char *argv[]) 4563e12c5d1SDavid du Colombier { 4573e12c5d1SDavid du Colombier char *ep, *cp; 4583e12c5d1SDavid du Colombier char *dp; 4593e12c5d1SDavid du Colombier int j, i, c; 4603e12c5d1SDavid du Colombier int low; 4613e12c5d1SDavid du Colombier Bits h; 4623e12c5d1SDavid du Colombier 4633e12c5d1SDavid du Colombier Binit(&bin, 0, OREAD); 464*219b2ee8SDavid du Colombier Binit(&bout, 1, OWRITE); 4653e12c5d1SDavid du Colombier for(i=0; c = "aeiouyAEIOUY"[i]; i++) 4663e12c5d1SDavid du Colombier voweltab[c] = 1; 4673e12c5d1SDavid du Colombier while(argc > 1) { 4683e12c5d1SDavid du Colombier if(argv[1][0] != '-') 4693e12c5d1SDavid du Colombier break; 4703e12c5d1SDavid du Colombier for(i=1; c = argv[1][i]; i++) 4713e12c5d1SDavid du Colombier switch(c) { 4723e12c5d1SDavid du Colombier default: 473*219b2ee8SDavid du Colombier fprint(2, "usage: spell [-bcCvx] [-f file]\n"); 4743e12c5d1SDavid du Colombier exits(Usage); 4753e12c5d1SDavid du Colombier 476*219b2ee8SDavid du Colombier case 'a': 477*219b2ee8SDavid du Colombier aflag++; 478*219b2ee8SDavid du Colombier continue; 479*219b2ee8SDavid du Colombier 4803e12c5d1SDavid du Colombier case 'b': 4813e12c5d1SDavid du Colombier ise(); 482*219b2ee8SDavid du Colombier if(!fflag) 4833e12c5d1SDavid du Colombier codefile = brfile; 4843e12c5d1SDavid du Colombier continue; 4853e12c5d1SDavid du Colombier 486*219b2ee8SDavid du Colombier case 'C': /* for "correct" */ 487*219b2ee8SDavid du Colombier vflag++; 488*219b2ee8SDavid du Colombier case 'c': /* for ocr */ 4893e12c5d1SDavid du Colombier cflag++; 4903e12c5d1SDavid du Colombier continue; 4913e12c5d1SDavid du Colombier 4923e12c5d1SDavid du Colombier case 'v': 4933e12c5d1SDavid du Colombier vflag++; 4943e12c5d1SDavid du Colombier continue; 4953e12c5d1SDavid du Colombier 4963e12c5d1SDavid du Colombier case 'x': 4973e12c5d1SDavid du Colombier xflag++; 4983e12c5d1SDavid du Colombier continue; 4993e12c5d1SDavid du Colombier 5003e12c5d1SDavid du Colombier case 'f': 5013e12c5d1SDavid du Colombier if(argc <= 2) { 5023e12c5d1SDavid du Colombier fprint(2, "spell: -f requires another argument\n"); 5033e12c5d1SDavid du Colombier exits(Usage); 5043e12c5d1SDavid du Colombier } 5053e12c5d1SDavid du Colombier argv++; 5063e12c5d1SDavid du Colombier argc--; 5073e12c5d1SDavid du Colombier codefile = argv[1]; 508*219b2ee8SDavid du Colombier fflag++; 5093e12c5d1SDavid du Colombier goto brk; 5103e12c5d1SDavid du Colombier } 5113e12c5d1SDavid du Colombier brk: 5123e12c5d1SDavid du Colombier argv++; 5133e12c5d1SDavid du Colombier argc--; 5143e12c5d1SDavid du Colombier } 5153e12c5d1SDavid du Colombier readdict(codefile); 5163e12c5d1SDavid du Colombier if(argc > 1) { 517*219b2ee8SDavid du Colombier fprint(2, "usage: spell [-bcCvx] [-f file]\n"); 5183e12c5d1SDavid du Colombier exits(Usage); 5193e12c5d1SDavid du Colombier } 520*219b2ee8SDavid du Colombier if(aflag) 521*219b2ee8SDavid du Colombier cflag = vflag = 0; 5223e12c5d1SDavid du Colombier 5233e12c5d1SDavid du Colombier for(;;) { 5243e12c5d1SDavid du Colombier affix[0] = 0; 5253e12c5d1SDavid du Colombier original = Brdline(&bin, '\n'); 5263e12c5d1SDavid du Colombier if(original == 0) 5273e12c5d1SDavid du Colombier exits(0); 5283e12c5d1SDavid du Colombier original[Blinelen(&bin)-1] = 0; 5293e12c5d1SDavid du Colombier low = 0; 530*219b2ee8SDavid du Colombier 531*219b2ee8SDavid du Colombier if(aflag) { 532*219b2ee8SDavid du Colombier acmeid = original; 533*219b2ee8SDavid du Colombier while(*original != ':') 534*219b2ee8SDavid du Colombier if(*original++ == 0) 535*219b2ee8SDavid du Colombier exits(0); 536*219b2ee8SDavid du Colombier while(*++original != ':') 537*219b2ee8SDavid du Colombier if(*original == 0) 538*219b2ee8SDavid du Colombier exits(0); 539*219b2ee8SDavid du Colombier *original++ = 0; 540*219b2ee8SDavid du Colombier } 5413e12c5d1SDavid du Colombier for(ep=word,dp=original; j = *dp; ep++,dp++) { 542*219b2ee8SDavid du Colombier if(ISLOWER(j)) 5433e12c5d1SDavid du Colombier low++; 5443e12c5d1SDavid du Colombier if(ep >= word+sizeof(word)-1) 5453e12c5d1SDavid du Colombier break; 5463e12c5d1SDavid du Colombier *ep = j; 5473e12c5d1SDavid du Colombier } 5483e12c5d1SDavid du Colombier *ep = 0; 5493e12c5d1SDavid du Colombier 550*219b2ee8SDavid du Colombier if(ISDIGIT(word[0]) && ordinal()) 5513e12c5d1SDavid du Colombier continue; 5523e12c5d1SDavid du Colombier 5533e12c5d1SDavid du Colombier h = 0; 5543e12c5d1SDavid du Colombier if(!low && !(h = trypref(ep,".",0,ALL|STOP|DONT_TOUCH))) 5553e12c5d1SDavid du Colombier for(cp=original+1,dp=word+1; dp<ep; dp++,cp++) 5563e12c5d1SDavid du Colombier *dp = Tolower(*cp); 5573e12c5d1SDavid du Colombier if(!h) 5583e12c5d1SDavid du Colombier for(;;) { /* at most twice */ 5593e12c5d1SDavid du Colombier if(h = trypref(ep,".",0,ALL|STOP|DONT_TOUCH)) 5603e12c5d1SDavid du Colombier break; 5613e12c5d1SDavid du Colombier if(h = trysuff(ep,0,ALL|STOP|DONT_TOUCH)) 5623e12c5d1SDavid du Colombier break; 563*219b2ee8SDavid du Colombier if(!ISUPPER(word[0])) 5643e12c5d1SDavid du Colombier break; 5653e12c5d1SDavid du Colombier cp = original; 5663e12c5d1SDavid du Colombier dp = word; 5673e12c5d1SDavid du Colombier while(*dp = *cp++) { 5683e12c5d1SDavid du Colombier if(!low) 5693e12c5d1SDavid du Colombier *dp = Tolower(*dp); 5703e12c5d1SDavid du Colombier dp++; 5713e12c5d1SDavid du Colombier } 5723e12c5d1SDavid du Colombier word[0] = Tolower(word[0]); 5733e12c5d1SDavid du Colombier } 5743e12c5d1SDavid du Colombier 5753e12c5d1SDavid du Colombier if(cflag) { 5763e12c5d1SDavid du Colombier if(!h || Set(h,STOP)) 577*219b2ee8SDavid du Colombier print("-"); 578*219b2ee8SDavid du Colombier else if(!vflag) 579*219b2ee8SDavid du Colombier print("+"); 5803e12c5d1SDavid du Colombier else 581*219b2ee8SDavid du Colombier print("%c",'0' + (suffcount>0) + 582*219b2ee8SDavid du Colombier (prefcount>4? 8: 2*prefcount)); 583*219b2ee8SDavid du Colombier } else if(!h || Set(h,STOP)) { 584*219b2ee8SDavid du Colombier if(aflag) 585*219b2ee8SDavid du Colombier Bprint(&bout, "%s:%s\n", acmeid, original); 586*219b2ee8SDavid du Colombier else 587*219b2ee8SDavid du Colombier Bprint(&bout, "%s\n", original); 588*219b2ee8SDavid du Colombier } else if(affix[0] != 0 && affix[0] != '.') 589*219b2ee8SDavid du Colombier print("%s\t%s\n", affix, original); 5903e12c5d1SDavid du Colombier } 591*219b2ee8SDavid du Colombier exits(0); 5923e12c5d1SDavid du Colombier } 5933e12c5d1SDavid du Colombier 5943e12c5d1SDavid du Colombier /* strip exactly one suffix and do 5953e12c5d1SDavid du Colombier * indicated routine(s), which may recursively 5963e12c5d1SDavid du Colombier * strip suffixes 5973e12c5d1SDavid du Colombier */ 5983e12c5d1SDavid du Colombier Bits 5993e12c5d1SDavid du Colombier trysuff(char* ep, int lev, int flag) 6003e12c5d1SDavid du Colombier { 6013e12c5d1SDavid du Colombier Suftab *t; 6023e12c5d1SDavid du Colombier char *cp, *sp; 6033e12c5d1SDavid du Colombier Bits h = 0; 6043e12c5d1SDavid du Colombier int initchar = ep[-1]; 6053e12c5d1SDavid du Colombier 6063e12c5d1SDavid du Colombier flag &= ~MONO; 6073e12c5d1SDavid du Colombier lev += DLEV; 608*219b2ee8SDavid du Colombier if(lev < DSIZ) { 609*219b2ee8SDavid du Colombier deriv[lev] = emptyderiv; 610*219b2ee8SDavid du Colombier deriv[lev-1] = emptyderiv; 611*219b2ee8SDavid du Colombier } 612*219b2ee8SDavid du Colombier if(!ISLOWER(initchar)) 6133e12c5d1SDavid du Colombier return h; 6143e12c5d1SDavid du Colombier for(t=suftab[initchar-'a']; sp=t->suf; t++) { 6153e12c5d1SDavid du Colombier cp = ep; 6163e12c5d1SDavid du Colombier while(*sp) 6173e12c5d1SDavid du Colombier if(*--cp != *sp++) 6183e12c5d1SDavid du Colombier goto next; 619*219b2ee8SDavid du Colombier for(sp=ep-t->n1; --sp >= word && !ISVOWEL(*sp);) 6203e12c5d1SDavid du Colombier ; 6213e12c5d1SDavid du Colombier if(sp < word) 622*219b2ee8SDavid du Colombier continue; 6233e12c5d1SDavid du Colombier if(!(t->affixable & flag)) 6243e12c5d1SDavid du Colombier return 0; 6253e12c5d1SDavid du Colombier h = (*t->p1)(ep-t->n1, t->d1, t->a1, lev+1, t->flag|STOP); 6263e12c5d1SDavid du Colombier if(!h && t->p2!=0) { 627*219b2ee8SDavid du Colombier if(lev < DSIZ) { 628*219b2ee8SDavid du Colombier deriv[lev] = emptyderiv; 629*219b2ee8SDavid du Colombier deriv[lev+1] = emptyderiv; 630*219b2ee8SDavid du Colombier } 6313e12c5d1SDavid du Colombier h = (*t->p2)(ep-t->n2, t->d2, t->a2, lev, t->flag|STOP); 6323e12c5d1SDavid du Colombier } 6333e12c5d1SDavid du Colombier break; 6343e12c5d1SDavid du Colombier next:; 6353e12c5d1SDavid du Colombier } 6363e12c5d1SDavid du Colombier return h; 6373e12c5d1SDavid du Colombier } 6383e12c5d1SDavid du Colombier 6393e12c5d1SDavid du Colombier Bits 6403e12c5d1SDavid du Colombier nop(char* ep, char* d, char* a, int lev, int flag) 6413e12c5d1SDavid du Colombier { 6423e12c5d1SDavid du Colombier USED(ep, d, a, lev, flag); 6433e12c5d1SDavid du Colombier return 0; 6443e12c5d1SDavid du Colombier } 6453e12c5d1SDavid du Colombier 6463e12c5d1SDavid du Colombier Bits 6473e12c5d1SDavid du Colombier cstrip(char* ep, char* d, char* a, int lev, int flag) 6483e12c5d1SDavid du Colombier { 6493e12c5d1SDavid du Colombier int temp = ep[0]; 6503e12c5d1SDavid du Colombier 651*219b2ee8SDavid du Colombier if(ISVOWEL(temp) && ISVOWEL(ep[-1])) { 6523e12c5d1SDavid du Colombier switch(pair(ep[-1],ep[0])) { 6533e12c5d1SDavid du Colombier case pair('a', 'a'): 6543e12c5d1SDavid du Colombier case pair('a', 'e'): 6553e12c5d1SDavid du Colombier case pair('a', 'i'): 6563e12c5d1SDavid du Colombier case pair('e', 'a'): 6573e12c5d1SDavid du Colombier case pair('e', 'e'): 6583e12c5d1SDavid du Colombier case pair('e', 'i'): 6593e12c5d1SDavid du Colombier case pair('i', 'i'): 6603e12c5d1SDavid du Colombier case pair('o', 'a'): 6613e12c5d1SDavid du Colombier return 0; 6623e12c5d1SDavid du Colombier } 6633e12c5d1SDavid du Colombier } else 6643e12c5d1SDavid du Colombier if(temp==ep[-1]&&temp==ep[-2]) 6653e12c5d1SDavid du Colombier return 0; 6663e12c5d1SDavid du Colombier return strip(ep,d,a,lev,flag); 6673e12c5d1SDavid du Colombier } 6683e12c5d1SDavid du Colombier 6693e12c5d1SDavid du Colombier Bits 6703e12c5d1SDavid du Colombier strip(char* ep, char* d, char* a, int lev, int flag) 6713e12c5d1SDavid du Colombier { 6723e12c5d1SDavid du Colombier Bits h = trypref(ep, a, lev, flag); 6733e12c5d1SDavid du Colombier 6743e12c5d1SDavid du Colombier USED(d); 675*219b2ee8SDavid du Colombier if(Set(h,MONO) && ISVOWEL(*ep) && ISVOWEL(ep[-2])) 6763e12c5d1SDavid du Colombier h = 0; 6773e12c5d1SDavid du Colombier if(h) 6783e12c5d1SDavid du Colombier return h; 679*219b2ee8SDavid du Colombier if(ISVOWEL(*ep) && !ISVOWEL(ep[-1]) && ep[-1]==ep[-2]) { 6803e12c5d1SDavid du Colombier h = trypref(ep-1,a,lev,flag|MONO); 6813e12c5d1SDavid du Colombier if(h) 6823e12c5d1SDavid du Colombier return h; 6833e12c5d1SDavid du Colombier } 6843e12c5d1SDavid du Colombier return trysuff(ep,lev,flag); 6853e12c5d1SDavid du Colombier } 6863e12c5d1SDavid du Colombier 6873e12c5d1SDavid du Colombier Bits 6883e12c5d1SDavid du Colombier s(char* ep, char* d, char* a, int lev, int flag) 6893e12c5d1SDavid du Colombier { 6903e12c5d1SDavid du Colombier if(lev > DLEV+1) 6913e12c5d1SDavid du Colombier return 0; 6923e12c5d1SDavid du Colombier if(*ep=='s') { 6933e12c5d1SDavid du Colombier switch(ep[-1]) { 6943e12c5d1SDavid du Colombier case 'y': 695*219b2ee8SDavid du Colombier if(ISVOWEL(ep[-2])||ISUPPER(*word)) 6963e12c5d1SDavid du Colombier break; /*says Kennedys*/ 6973e12c5d1SDavid du Colombier case 'x': 6983e12c5d1SDavid du Colombier case 'z': 6993e12c5d1SDavid du Colombier case 's': 7003e12c5d1SDavid du Colombier return 0; 7013e12c5d1SDavid du Colombier case 'h': 7023e12c5d1SDavid du Colombier switch(ep[-2]) { 7033e12c5d1SDavid du Colombier case 'c': 7043e12c5d1SDavid du Colombier case 's': 7053e12c5d1SDavid du Colombier return 0; 7063e12c5d1SDavid du Colombier } 7073e12c5d1SDavid du Colombier } 7083e12c5d1SDavid du Colombier } 7093e12c5d1SDavid du Colombier return strip(ep,d,a,lev,flag); 7103e12c5d1SDavid du Colombier } 7113e12c5d1SDavid du Colombier 7123e12c5d1SDavid du Colombier Bits 7133e12c5d1SDavid du Colombier an(char* ep, char* d, char* a, int lev, int flag) 7143e12c5d1SDavid du Colombier { 7153e12c5d1SDavid du Colombier USED(d); 716*219b2ee8SDavid du Colombier if(!ISUPPER(*word)) /*must be proper name*/ 7173e12c5d1SDavid du Colombier return 0; 7183e12c5d1SDavid du Colombier return trypref(ep,a,lev,flag); 7193e12c5d1SDavid du Colombier } 7203e12c5d1SDavid du Colombier 7213e12c5d1SDavid du Colombier Bits 7223e12c5d1SDavid du Colombier ize(char* ep, char* d, char* a, int lev, int flag) 7233e12c5d1SDavid du Colombier { 7243e12c5d1SDavid du Colombier int temp = ep[-1]; 7253e12c5d1SDavid du Colombier Bits h; 7263e12c5d1SDavid du Colombier 7273e12c5d1SDavid du Colombier USED(a); 7283e12c5d1SDavid du Colombier ep[-1] = 'e'; 7293e12c5d1SDavid du Colombier h = strip(ep,"",d,lev,flag); 7303e12c5d1SDavid du Colombier ep[-1] = temp; 7313e12c5d1SDavid du Colombier return h; 7323e12c5d1SDavid du Colombier } 7333e12c5d1SDavid du Colombier 7343e12c5d1SDavid du Colombier Bits 7353e12c5d1SDavid du Colombier y_to_e(char* ep, char* d, char* a, int lev, int flag) 7363e12c5d1SDavid du Colombier { 7373e12c5d1SDavid du Colombier Bits h; 7383e12c5d1SDavid du Colombier int temp; 7393e12c5d1SDavid du Colombier 7403e12c5d1SDavid du Colombier USED(a); 7413e12c5d1SDavid du Colombier switch(ep[-1]) { 7423e12c5d1SDavid du Colombier case 'a': 7433e12c5d1SDavid du Colombier case 'e': 7443e12c5d1SDavid du Colombier case 'i': 7453e12c5d1SDavid du Colombier return 0; 7463e12c5d1SDavid du Colombier } 7473e12c5d1SDavid du Colombier temp = *ep; 7483e12c5d1SDavid du Colombier *ep++ = 'e'; 7493e12c5d1SDavid du Colombier h = strip(ep,"",d,lev,flag); 7503e12c5d1SDavid du Colombier ep[-1] = temp; 7513e12c5d1SDavid du Colombier return h; 7523e12c5d1SDavid du Colombier } 7533e12c5d1SDavid du Colombier 7543e12c5d1SDavid du Colombier Bits 7553e12c5d1SDavid du Colombier ily(char* ep, char* d, char* a, int lev, int flag) 7563e12c5d1SDavid du Colombier { 7573e12c5d1SDavid du Colombier int temp = ep[0]; 7583e12c5d1SDavid du Colombier char *cp = ep; 7593e12c5d1SDavid du Colombier 7603e12c5d1SDavid du Colombier if(temp==ep[-1]&&temp==ep[-2]) /* sillly */ 7613e12c5d1SDavid du Colombier return 0; 762*219b2ee8SDavid du Colombier if(*--cp=='y' && !ISVOWEL(*--cp)) /* happyly */ 7633e12c5d1SDavid du Colombier while(cp>word) 764*219b2ee8SDavid du Colombier if(ISVOWEL(*--cp)) /* shyness */ 7653e12c5d1SDavid du Colombier return 0; 7663e12c5d1SDavid du Colombier if(ep[-1]=='i') 7673e12c5d1SDavid du Colombier return i_to_y(ep,d,a,lev,flag); 7683e12c5d1SDavid du Colombier return cstrip(ep,d,a,lev,flag); 7693e12c5d1SDavid du Colombier } 7703e12c5d1SDavid du Colombier 7713e12c5d1SDavid du Colombier Bits 7723e12c5d1SDavid du Colombier bility(char* ep, char* d, char* a, int lev, int flag) 7733e12c5d1SDavid du Colombier { 7743e12c5d1SDavid du Colombier *ep++ = 'l'; 7753e12c5d1SDavid du Colombier return y_to_e(ep,d,a,lev,flag); 7763e12c5d1SDavid du Colombier } 7773e12c5d1SDavid du Colombier 7783e12c5d1SDavid du Colombier Bits 7793e12c5d1SDavid du Colombier i_to_y(char* ep, char* d, char* a, int lev, int flag) 7803e12c5d1SDavid du Colombier { 7813e12c5d1SDavid du Colombier Bits h; 7823e12c5d1SDavid du Colombier int temp; 7833e12c5d1SDavid du Colombier 784*219b2ee8SDavid du Colombier if(ISUPPER(*word)) 7853e12c5d1SDavid du Colombier return 0; 786*219b2ee8SDavid du Colombier if((temp=ep[-1])=='i' && !ISVOWEL(ep[-2])) { 7873e12c5d1SDavid du Colombier ep[-1] = 'y'; 7883e12c5d1SDavid du Colombier a = d; 7893e12c5d1SDavid du Colombier } 7903e12c5d1SDavid du Colombier h = cstrip(ep,"",a,lev,flag); 7913e12c5d1SDavid du Colombier ep[-1] = temp; 7923e12c5d1SDavid du Colombier return h; 7933e12c5d1SDavid du Colombier } 7943e12c5d1SDavid du Colombier 7953e12c5d1SDavid du Colombier Bits 7963e12c5d1SDavid du Colombier es(char* ep, char* d, char* a, int lev, int flag) 7973e12c5d1SDavid du Colombier { 7983e12c5d1SDavid du Colombier if(lev>DLEV) 7993e12c5d1SDavid du Colombier return 0; 8003e12c5d1SDavid du Colombier switch(ep[-1]) { 8013e12c5d1SDavid du Colombier default: 8023e12c5d1SDavid du Colombier return 0; 8033e12c5d1SDavid du Colombier case 'i': 8043e12c5d1SDavid du Colombier return i_to_y(ep,d,a,lev,flag); 8053e12c5d1SDavid du Colombier case 'h': 8063e12c5d1SDavid du Colombier switch(ep[-2]) { 8073e12c5d1SDavid du Colombier default: 8083e12c5d1SDavid du Colombier return 0; 8093e12c5d1SDavid du Colombier case 'c': 8103e12c5d1SDavid du Colombier case 's': 8113e12c5d1SDavid du Colombier break; 8123e12c5d1SDavid du Colombier } 8133e12c5d1SDavid du Colombier case 's': 8143e12c5d1SDavid du Colombier case 'z': 8153e12c5d1SDavid du Colombier case 'x': 8163e12c5d1SDavid du Colombier return strip(ep,d,a,lev,flag); 8173e12c5d1SDavid du Colombier } 8183e12c5d1SDavid du Colombier } 8193e12c5d1SDavid du Colombier 8203e12c5d1SDavid du Colombier Bits 8213e12c5d1SDavid du Colombier subst(char* ep, char* d, char* a, int lev, int flag) 8223e12c5d1SDavid du Colombier { 8233e12c5d1SDavid du Colombier char *u,*t; 8243e12c5d1SDavid du Colombier Bits h; 8253e12c5d1SDavid du Colombier 8263e12c5d1SDavid du Colombier USED(a); 8273e12c5d1SDavid du Colombier if(skipv(skipv(ep-1)) < word) 8283e12c5d1SDavid du Colombier return 0; 8293e12c5d1SDavid du Colombier for(t=d; *t!='+'; t++) 8303e12c5d1SDavid du Colombier continue; 8313e12c5d1SDavid du Colombier for(u=ep; *--t!='-';) 8323e12c5d1SDavid du Colombier *--u = *t; 8333e12c5d1SDavid du Colombier h = strip(ep,"",d,lev,flag); 8343e12c5d1SDavid du Colombier while(*++t != '+') 8353e12c5d1SDavid du Colombier continue; 8363e12c5d1SDavid du Colombier while(*++t) 8373e12c5d1SDavid du Colombier *u++ = *t; 8383e12c5d1SDavid du Colombier return h; 8393e12c5d1SDavid du Colombier } 8403e12c5d1SDavid du Colombier 8413e12c5d1SDavid du Colombier Bits 8423e12c5d1SDavid du Colombier tion(char* ep, char* d, char* a, int lev, int flag) 8433e12c5d1SDavid du Colombier { 8443e12c5d1SDavid du Colombier switch(ep[-2]) { 845*219b2ee8SDavid du Colombier default: 8463e12c5d1SDavid du Colombier return trypref(ep,a,lev,flag); 8473e12c5d1SDavid du Colombier case 'a': 8483e12c5d1SDavid du Colombier case 'e': 8493e12c5d1SDavid du Colombier case 'i': 8503e12c5d1SDavid du Colombier case 'o': 8513e12c5d1SDavid du Colombier case 'u': 8523e12c5d1SDavid du Colombier return y_to_e(ep,d,a,lev,flag); 8533e12c5d1SDavid du Colombier } 8543e12c5d1SDavid du Colombier } 8553e12c5d1SDavid du Colombier 8563e12c5d1SDavid du Colombier /* 8573e12c5d1SDavid du Colombier * possible consonant-consonant-e ending 8583e12c5d1SDavid du Colombier */ 8593e12c5d1SDavid du Colombier Bits 8603e12c5d1SDavid du Colombier CCe(char* ep, char* d, char* a, int lev, int flag) 8613e12c5d1SDavid du Colombier { 8623e12c5d1SDavid du Colombier Bits h; 8633e12c5d1SDavid du Colombier 8643e12c5d1SDavid du Colombier switch(ep[-1]) { 8653e12c5d1SDavid du Colombier case 'l': 866*219b2ee8SDavid du Colombier if(ISVOWEL(ep[-2])) 8673e12c5d1SDavid du Colombier break; 8683e12c5d1SDavid du Colombier switch(ep[-2]) { 8693e12c5d1SDavid du Colombier case 'l': 8703e12c5d1SDavid du Colombier case 'r': 8713e12c5d1SDavid du Colombier case 'w': 8723e12c5d1SDavid du Colombier break; 8733e12c5d1SDavid du Colombier default: 8743e12c5d1SDavid du Colombier return y_to_e(ep,d,a,lev,flag); 8753e12c5d1SDavid du Colombier } 8763e12c5d1SDavid du Colombier break; 8773e12c5d1SDavid du Colombier case 'c': 8783e12c5d1SDavid du Colombier case 'g': 8793e12c5d1SDavid du Colombier if(*ep == 'a') /* prevent -able for -eable */ 8803e12c5d1SDavid du Colombier return 0; 8813e12c5d1SDavid du Colombier case 's': 8823e12c5d1SDavid du Colombier case 'v': 8833e12c5d1SDavid du Colombier case 'z': 8843e12c5d1SDavid du Colombier if(ep[-2]==ep[-1]) 8853e12c5d1SDavid du Colombier break; 886*219b2ee8SDavid du Colombier if(ISVOWEL(ep[-2])) 8873e12c5d1SDavid du Colombier break; 8883e12c5d1SDavid du Colombier case 'u': 8893e12c5d1SDavid du Colombier if(h = y_to_e(ep,d,a,lev,flag)) 8903e12c5d1SDavid du Colombier return h; 8913e12c5d1SDavid du Colombier if(!(ep[-2]=='n' && ep[-1]=='g')) 8923e12c5d1SDavid du Colombier return 0; 8933e12c5d1SDavid du Colombier } 8943e12c5d1SDavid du Colombier return VCe(ep,d,a,lev,flag); 8953e12c5d1SDavid du Colombier } 8963e12c5d1SDavid du Colombier 8973e12c5d1SDavid du Colombier /* 8983e12c5d1SDavid du Colombier * possible consonant-vowel-consonant-e ending 8993e12c5d1SDavid du Colombier */ 9003e12c5d1SDavid du Colombier Bits 9013e12c5d1SDavid du Colombier VCe(char* ep, char* d, char* a, int lev, int flag) 9023e12c5d1SDavid du Colombier { 9033e12c5d1SDavid du Colombier int c; 9043e12c5d1SDavid du Colombier Bits h; 9053e12c5d1SDavid du Colombier 9063e12c5d1SDavid du Colombier c = ep[-1]; 9073e12c5d1SDavid du Colombier if(c=='e') 9083e12c5d1SDavid du Colombier return 0; 909*219b2ee8SDavid du Colombier if(!ISVOWEL(c) && ISVOWEL(ep[-2])) { 9103e12c5d1SDavid du Colombier c = *ep; 9113e12c5d1SDavid du Colombier *ep++ = 'e'; 9123e12c5d1SDavid du Colombier h = trypref(ep,d,lev,flag); 9133e12c5d1SDavid du Colombier if(!h) 9143e12c5d1SDavid du Colombier h = trysuff(ep,lev,flag); 9153e12c5d1SDavid du Colombier if(h) 9163e12c5d1SDavid du Colombier return h; 9173e12c5d1SDavid du Colombier ep--; 9183e12c5d1SDavid du Colombier *ep = c; 9193e12c5d1SDavid du Colombier } 9203e12c5d1SDavid du Colombier return cstrip(ep,d,a,lev,flag); 9213e12c5d1SDavid du Colombier } 9223e12c5d1SDavid du Colombier 9233e12c5d1SDavid du Colombier Ptab* 924*219b2ee8SDavid du Colombier lookuppref(uchar** wp, char* ep) 9253e12c5d1SDavid du Colombier { 9263e12c5d1SDavid du Colombier Ptab *sp; 927*219b2ee8SDavid du Colombier uchar *bp,*cp; 928*219b2ee8SDavid du Colombier unsigned int initchar = Tolower(**wp); 9293e12c5d1SDavid du Colombier 930*219b2ee8SDavid du Colombier if(!ISALPHA(initchar)) 9313e12c5d1SDavid du Colombier return 0; 9323e12c5d1SDavid du Colombier for(sp=preftab[initchar-'a'];sp->s;sp++) { 9333e12c5d1SDavid du Colombier bp = *wp; 934*219b2ee8SDavid du Colombier for(cp= (uchar*)sp->s;*cp; ) 9353e12c5d1SDavid du Colombier if(*bp++!=*cp++) 9363e12c5d1SDavid du Colombier goto next; 937*219b2ee8SDavid du Colombier for(cp=bp;cp<(uchar*)ep;cp++) 938*219b2ee8SDavid du Colombier if(ISVOWEL(*cp)) { 9393e12c5d1SDavid du Colombier *wp = bp; 9403e12c5d1SDavid du Colombier return sp; 9413e12c5d1SDavid du Colombier } 9423e12c5d1SDavid du Colombier next:; 9433e12c5d1SDavid du Colombier } 9443e12c5d1SDavid du Colombier return 0; 9453e12c5d1SDavid du Colombier } 9463e12c5d1SDavid du Colombier 9473e12c5d1SDavid du Colombier /* while word is not in dictionary try stripping 9483e12c5d1SDavid du Colombier * prefixes. Fail if no more prefixes. 9493e12c5d1SDavid du Colombier */ 9503e12c5d1SDavid du Colombier Bits 9513e12c5d1SDavid du Colombier trypref(char* ep, char* a, int lev, int flag) 9523e12c5d1SDavid du Colombier { 9533e12c5d1SDavid du Colombier Ptab *tp; 9543e12c5d1SDavid du Colombier char *bp, *cp; 9553e12c5d1SDavid du Colombier char *pp; 9563e12c5d1SDavid du Colombier Bits h; 9573e12c5d1SDavid du Colombier char space[20]; 9583e12c5d1SDavid du Colombier 959*219b2ee8SDavid du Colombier if(lev<DSIZ) { 960*219b2ee8SDavid du Colombier deriv[lev].mesg = a; 961*219b2ee8SDavid du Colombier deriv[lev].type = *a=='.'? NONE: SUFF; 962*219b2ee8SDavid du Colombier } 9633e12c5d1SDavid du Colombier if(h = tryword(word,ep,lev,flag)) { 9643e12c5d1SDavid du Colombier if(Set(h, flag&~MONO) && (flag&MONO) <= Set(h, MONO)) 9653e12c5d1SDavid du Colombier return h; 9663e12c5d1SDavid du Colombier h = 0; 9673e12c5d1SDavid du Colombier } 9683e12c5d1SDavid du Colombier bp = word; 9693e12c5d1SDavid du Colombier pp = space; 970*219b2ee8SDavid du Colombier if(lev<DSIZ) { 971*219b2ee8SDavid du Colombier deriv[lev+1].mesg = pp; 972*219b2ee8SDavid du Colombier deriv[lev+1].type = 0; 973*219b2ee8SDavid du Colombier } 974*219b2ee8SDavid du Colombier while(tp=lookuppref((uchar**)&bp,ep)) { 9753e12c5d1SDavid du Colombier *pp++ = '+'; 9763e12c5d1SDavid du Colombier cp = tp->s; 977*219b2ee8SDavid du Colombier while(pp<space+sizeof(space) && (*pp = *cp++)) 9783e12c5d1SDavid du Colombier pp++; 979*219b2ee8SDavid du Colombier deriv[lev+1].type += PREF; 9803e12c5d1SDavid du Colombier h = tryword(bp,ep,lev+1,flag); 9813e12c5d1SDavid du Colombier if(Set(h,NOPREF) || 9823e12c5d1SDavid du Colombier ((tp->flag&IN) && inun(bp-2,h)==0)) { 9833e12c5d1SDavid du Colombier h = 0; 9843e12c5d1SDavid du Colombier break; 9853e12c5d1SDavid du Colombier } 9863e12c5d1SDavid du Colombier if(Set(h,flag&~MONO) && (flag&MONO) <= Set(h, MONO)) 9873e12c5d1SDavid du Colombier break; 9883e12c5d1SDavid du Colombier h = 0; 9893e12c5d1SDavid du Colombier } 990*219b2ee8SDavid du Colombier if(lev < DSIZ) { 991*219b2ee8SDavid du Colombier deriv[lev+1] = emptyderiv; 992*219b2ee8SDavid du Colombier deriv[lev+2] = emptyderiv; 993*219b2ee8SDavid du Colombier } 9943e12c5d1SDavid du Colombier return h; 9953e12c5d1SDavid du Colombier } 9963e12c5d1SDavid du Colombier 9973e12c5d1SDavid du Colombier Bits 9983e12c5d1SDavid du Colombier tryword(char* bp, char* ep, int lev, int flag) 9993e12c5d1SDavid du Colombier { 10003e12c5d1SDavid du Colombier int j; 10013e12c5d1SDavid du Colombier Bits h = 0; 10023e12c5d1SDavid du Colombier char duple[3]; 10033e12c5d1SDavid du Colombier 10043e12c5d1SDavid du Colombier if(ep-bp <= 1) 10053e12c5d1SDavid du Colombier return h; 10063e12c5d1SDavid du Colombier if(flag&MONO) { 1007*219b2ee8SDavid du Colombier if(lev<DSIZ) { 1008*219b2ee8SDavid du Colombier deriv[++lev].mesg = duple; 1009*219b2ee8SDavid du Colombier deriv[lev].type = SUFF; 1010*219b2ee8SDavid du Colombier } 10113e12c5d1SDavid du Colombier duple[0] = '+'; 10123e12c5d1SDavid du Colombier duple[1] = *ep; 10133e12c5d1SDavid du Colombier duple[2] = 0; 10143e12c5d1SDavid du Colombier } 10153e12c5d1SDavid du Colombier h = dict(bp, ep); 10163e12c5d1SDavid du Colombier if(vflag==0 || h==0) 10173e12c5d1SDavid du Colombier return h; 10183e12c5d1SDavid du Colombier /* 10193e12c5d1SDavid du Colombier * when derivations are wanted, collect them 10203e12c5d1SDavid du Colombier * for printing 10213e12c5d1SDavid du Colombier */ 10223e12c5d1SDavid du Colombier j = lev; 1023*219b2ee8SDavid du Colombier prefcount = suffcount = 0; 10243e12c5d1SDavid du Colombier do { 1025*219b2ee8SDavid du Colombier if(j<DSIZ && deriv[j].type) { 1026*219b2ee8SDavid du Colombier strcat(affix, deriv[j].mesg); 1027*219b2ee8SDavid du Colombier if(deriv[j].type == SUFF) 1028*219b2ee8SDavid du Colombier suffcount++; 1029*219b2ee8SDavid du Colombier else if(deriv[j].type != NONE) 1030*219b2ee8SDavid du Colombier prefcount = deriv[j].type/PREF; 1031*219b2ee8SDavid du Colombier } 10323e12c5d1SDavid du Colombier } while(--j > 0); 10333e12c5d1SDavid du Colombier return h; 10343e12c5d1SDavid du Colombier } 10353e12c5d1SDavid du Colombier 10363e12c5d1SDavid du Colombier int 10373e12c5d1SDavid du Colombier inun(char* bp, Bits h) 10383e12c5d1SDavid du Colombier { 10393e12c5d1SDavid du Colombier if(*bp == 'u') 10403e12c5d1SDavid du Colombier return Set(h, IN) == 0; 10413e12c5d1SDavid du Colombier /* *bp == 'i' */ 10423e12c5d1SDavid du Colombier if(Set(h, IN) == 0) 10433e12c5d1SDavid du Colombier return 0; 10443e12c5d1SDavid du Colombier switch(bp[2]) { 10453e12c5d1SDavid du Colombier case 'r': 10463e12c5d1SDavid du Colombier return bp[1] == 'r'; 10473e12c5d1SDavid du Colombier case 'm': 10483e12c5d1SDavid du Colombier case 'p': 10493e12c5d1SDavid du Colombier return bp[1] == 'm'; 10503e12c5d1SDavid du Colombier } 1051*219b2ee8SDavid du Colombier return bp[1] == 'n'; 10523e12c5d1SDavid du Colombier } 10533e12c5d1SDavid du Colombier 10543e12c5d1SDavid du Colombier char* 10553e12c5d1SDavid du Colombier skipv(char *s) 10563e12c5d1SDavid du Colombier { 1057*219b2ee8SDavid du Colombier if(s >= word && ISVOWEL(*s)) 10583e12c5d1SDavid du Colombier s--; 1059*219b2ee8SDavid du Colombier while(s >= word && !ISVOWEL(*s)) 10603e12c5d1SDavid du Colombier s--; 10613e12c5d1SDavid du Colombier return s; 10623e12c5d1SDavid du Colombier } 10633e12c5d1SDavid du Colombier 10643e12c5d1SDavid du Colombier /* 10653e12c5d1SDavid du Colombier * crummy way to Britishise 10663e12c5d1SDavid du Colombier */ 10673e12c5d1SDavid du Colombier void 10683e12c5d1SDavid du Colombier ise(void) 10693e12c5d1SDavid du Colombier { 10703e12c5d1SDavid du Colombier Suftab *p; 10713e12c5d1SDavid du Colombier int i; 10723e12c5d1SDavid du Colombier 10733e12c5d1SDavid du Colombier for(i=0; i<26; i++) 10743e12c5d1SDavid du Colombier for(p = suftab[i]; p->suf; p++) { 10753e12c5d1SDavid du Colombier p->suf = ztos(p->suf); 10763e12c5d1SDavid du Colombier p->d1 = ztos(p->d1); 10773e12c5d1SDavid du Colombier p->a1 = ztos(p->a1); 10783e12c5d1SDavid du Colombier } 10793e12c5d1SDavid du Colombier } 10803e12c5d1SDavid du Colombier 10813e12c5d1SDavid du Colombier char* 10823e12c5d1SDavid du Colombier ztos(char *as) 10833e12c5d1SDavid du Colombier { 10843e12c5d1SDavid du Colombier char *s, *ds; 10853e12c5d1SDavid du Colombier 10863e12c5d1SDavid du Colombier for(s=as; *s; s++) 10873e12c5d1SDavid du Colombier if(*s == 'z') 10883e12c5d1SDavid du Colombier goto copy; 10893e12c5d1SDavid du Colombier return as; 10903e12c5d1SDavid du Colombier 10913e12c5d1SDavid du Colombier copy: 10923e12c5d1SDavid du Colombier ds = strdup(as); 10933e12c5d1SDavid du Colombier for(s=ds; *s; s++) 10943e12c5d1SDavid du Colombier if(*s == 'z') 10953e12c5d1SDavid du Colombier *s = 's'; 10963e12c5d1SDavid du Colombier return ds; 10973e12c5d1SDavid du Colombier } 10983e12c5d1SDavid du Colombier 10993e12c5d1SDavid du Colombier Bits 11003e12c5d1SDavid du Colombier dict(char* bp, char* ep) 11013e12c5d1SDavid du Colombier { 11023e12c5d1SDavid du Colombier char *cp, *cp1, *w, *wp, *we; 11033e12c5d1SDavid du Colombier int n, f; 11043e12c5d1SDavid du Colombier 11053e12c5d1SDavid du Colombier w = bp; 11063e12c5d1SDavid du Colombier we = ep; 11073e12c5d1SDavid du Colombier n = ep-bp; 11083e12c5d1SDavid du Colombier if(n <= 1) 11093e12c5d1SDavid du Colombier return NOUN; 11103e12c5d1SDavid du Colombier 11113e12c5d1SDavid du Colombier f = w[0] & 0x7f; 11123e12c5d1SDavid du Colombier f *= 128; 11133e12c5d1SDavid du Colombier f += w[1] & 0x7f; 11143e12c5d1SDavid du Colombier bp = spacep[f]; 11153e12c5d1SDavid du Colombier ep = spacep[f+1]; 11163e12c5d1SDavid du Colombier 11173e12c5d1SDavid du Colombier loop: 11183e12c5d1SDavid du Colombier if(bp >= ep) { 11193e12c5d1SDavid du Colombier if(xflag) 11203e12c5d1SDavid du Colombier fprint(2, "=%.*s\n", n, w); 11213e12c5d1SDavid du Colombier return 0; 11223e12c5d1SDavid du Colombier } 11233e12c5d1SDavid du Colombier /* 11243e12c5d1SDavid du Colombier * find the beginning of some word in the middle 11253e12c5d1SDavid du Colombier */ 11263e12c5d1SDavid du Colombier cp = bp + (ep-bp)/2; 11273e12c5d1SDavid du Colombier 11283e12c5d1SDavid du Colombier while(cp > bp && !(*cp & 0x80)) 11293e12c5d1SDavid du Colombier cp--; 11303e12c5d1SDavid du Colombier while(cp > bp && (cp[-1] & 0x80)) 11313e12c5d1SDavid du Colombier cp--; 11323e12c5d1SDavid du Colombier 11333e12c5d1SDavid du Colombier wp = w + 2; /* skip two letters */ 1134*219b2ee8SDavid du Colombier cp1 = cp + 2; /* skip affix code */ 11353e12c5d1SDavid du Colombier for(;;) { 11363e12c5d1SDavid du Colombier if(wp >= we) { 11373e12c5d1SDavid du Colombier if(*cp1 & 0x80) 11383e12c5d1SDavid du Colombier goto found; 1139*219b2ee8SDavid du Colombier else 11403e12c5d1SDavid du Colombier f = 1; 11413e12c5d1SDavid du Colombier break; 11423e12c5d1SDavid du Colombier } 11433e12c5d1SDavid du Colombier if(*cp1 & 0x80) { 11443e12c5d1SDavid du Colombier f = -1; 11453e12c5d1SDavid du Colombier break; 11463e12c5d1SDavid du Colombier } 11473e12c5d1SDavid du Colombier f = *cp1++ - *wp++; 11483e12c5d1SDavid du Colombier if(f != 0) 11493e12c5d1SDavid du Colombier break; 11503e12c5d1SDavid du Colombier } 11513e12c5d1SDavid du Colombier 11523e12c5d1SDavid du Colombier if(f < 0) { 11533e12c5d1SDavid du Colombier while(!(*cp1 & 0x80)) 11543e12c5d1SDavid du Colombier cp1++; 11553e12c5d1SDavid du Colombier bp = cp1; 11563e12c5d1SDavid du Colombier goto loop; 11573e12c5d1SDavid du Colombier } 11583e12c5d1SDavid du Colombier ep = cp; 11593e12c5d1SDavid du Colombier goto loop; 11603e12c5d1SDavid du Colombier 11613e12c5d1SDavid du Colombier found: 11623e12c5d1SDavid du Colombier f = ((cp[0] & 0x7) << 8) | 11633e12c5d1SDavid du Colombier (cp[1] & 0xff); 11643e12c5d1SDavid du Colombier if(xflag) { 11653e12c5d1SDavid du Colombier fprint(2, "=%.*s ", n, w); 11663e12c5d1SDavid du Colombier typeprint(encode[f]); 11673e12c5d1SDavid du Colombier } 11683e12c5d1SDavid du Colombier return encode[f]; 11693e12c5d1SDavid du Colombier } 11703e12c5d1SDavid du Colombier 11713e12c5d1SDavid du Colombier void 11723e12c5d1SDavid du Colombier typeprint(Bits h) 11733e12c5d1SDavid du Colombier { 11743e12c5d1SDavid du Colombier 11753e12c5d1SDavid du Colombier pcomma(""); 11763e12c5d1SDavid du Colombier if(h & NOUN) 11773e12c5d1SDavid du Colombier pcomma("n"); 11783e12c5d1SDavid du Colombier if(h & PROP_COLLECT) 11793e12c5d1SDavid du Colombier pcomma("pc"); 11803e12c5d1SDavid du Colombier if(h & VERB) { 11813e12c5d1SDavid du Colombier if((h & VERB) == VERB) 11823e12c5d1SDavid du Colombier pcomma("v"); 11833e12c5d1SDavid du Colombier else 11843e12c5d1SDavid du Colombier if((h & VERB) == V_IRREG) 11853e12c5d1SDavid du Colombier pcomma("vi"); 11863e12c5d1SDavid du Colombier else 11873e12c5d1SDavid du Colombier if(h & ED) 11883e12c5d1SDavid du Colombier pcomma("ed"); 11893e12c5d1SDavid du Colombier } 11903e12c5d1SDavid du Colombier if(h & ADJ) 11913e12c5d1SDavid du Colombier pcomma("a"); 11923e12c5d1SDavid du Colombier if(h & COMP) { 11933e12c5d1SDavid du Colombier if((h & COMP) == ACTOR) 11943e12c5d1SDavid du Colombier pcomma("er"); 11953e12c5d1SDavid du Colombier else 11963e12c5d1SDavid du Colombier pcomma("comp"); 11973e12c5d1SDavid du Colombier } 11983e12c5d1SDavid du Colombier if(h & DONT_TOUCH) 11993e12c5d1SDavid du Colombier pcomma("d"); 12003e12c5d1SDavid du Colombier if(h & N_AFFIX) 12013e12c5d1SDavid du Colombier pcomma("na"); 12023e12c5d1SDavid du Colombier if(h & ADV) 12033e12c5d1SDavid du Colombier pcomma("adv"); 12043e12c5d1SDavid du Colombier if(h & ION) 12053e12c5d1SDavid du Colombier pcomma("ion"); 12063e12c5d1SDavid du Colombier if(h & V_AFFIX) 12073e12c5d1SDavid du Colombier pcomma("va"); 12083e12c5d1SDavid du Colombier if(h & MAN) 12093e12c5d1SDavid du Colombier pcomma("man"); 12103e12c5d1SDavid du Colombier if(h & NOPREF) 12113e12c5d1SDavid du Colombier pcomma("nopref"); 12123e12c5d1SDavid du Colombier if(h & MONO) 12133e12c5d1SDavid du Colombier pcomma("ms"); 12143e12c5d1SDavid du Colombier if(h & IN) 12153e12c5d1SDavid du Colombier pcomma("in"); 12163e12c5d1SDavid du Colombier if(h & _Y) 12173e12c5d1SDavid du Colombier pcomma("y"); 12183e12c5d1SDavid du Colombier if(h & STOP) 12193e12c5d1SDavid du Colombier pcomma("s"); 12203e12c5d1SDavid du Colombier fprint(2, "\n"); 12213e12c5d1SDavid du Colombier } 12223e12c5d1SDavid du Colombier 12233e12c5d1SDavid du Colombier void 12243e12c5d1SDavid du Colombier pcomma(char *s) 12253e12c5d1SDavid du Colombier { 12263e12c5d1SDavid du Colombier static flag; 12273e12c5d1SDavid du Colombier 12283e12c5d1SDavid du Colombier if(*s == 0) { 12293e12c5d1SDavid du Colombier flag = 0; 12303e12c5d1SDavid du Colombier return; 12313e12c5d1SDavid du Colombier } 12323e12c5d1SDavid du Colombier if(!flag) { 12333e12c5d1SDavid du Colombier fprint(2, "%s", s); 12343e12c5d1SDavid du Colombier flag = 1; 12353e12c5d1SDavid du Colombier } else 12363e12c5d1SDavid du Colombier fprint(2, ",%s", s); 12373e12c5d1SDavid du Colombier } 12383e12c5d1SDavid du Colombier 12393e12c5d1SDavid du Colombier /* 12403e12c5d1SDavid du Colombier * is the word on of the following 12413e12c5d1SDavid du Colombier * 12th teen 12423e12c5d1SDavid du Colombier * 21st end in 1 12433e12c5d1SDavid du Colombier * 23rd end in 3 12443e12c5d1SDavid du Colombier * 77th default 12453e12c5d1SDavid du Colombier * called knowing word[0] is a digit 12463e12c5d1SDavid du Colombier */ 12473e12c5d1SDavid du Colombier int 12483e12c5d1SDavid du Colombier ordinal(void) 12493e12c5d1SDavid du Colombier { 1250*219b2ee8SDavid du Colombier char *cp = word; 1251*219b2ee8SDavid du Colombier static char sp[4]; 12523e12c5d1SDavid du Colombier 1253*219b2ee8SDavid du Colombier while(ISDIGIT(*cp)) 12543e12c5d1SDavid du Colombier cp++; 1255*219b2ee8SDavid du Colombier strncpy(sp,cp,3); 1256*219b2ee8SDavid du Colombier if(ISUPPER(cp[0]) && ISUPPER(cp[1])) { 1257*219b2ee8SDavid du Colombier sp[0] = Tolower(cp[0]); 1258*219b2ee8SDavid du Colombier sp[1] = Tolower(cp[1]); 12593e12c5d1SDavid du Colombier } 1260*219b2ee8SDavid du Colombier return 0 == strncmp(sp, 1261*219b2ee8SDavid du Colombier cp[-2]=='1'? "th": /* out of bounds if 1 digit */ 1262*219b2ee8SDavid du Colombier *--cp=='1'? "st": /* harmless */ 1263*219b2ee8SDavid du Colombier *cp=='2'? "nd": 1264*219b2ee8SDavid du Colombier *cp=='3'? "rd": 1265*219b2ee8SDavid du Colombier "th", 3); 12663e12c5d1SDavid du Colombier } 12673e12c5d1SDavid du Colombier 12683e12c5d1SDavid du Colombier /* 12693e12c5d1SDavid du Colombier * read in the dictionary. 12703e12c5d1SDavid du Colombier * format is 12713e12c5d1SDavid du Colombier * { 12723e12c5d1SDavid du Colombier * short nencode; 12733e12c5d1SDavid du Colombier * long encode[nencode]; 12743e12c5d1SDavid du Colombier * char space[*]; 12753e12c5d1SDavid du Colombier * }; 12763e12c5d1SDavid du Colombier * 12773e12c5d1SDavid du Colombier * the encodings are a table all different 12783e12c5d1SDavid du Colombier * affixes. 12793e12c5d1SDavid du Colombier * the dictionary proper has 2 bytes 12803e12c5d1SDavid du Colombier * that demark and then the rest of the 12813e12c5d1SDavid du Colombier * word. the 2 bytes have the following 12823e12c5d1SDavid du Colombier * 0x80 0x00 flag 12833e12c5d1SDavid du Colombier * 0x78 0x00 count of prefix bytes 12843e12c5d1SDavid du Colombier * common with prev word 12853e12c5d1SDavid du Colombier * 0x07 0xff affix code 12863e12c5d1SDavid du Colombier * 12873e12c5d1SDavid du Colombier * all ints are big endians in the file. 12883e12c5d1SDavid du Colombier */ 12893e12c5d1SDavid du Colombier void 12903e12c5d1SDavid du Colombier readdict(char *file) 12913e12c5d1SDavid du Colombier { 12923e12c5d1SDavid du Colombier char *s, *is, *lasts, *ls; 12933e12c5d1SDavid du Colombier int c, i, sp, p; 12943e12c5d1SDavid du Colombier int f; 12953e12c5d1SDavid du Colombier long l; 12963e12c5d1SDavid du Colombier 1297*219b2ee8SDavid du Colombier lasts = 0; 12983e12c5d1SDavid du Colombier f = open(file, 0); 12993e12c5d1SDavid du Colombier if(f == -1) { 13003e12c5d1SDavid du Colombier fprint(2, "cannot open %s\n", file); 13013e12c5d1SDavid du Colombier exits("open"); 13023e12c5d1SDavid du Colombier } 13033e12c5d1SDavid du Colombier if(read(f, space, 2) != 2) 13043e12c5d1SDavid du Colombier goto bad; 13053e12c5d1SDavid du Colombier nencode = ((space[0]&0xff)<<8) | (space[1]&0xff); 13063e12c5d1SDavid du Colombier if(read(f, space, 4*nencode) != 4*nencode) 13073e12c5d1SDavid du Colombier goto bad; 13083e12c5d1SDavid du Colombier s = space; 13093e12c5d1SDavid du Colombier for(i=0; i<nencode; i++) { 13103e12c5d1SDavid du Colombier l = (long)(s[0] & 0xff) << 24; 13113e12c5d1SDavid du Colombier l |= (s[1] & 0xff) << 16; 13123e12c5d1SDavid du Colombier l |= (s[2] & 0xff) << 8; 13133e12c5d1SDavid du Colombier l |= s[3] & 0xff; 13143e12c5d1SDavid du Colombier encode[i] = (Bits)l; 13153e12c5d1SDavid du Colombier s += 4; 13163e12c5d1SDavid du Colombier } 13173e12c5d1SDavid du Colombier l = read(f, space, sizeof(space)); 13183e12c5d1SDavid du Colombier if(l == sizeof(space)) 13193e12c5d1SDavid du Colombier goto noroom; 13203e12c5d1SDavid du Colombier is = space + (sizeof(space) - l); 13213e12c5d1SDavid du Colombier memmove(is, space, l); 13223e12c5d1SDavid du Colombier 13233e12c5d1SDavid du Colombier s = space; 13243e12c5d1SDavid du Colombier c = *is++ & 0xff; 13253e12c5d1SDavid du Colombier sp = -1; 13263e12c5d1SDavid du Colombier i = 0; 13273e12c5d1SDavid du Colombier 13283e12c5d1SDavid du Colombier loop: 13293e12c5d1SDavid du Colombier if(s > is) 13303e12c5d1SDavid du Colombier goto noroom; 13313e12c5d1SDavid du Colombier if(c < 0) { 13323e12c5d1SDavid du Colombier close(f); 13333e12c5d1SDavid du Colombier while(sp < 128*128) 13343e12c5d1SDavid du Colombier spacep[++sp] = s; 13353e12c5d1SDavid du Colombier *s = 0x80; /* fence */ 13363e12c5d1SDavid du Colombier return; 13373e12c5d1SDavid du Colombier } 13383e12c5d1SDavid du Colombier p = (c>>3) & 0xf; 13393e12c5d1SDavid du Colombier *s++ = c; 13403e12c5d1SDavid du Colombier *s++ = *is++ & 0xff; 13413e12c5d1SDavid du Colombier if(p <= 0) 13423e12c5d1SDavid du Colombier i = (*is++ & 0xff)*128; 13433e12c5d1SDavid du Colombier if(p <= 1) { 13443e12c5d1SDavid du Colombier if(!(*is & 0x80)) 13453e12c5d1SDavid du Colombier i = i/128*128 + (*is++ & 0xff); 13463e12c5d1SDavid du Colombier if(i <= sp) { 13473e12c5d1SDavid du Colombier fprint(2, "the dict isnt sorted or \n"); 13483e12c5d1SDavid du Colombier fprint(2, "memmove didn't work\n"); 13493e12c5d1SDavid du Colombier goto bad; 13503e12c5d1SDavid du Colombier } 13513e12c5d1SDavid du Colombier while(sp < i) 13523e12c5d1SDavid du Colombier spacep[++sp] = s-2; 13533e12c5d1SDavid du Colombier } 13543e12c5d1SDavid du Colombier ls = lasts; 13553e12c5d1SDavid du Colombier lasts = s; 13563e12c5d1SDavid du Colombier for(p-=2; p>0; p--) 13573e12c5d1SDavid du Colombier *s++ = *ls++; 13583e12c5d1SDavid du Colombier for(;;) { 13593e12c5d1SDavid du Colombier if(is >= space+sizeof(space)) { 13603e12c5d1SDavid du Colombier c = -1; 13613e12c5d1SDavid du Colombier break; 13623e12c5d1SDavid du Colombier } 13633e12c5d1SDavid du Colombier c = *is++ & 0xff; 13643e12c5d1SDavid du Colombier if(c & 0x80) 13653e12c5d1SDavid du Colombier break; 13663e12c5d1SDavid du Colombier *s++ = c; 13673e12c5d1SDavid du Colombier } 13683e12c5d1SDavid du Colombier *s = 0; 13693e12c5d1SDavid du Colombier goto loop; 13703e12c5d1SDavid du Colombier 13713e12c5d1SDavid du Colombier bad: 13723e12c5d1SDavid du Colombier fprint(2, "trouble reading %s\n", file); 13733e12c5d1SDavid du Colombier exits("read"); 13743e12c5d1SDavid du Colombier noroom: 13753e12c5d1SDavid du Colombier fprint(2, "not enough space for dictionary\n"); 13763e12c5d1SDavid du Colombier exits("space"); 13773e12c5d1SDavid du Colombier } 1378