1*4887Schin /*********************************************************************** 2*4887Schin * * 3*4887Schin * This software is part of the ast package * 4*4887Schin * Copyright (c) 1982-2007 AT&T Knowledge Ventures * 5*4887Schin * and is licensed under the * 6*4887Schin * Common Public License, Version 1.0 * 7*4887Schin * by AT&T Knowledge Ventures * 8*4887Schin * * 9*4887Schin * A copy of the License is available at * 10*4887Schin * http://www.opensource.org/licenses/cpl1.0.txt * 11*4887Schin * (with md5 checksum 059e8cd6165cb4c31e351f2b69388fd9) * 12*4887Schin * * 13*4887Schin * Information and Software Systems Research * 14*4887Schin * AT&T Research * 15*4887Schin * Florham Park NJ * 16*4887Schin * * 17*4887Schin * David Korn <dgk@research.att.com> * 18*4887Schin * * 19*4887Schin ***********************************************************************/ 20*4887Schin #pragma prototyped 21*4887Schin #ifndef S_BREAK 22*4887Schin #define S_BREAK 1 /* end of token */ 23*4887Schin #define S_EOF 2 /* end of buffer */ 24*4887Schin #define S_NL 3 /* new-line when not a token */ 25*4887Schin #define S_RES 4 /* first character of reserved word */ 26*4887Schin #define S_NAME 5 /* other identifier characters */ 27*4887Schin #define S_REG 6 /* non-special characters */ 28*4887Schin #define S_TILDE 7 /* first char is tilde */ 29*4887Schin #define S_PUSH 8 30*4887Schin #define S_POP 9 31*4887Schin #define S_BRACT 10 32*4887Schin #define S_LIT 11 /* literal quote character */ 33*4887Schin #define S_NLTOK 12 /* new-line token */ 34*4887Schin #define S_OP 13 /* operator character */ 35*4887Schin #define S_PAT 14 /* pattern characters * and ? */ 36*4887Schin #define S_EPAT 15 /* pattern char when followed by ( */ 37*4887Schin #define S_EQ 16 /* assignment character */ 38*4887Schin #define S_COM 17 /* comment character */ 39*4887Schin #define S_MOD1 18 /* ${...} modifier character - old quoting */ 40*4887Schin #define S_MOD2 19 /* ${...} modifier character - new quoting */ 41*4887Schin #define S_ERR 20 /* invalid character in ${...} */ 42*4887Schin #define S_SPC1 21 /* special prefix characters after $ */ 43*4887Schin #define S_SPC2 22 /* special characters after $ */ 44*4887Schin #define S_DIG 23 /* digit character after $*/ 45*4887Schin #define S_ALP 24 /* alpahbetic character after $ */ 46*4887Schin #define S_LBRA 25 /* left brace after $ */ 47*4887Schin #define S_RBRA 26 /* right brace after $ */ 48*4887Schin #define S_PAR 27 /* set for $( */ 49*4887Schin #define S_ENDCH 28 /* macro expansion terminator */ 50*4887Schin #define S_SLASH 29 /* / character terminates ~ expansion */ 51*4887Schin #define S_COLON 30 /* for character : */ 52*4887Schin #define S_LABEL 31 /* for goto label */ 53*4887Schin #define S_EDOL 32 /* ends $identifier */ 54*4887Schin #define S_BRACE 33 /* left brace */ 55*4887Schin #define S_DOT 34 /* . char */ 56*4887Schin #define S_META 35 /* | & ; < > inside ${...} reserved for future use */ 57*4887Schin #define S_SPACE S_BREAK /* IFS space characters */ 58*4887Schin #define S_DELIM S_RES /* IFS delimter characters */ 59*4887Schin #define S_MBYTE S_NAME /* IFS first byte of multi-byte char */ 60*4887Schin #define S_BLNK 36 /* space or tab */ 61*4887Schin /* The following must be the highest numbered states */ 62*4887Schin #define S_QUOTE 37 /* double quote character */ 63*4887Schin #define S_GRAVE 38 /* old comsub character */ 64*4887Schin #define S_ESC 39 /* escape character */ 65*4887Schin #define S_DOL 40 /* $ subsitution character */ 66*4887Schin #define S_ESC2 41 /* escape character inside '...' */ 67*4887Schin 68*4887Schin /* These are the lexical state table names */ 69*4887Schin #define ST_BEGIN 0 70*4887Schin #define ST_NAME 1 71*4887Schin #define ST_NORM 2 72*4887Schin #define ST_LIT 3 73*4887Schin #define ST_QUOTE 4 74*4887Schin #define ST_NESTED 5 75*4887Schin #define ST_DOL 6 76*4887Schin #define ST_BRACE 7 77*4887Schin #define ST_DOLNAME 8 78*4887Schin #define ST_MACRO 9 79*4887Schin #define ST_QNEST 10 80*4887Schin #define ST_NONE 11 81*4887Schin 82*4887Schin #include "FEATURE/locale" 83*4887Schin 84*4887Schin #if _hdr_wchar 85*4887Schin # include <wchar.h> 86*4887Schin # if _hdr_wctype 87*4887Schin # include <wctype.h> 88*4887Schin # undef isalpha 89*4887Schin # define isalpha(x) iswalpha(x) 90*4887Schin # if defined(iswblank) || _lib_iswblank 91*4887Schin # undef isblank 92*4887Schin # define isblank(x) iswblank(x) 93*4887Schin # else 94*4887Schin # if _lib_wctype && _lib_iswctype 95*4887Schin # define _lib_iswblank -1 96*4887Schin # undef isblank 97*4887Schin # define isblank(x) local_iswblank(x) 98*4887Schin extern int local_iswblank(wchar_t); 99*4887Schin # endif 100*4887Schin # endif 101*4887Schin # endif 102*4887Schin #endif 103*4887Schin #ifndef isblank 104*4887Schin # define isblank(x) ((x)==' '||(x)=='\t') 105*4887Schin #endif 106*4887Schin 107*4887Schin #undef LEN 108*4887Schin #if SHOPT_MULTIBYTE 109*4887Schin static int NXT, LEN; 110*4887Schin # define isaname(c) ((c)>0xff?isalpha(c): sh_lexstates[ST_NAME][(c)]==0) 111*4887Schin # define isaletter(c) ((c)>0xff?isalpha(c): sh_lexstates[ST_DOL][(c)]==S_ALP && (c)!='.') 112*4887Schin #else 113*4887Schin # undef mbwide 114*4887Schin # define mbwide() (0) 115*4887Schin # define LEN 1 116*4887Schin # define isaname(c) (sh_lexstates[ST_NAME][c]==0) 117*4887Schin # define isaletter(c) (sh_lexstates[ST_DOL][c]==S_ALP && (c)!='.') 118*4887Schin #endif 119*4887Schin #define STATE(s,c) (mbwide()?(c=fcmbstate(s,&NXT,&LEN),NXT):s[c=fcget()]) 120*4887Schin #define isadigit(c) (sh_lexstates[ST_DOL][c]==S_DIG) 121*4887Schin #define isastchar(c) ((c)=='@' || (c)=='*') 122*4887Schin #define isexp(c) (sh_lexstates[ST_MACRO][c]==S_PAT||(c)=='$'||(c)=='`') 123*4887Schin #define ismeta(c) (sh_lexstates[ST_NAME][c]==S_BREAK) 124*4887Schin 125*4887Schin extern char *sh_lexstates[ST_NONE]; 126*4887Schin extern const char *sh_lexrstates[ST_NONE]; 127*4887Schin extern const char e_lexversion[]; 128*4887Schin extern const char e_lexspace[]; 129*4887Schin extern const char e_lexslash[]; 130*4887Schin extern const char e_lexlabignore[]; 131*4887Schin extern const char e_lexlabunknown[]; 132*4887Schin extern const char e_lexsyntax1[]; 133*4887Schin extern const char e_lexsyntax2[]; 134*4887Schin extern const char e_lexsyntax3[]; 135*4887Schin extern const char e_lexobsolete1[]; 136*4887Schin extern const char e_lexobsolete2[]; 137*4887Schin extern const char e_lexobsolete3[]; 138*4887Schin extern const char e_lexobsolete4[]; 139*4887Schin extern const char e_lexobsolete5[]; 140*4887Schin extern const char e_lexobsolete6[]; 141*4887Schin extern const char e_lexusebrace[]; 142*4887Schin extern const char e_lexusequote[]; 143*4887Schin extern const char e_lexescape[]; 144*4887Schin extern const char e_lexquote[]; 145*4887Schin extern const char e_lexnested[]; 146*4887Schin extern const char e_lexbadchar[]; 147*4887Schin extern const char e_lexlongquote[]; 148*4887Schin extern const char e_lexfuture[]; 149*4887Schin extern const char e_lexzerobyte[]; 150*4887Schin extern const char e_lexemptyfor[]; 151*4887Schin #endif 152