| 1 | /* $Header: /p/tcsh/cvsroot/tcsh/sh.char.h,v 3.35 2008/09/25 14:41:34 christos Exp $ */ |
| 2 | /* |
| 3 | * sh.char.h: Table for spotting special characters quickly |
| 4 | * Makes for very obscure but efficient coding. |
| 5 | */ |
| 6 | /*- |
| 7 | * Copyright (c) 1980, 1991 The Regents of the University of California. |
| 8 | * All rights reserved. |
| 9 | * |
| 10 | * Redistribution and use in source and binary forms, with or without |
| 11 | * modification, are permitted provided that the following conditions |
| 12 | * are met: |
| 13 | * 1. Redistributions of source code must retain the above copyright |
| 14 | * notice, this list of conditions and the following disclaimer. |
| 15 | * 2. Redistributions in binary form must reproduce the above copyright |
| 16 | * notice, this list of conditions and the following disclaimer in the |
| 17 | * documentation and/or other materials provided with the distribution. |
| 18 | * 3. Neither the name of the University nor the names of its contributors |
| 19 | * may be used to endorse or promote products derived from this software |
| 20 | * without specific prior written permission. |
| 21 | * |
| 22 | * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND |
| 23 | * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
| 24 | * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE |
| 25 | * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE |
| 26 | * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL |
| 27 | * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS |
| 28 | * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) |
| 29 | * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT |
| 30 | * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY |
| 31 | * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF |
| 32 | * SUCH DAMAGE. |
| 33 | */ |
| 34 | #ifndef _h_sh_char |
| 35 | #define _h_sh_char |
| 36 | #if defined(NeXT) && defined(NLS) |
| 37 | # include <appkit/NXCType.h> |
| 38 | #else |
| 39 | # include <ctype.h> |
| 40 | # ifdef WIDE_STRINGS |
| 41 | # ifdef HAVE_WCTYPE_H |
| 42 | # include <wctype.h> |
| 43 | # else |
| 44 | # include <wchar.h> |
| 45 | # endif |
| 46 | # endif |
| 47 | #endif |
| 48 | |
| 49 | typedef unsigned char tcshuc; |
| 50 | #ifdef _MINIX |
| 51 | # undef _SP |
| 52 | #endif /* _MINIX */ |
| 53 | extern unsigned short _cmap[]; |
| 54 | #if defined(DSPMBYTE) |
| 55 | # define CHECK_MBYTEVAR STRdspmbyte |
| 56 | #endif |
| 57 | extern unsigned short _cmap_c[]; |
| 58 | extern unsigned short _cmap_mbyte[]; |
| 59 | extern short _enable_mbdisp; |
| 60 | extern unsigned short _mbmap[]; |
| 61 | extern unsigned short _mbmap_euc[]; |
| 62 | extern unsigned short _mbmap_sjis[]; |
| 63 | extern unsigned short _mbmap_big5[]; |
| 64 | extern unsigned short _mbmap_utf8[]; |
| 65 | /* VARIABLE Check str */ |
| 66 | /* same compiler require #define even not define DSPMBYTE */ |
| 67 | #undef _MB1 |
| 68 | #define _MB1 0x0001 |
| 69 | #undef _MB2 |
| 70 | #define _MB2 0x0002 |
| 71 | |
| 72 | #ifndef NLS |
| 73 | extern tcshuc _cmap_lower[], _cmap_upper[]; |
| 74 | |
| 75 | #endif |
| 76 | |
| 77 | #ifndef __QNXNTO__ |
| 78 | #undef _QF |
| 79 | #define _QF 0x0001 /* '" (Forward quotes) */ |
| 80 | #undef _QB |
| 81 | #define _QB 0x0002 /* ` (Backquote) */ |
| 82 | #undef _SP |
| 83 | #define _SP 0x0004 /* space and tab */ |
| 84 | #else |
| 85 | #undef _XD |
| 86 | #define _XD 0x0001 /* As in <ctype.h> */ |
| 87 | #undef _UP |
| 88 | #define _UP 0x0002 /* As in <ctype.h> */ |
| 89 | #undef _SP |
| 90 | #define _SP 0x0004 /* As in <ctype.h> */ |
| 91 | #endif |
| 92 | #undef _NL |
| 93 | #define _NL 0x0008 /* \n */ |
| 94 | #undef _META |
| 95 | #define _META 0x0010 /* lex meta characters, sp #'`";&<>()|\t\n */ |
| 96 | #undef _GLOB |
| 97 | #define _GLOB 0x0020 /* glob characters, *?{[` */ |
| 98 | #undef _ESC |
| 99 | #define _ESC 0x0040 /* \ */ |
| 100 | #undef _DOL |
| 101 | #define _DOL 0x0080 /* $ */ |
| 102 | #undef _DIG |
| 103 | #define _DIG 0x0100 /* 0-9 */ |
| 104 | #undef _LET |
| 105 | #define _LET 0x0200 /* a-z, A-Z, _, or locale-specific */ |
| 106 | #ifndef __QNXNTO__ |
| 107 | #undef _UP |
| 108 | #define _UP 0x0400 /* A-Z, or locale-specific */ |
| 109 | #else |
| 110 | #undef _QF |
| 111 | #define _QF 0x0400 /* '" (Forward quotes) */ |
| 112 | #endif |
| 113 | #undef _DOW |
| 114 | #define _DOW 0x0800 /* a-z, or locale-specific */ |
| 115 | #ifndef __QNXNTO__ |
| 116 | #undef _XD |
| 117 | #define _XD 0x1000 /* 0-9, a-f, A-F */ |
| 118 | #else |
| 119 | #undef _QB |
| 120 | #define _QB 0x1000 /* 0-9, a-f, A-F */ |
| 121 | #endif |
| 122 | #undef _CMD |
| 123 | #define _CMD 0x2000 /* lex end of command chars, ;&(|` */ |
| 124 | #undef _CTR |
| 125 | #define _CTR 0x4000 /* control */ |
| 126 | #undef _PUN |
| 127 | #define _PUN 0x8000 /* punctuation */ |
| 128 | |
| 129 | #ifdef IS_ASCII |
| 130 | # define ASC(ch) (ch) |
| 131 | # define CTL_ESC(ch) (ch) |
| 132 | #else |
| 133 | # ifdef _OSD_POSIX |
| 134 | /* "BS2000 OSD" is a POSIX on a main frame using a EBCDIC char set */ |
| 135 | # include <ascii_ebcdic.h> |
| 136 | # else |
| 137 | /* "OS/390 USS" is a POSIX on a main frame using an IBM1047 char set */ |
| 138 | # endif |
| 139 | extern unsigned short _toascii[256]; |
| 140 | extern unsigned short _toebcdic[256]; |
| 141 | |
| 142 | /* mainly for comparisons if (ASC(ch)=='\177')... */ |
| 143 | # define ASC(ch) _toascii[(tcshuc)(ch)] |
| 144 | |
| 145 | /* Literal escapes ('\010') must be mapped to EBCDIC, |
| 146 | * for C-Escapes ('\b'), the compiler already does it. |
| 147 | */ |
| 148 | # define CTL_ESC(ch) _toebcdic[(tcshuc)(ch)] |
| 149 | #endif /*IS_ASCII*/ |
| 150 | |
| 151 | #ifdef WIDE_STRINGS |
| 152 | # define cmap(c, bits) \ |
| 153 | (((c) < 0) ? 0 : \ |
| 154 | ((c) & QUOTE) || (c) >= 0x0080 ? 0 : (_cmap[(tcshuc)ASC(c)] & (bits))) |
| 155 | #elif defined(SHORT_STRINGS) && defined(KANJI) |
| 156 | # define cmap(c, bits) \ |
| 157 | (((c) < 0) ? 0 : \ |
| 158 | (((c) & QUOTE) || ((ASC(c) & 0x80) && adrof(STRnokanji))) ? \ |
| 159 | 0 : (_cmap[(tcshuc)ASC(c)] & (bits))) |
| 160 | #else /* SHORT_STRINGS && KANJI */ |
| 161 | # define cmap(c, bits) \ |
| 162 | (((c) < 0) ? 0 : \ |
| 163 | ((c) & QUOTE) ? 0 : (_cmap[(tcshuc)ASC(c)] & (bits))) |
| 164 | #endif /* SHORT_STRINGS && KANJI */ |
| 165 | |
| 166 | #define isglob(c) cmap((c), _GLOB) |
| 167 | #define isspc(c) cmap((c), _SP) |
| 168 | #define ismeta(c) cmap((c), _META) |
| 169 | #define iscmdmeta(c) cmap((c), _CMD) |
| 170 | #ifdef WIDE_STRINGS |
| 171 | #define letter(c) (((c) & QUOTE) ? 0 : \ |
| 172 | (iswalpha((tcshuc) (c)) || (c) == '_')) |
| 173 | #define alnum(c) (((c) & QUOTE) ? 0 : \ |
| 174 | (iswalnum((tcshuc) (c)) || (c) == '_')) |
| 175 | #else |
| 176 | #define letter(c) (((Char)(c) & QUOTE) ? 0 : \ |
| 177 | ((isalpha((tcshuc) (c)) && !(cmap((c), _PUN))) \ |
| 178 | || (c) == '_')) |
| 179 | #define alnum(c) (((Char)(c) & QUOTE) ? 0 : \ |
| 180 | ((isalnum((tcshuc) (c)) && !(cmap((c), _PUN))) \ |
| 181 | || (c) == '_')) |
| 182 | |
| 183 | #endif |
| 184 | |
| 185 | #if defined(DSPMBYTE) |
| 186 | # define IsmbyteU(c) (Ismbyte1((Char)(c))||(Ismbyte2((Char)(c))&&((c)&0200))) |
| 187 | #endif |
| 188 | |
| 189 | #ifdef NLS |
| 190 | # ifdef WIDE_STRINGS |
| 191 | # define Isspace(c) (((c) & QUOTE) ? 0 : iswspace(c)) |
| 192 | # define Isdigit(c) (((c) & QUOTE) ? 0 : iswdigit(c)) |
| 193 | # define Isalpha(c) (((c) & QUOTE) ? 0 : iswalpha(c)) |
| 194 | # define Islower(c) (((c) & QUOTE) ? 0 : iswlower(c)) |
| 195 | # define Isupper(c) (((c) & QUOTE) ? 0 : iswupper(c)) |
| 196 | # define Tolower(c) (((c) & QUOTE) ? 0 : (wchar_t)towlower(c)) |
| 197 | # define Toupper(c) (((c) & QUOTE) ? 0 : (wchar_t)towupper(c)) |
| 198 | # define Isxdigit(c) (((c) & QUOTE) ? 0 : iswxdigit(c)) |
| 199 | # define Isalnum(c) (((c) & QUOTE) ? 0 : iswalnum(c)) |
| 200 | # define Iscntrl(c) (((c) & QUOTE) ? 0 : iswcntrl(c)) |
| 201 | # define Isprint(c) (((c) & QUOTE) ? 0 : iswprint(c)) |
| 202 | # define Ispunct(c) (((c) & QUOTE) ? 0 : iswpunct(c)) |
| 203 | # elif defined (NeXT) |
| 204 | # define Isspace(c) (((Char)(c) & QUOTE) ? 0 : NXIsSpace((unsigned) (c))) |
| 205 | # define Isdigit(c) (((Char)(c) & QUOTE) ? 0 : NXIsDigit((unsigned) (c))) |
| 206 | # define Isalpha(c) (((Char)(c) & QUOTE) ? 0 : NXIsAlpha((unsigned) (c))) |
| 207 | # define Islower(c) (((Char)(c) & QUOTE) ? 0 : NXIsLower((unsigned) (c))) |
| 208 | # define Isupper(c) (((Char)(c) & QUOTE) ? 0 : NXIsUpper((unsigned) (c))) |
| 209 | # define Tolower(c) (((Char)(c) & QUOTE) ? 0 : NXToLower((unsigned) (c))) |
| 210 | # define Toupper(c) (((Char)(c) & QUOTE) ? 0 : NXToUpper((unsigned) (c))) |
| 211 | # define Isxdigit(c) (((Char)(c) & QUOTE) ? 0 : NXIsXDigit((unsigned) (c))) |
| 212 | #if defined(DSPMBYTE) |
| 213 | # define IscntrlM(c) (((Char)(c) & QUOTE) ? 0 : NXIsCntrl((unsigned) (c))) |
| 214 | # define Iscntrl(c) ( (IscntrlM(c)) && !(_enable_mbdisp&&(IsmbyteU((c)))) ) |
| 215 | # define IsprintM(c) (((Char)(c) & QUOTE) ? 0 : NXIsPrint((unsigned) (c))) |
| 216 | # define Isprint(c) ( (IsprintM(c)) || (_enable_mbdisp&&(IsmbyteU((c)))) ) |
| 217 | #else |
| 218 | # define Isalnum(c) (((Char)(c) & QUOTE) ? 0 : NXIsAlNum((unsigned) (c))) |
| 219 | # define Iscntrl(c) (((Char)(c) & QUOTE) ? 0 : NXIsCntrl((unsigned) (c))) |
| 220 | # define Isprint(c) (((Char)(c) & QUOTE) ? 0 : NXIsPrint((unsigned) (c))) |
| 221 | #endif /* !defined(DSPMBYTE) */ |
| 222 | # define Ispunct(c) (((Char)(c) & QUOTE) ? 0 : NXIsPunct((unsigned) (c))) |
| 223 | # else /* !NeXT */ |
| 224 | # ifndef WINNT_NATIVE |
| 225 | # define Isspace(c) (((Char)(c) & QUOTE) ? 0 : isspace((tcshuc) (c))) |
| 226 | # define Isdigit(c) (((Char)(c) & QUOTE) ? 0 : isdigit((tcshuc) (c))) |
| 227 | # define Isalpha(c) (((Char)(c) & QUOTE) ? 0 : isalpha((tcshuc) (c))) |
| 228 | # define Islower(c) (((Char)(c) & QUOTE) ? 0 : islower((tcshuc) (c))) |
| 229 | # define Isupper(c) (((Char)(c) & QUOTE) ? 0 : isupper((tcshuc) (c))) |
| 230 | # define Tolower(c) (((Char)(c) & QUOTE) ? 0 : tolower((tcshuc) (c))) |
| 231 | # define Toupper(c) (((Char)(c) & QUOTE) ? 0 : toupper((tcshuc) (c))) |
| 232 | # define Isxdigit(c) (((Char)(c) & QUOTE) ? 0 : isxdigit((tcshuc) (c))) |
| 233 | # define Isalnum(c) (((Char)(c) & QUOTE) ? 0 : isalnum((tcshuc) (c))) |
| 234 | #if defined(DSPMBYTE) |
| 235 | # define IscntrlM(c) (((Char)(c) & QUOTE) ? 0 : iscntrl((tcshuc) (c))) |
| 236 | # define Iscntrl(c) ( (IscntrlM(c)) && !(_enable_mbdisp&&(IsmbyteU((c)))) ) |
| 237 | #else |
| 238 | # define Iscntrl(c) (((Char)(c) & QUOTE) ? 0 : iscntrl((tcshuc) (c))) |
| 239 | #endif /* !defined(DSPMBYTE) */ |
| 240 | # if SOLARIS2 == 24 |
| 241 | /* |
| 242 | * From <casper@fwi.uva.nl> Casper Dik: |
| 243 | * In Solaris 2.4, isprint('\t') returns true after setlocal(LC_ALL,""). |
| 244 | * This breaks commandline editing when you include tabs. |
| 245 | * (This is in the en_US locale). |
| 246 | */ |
| 247 | #if defined(DSPMBYTE) |
| 248 | # define IsprintM(c) (((Char)(c) & QUOTE) ? 0 : \ |
| 249 | (isprint((tcshuc) (c)) && (c) != '\t')) |
| 250 | #else |
| 251 | # define Isprint(c) (((Char)(c) & QUOTE) ? 0 : \ |
| 252 | (isprint((tcshuc) (c)) && (c) != '\t')) |
| 253 | #endif /* !defined(DSPMBYTE) */ |
| 254 | # else |
| 255 | #if defined(DSPMBYTE) |
| 256 | # define IsprintM(c) (((Char)(c) & QUOTE) ? 0 : isprint((tcshuc) (c))) |
| 257 | #else |
| 258 | # define Isprint(c) (((Char)(c) & QUOTE) ? 0 : isprint((tcshuc) (c))) |
| 259 | #endif /* !defined(DSPMBYTE) */ |
| 260 | # endif /* SOLARIS2 == 24 */ |
| 261 | #if defined(DSPMBYTE) |
| 262 | # define Isprint(c) ( (IsprintM(c)) || (_enable_mbdisp&&(IsmbyteU((c)))) ) |
| 263 | #endif /* !defined(DSPMBYTE) */ |
| 264 | # define Ispunct(c) (((Char)(c) & QUOTE) ? 0 : ispunct((tcshuc) (c))) |
| 265 | # else /* WINNT_NATIVE */ |
| 266 | # define Isspace(c) (((Char)(c) & QUOTE) ? 0 : isspace( oem_it((tcshuc)(c)))) |
| 267 | # define Isdigit(c) (((Char)(c) & QUOTE) ? 0 : isdigit( oem_it((tcshuc)(c)))) |
| 268 | # define Isalpha(c) (((Char)(c) & QUOTE) ? 0 : isalpha( oem_it((tcshuc)(c)))) |
| 269 | # define Islower(c) (((Char)(c) & QUOTE) ? 0 : islower( oem_it((tcshuc)(c)))) |
| 270 | # define Isupper(c) (((Char)(c) & QUOTE) ? 0 : isupper( oem_it((tcshuc)(c)))) |
| 271 | # define Tolower(c) (((Char)(c) & QUOTE) ? 0 : tolower( oem_it((tcshuc)(c)))) |
| 272 | # define Toupper(c) (((Char)(c) & QUOTE) ? 0 : toupper( oem_it((tcshuc)(c)))) |
| 273 | # define Isxdigit(c)(((Char)(c) & QUOTE) ? 0 : isxdigit(oem_it((tcshuc)(c)))) |
| 274 | # define Isalnum(c) (((Char)(c) & QUOTE) ? 0 : isalnum( oem_it((tcshuc)(c)))) |
| 275 | # define Ispunct(c) (((Char)(c) & QUOTE) ? 0 : ispunct( oem_it((tcshuc)(c)))) |
| 276 | #if defined(DSPMBYTE) |
| 277 | # define IscntrlM(c) (((Char)(c) & QUOTE) ? 0 : iscntrl( oem_it((tcshuc)(c)))) |
| 278 | # define Iscntrl(c) ( (IscntrlM(c)) && !(_enable_mbdisp&&(IsmbyteU((c)))) ) |
| 279 | # define IsprintM(c) (((Char)(c) & QUOTE) ? 0 : isprint( oem_it((tcshuc)(c)))) |
| 280 | # define Isprint(c) ( (IsprintM(c)) || (_enable_mbdisp&&(IsmbyteU((c)))) ) |
| 281 | #else |
| 282 | # define Iscntrl(c) (((Char)(c) & QUOTE) ? 0 : iscntrl( oem_it((tcshuc)(c)))) |
| 283 | # define Isprint(c) (((Char)(c) & QUOTE) ? 0 : isprint( oem_it((tcshuc)(c)))) |
| 284 | #endif /* !defined(DSPMBYTE) */ |
| 285 | # endif /* WINNT_NATIVE */ |
| 286 | # endif /* !NeXT */ |
| 287 | #else /* !NLS */ |
| 288 | # define Isspace(c) cmap((c), _SP|_NL) |
| 289 | # define Isdigit(c) cmap((c), _DIG) |
| 290 | # define Isalpha(c) (cmap((c),_LET) && !(((c) & META) && AsciiOnly)) |
| 291 | # define Islower(c) (cmap((c),_DOW) && !(((c) & META) && AsciiOnly)) |
| 292 | # define Isupper(c) (cmap((c), _UP) && !(((c) & META) && AsciiOnly)) |
| 293 | # define Tolower(c) (_cmap_lower[ASC(c)]) |
| 294 | # define Toupper(c) (_cmap_upper[ASC(c)]) |
| 295 | # define Isxdigit(c) cmap((c), _XD) |
| 296 | # define Isalnum(c) (cmap((c), _DIG|_LET) && !(((Char)(c) & META) && AsciiOnly)) |
| 297 | #if defined(DSPMBYTE) |
| 298 | # define IscntrlM(c) (cmap((c),_CTR) && !(((c) & META) && AsciiOnly)) |
| 299 | # define Iscntrl(c) ( (IscntrlM(c)) && !(_enable_mbdisp&&(IsmbyteU((c)))) ) |
| 300 | # define IsprintM(c) (!cmap((c),_CTR) && !(((c) & META) && AsciiOnly)) |
| 301 | # define Isprint(c) ( (IsprintM(c)) || (_enable_mbdisp&&(IsmbyteU((c)))) ) |
| 302 | #else |
| 303 | # define Iscntrl(c) (cmap((c),_CTR) && !(((c) & META) && AsciiOnly)) |
| 304 | # define Isprint(c) (!cmap((c),_CTR) && !(((c) & META) && AsciiOnly)) |
| 305 | #endif /* !defined(DSPMBYTE) */ |
| 306 | # define Ispunct(c) (cmap((c),_PUN) && !(((c) & META) && AsciiOnly)) |
| 307 | |
| 308 | #endif /* !NLS */ |
| 309 | |
| 310 | #if defined(DSPMBYTE) |
| 311 | # define Ismbyte1(c) ((_mbmap[(c) & 0377] & _MB1) ? 1 : 0) |
| 312 | # define Ismbyte2(c) ((_mbmap[(c) & 0377] & _MB2) ? 1 : 0) |
| 313 | #endif |
| 314 | |
| 315 | #endif /* _h_sh_char */ |