/*============================================================================= Copyright (c) 2001-2011 Hartmut Kaiser Copyright (c) 2001-2011 Joel de Guzman Distributed under the Boost Software License, Version 1.0. (See accompanying file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt) =============================================================================*/ #if !defined(BOOST_SPIRIT_ISO8859_1_APRIL_26_2006_1106PM) #define BOOST_SPIRIT_ISO8859_1_APRIL_26_2006_1106PM #if defined(_MSC_VER) #pragma once #endif #include #include #include /////////////////////////////////////////////////////////////////////////////// // constants used to classify the single characters /////////////////////////////////////////////////////////////////////////////// #define BOOST_CC_DIGIT 0x0001 #define BOOST_CC_XDIGIT 0x0002 #define BOOST_CC_ALPHA 0x0004 #define BOOST_CC_CTRL 0x0008 #define BOOST_CC_LOWER 0x0010 #define BOOST_CC_UPPER 0x0020 #define BOOST_CC_SPACE 0x0040 #define BOOST_CC_PUNCT 0x0080 namespace boost { namespace spirit { namespace char_encoding { // The detection of isgraph(), isprint() and isblank() is done programmatically // to keep the character type table small. Additionally, these functions are // rather seldom used and the programmatic detection is very simple. /////////////////////////////////////////////////////////////////////////// // ISO 8859-1 character classification table // // the comments intentionally contain non-ascii characters // boostinspect:noascii /////////////////////////////////////////////////////////////////////////// const unsigned char iso8859_1_char_types[] = { /* NUL 0 0 */ BOOST_CC_CTRL, /* SOH 1 1 */ BOOST_CC_CTRL, /* STX 2 2 */ BOOST_CC_CTRL, /* ETX 3 3 */ BOOST_CC_CTRL, /* EOT 4 4 */ BOOST_CC_CTRL, /* ENQ 5 5 */ BOOST_CC_CTRL, /* ACK 6 6 */ BOOST_CC_CTRL, /* BEL 7 7 */ BOOST_CC_CTRL, /* BS 8 8 */ BOOST_CC_CTRL, /* HT 9 9 */ BOOST_CC_CTRL|BOOST_CC_SPACE, /* NL 10 a */ BOOST_CC_CTRL|BOOST_CC_SPACE, /* VT 11 b */ BOOST_CC_CTRL|BOOST_CC_SPACE, /* NP 12 c */ BOOST_CC_CTRL|BOOST_CC_SPACE, /* CR 13 d */ BOOST_CC_CTRL|BOOST_CC_SPACE, /* SO 14 e */ BOOST_CC_CTRL, /* SI 15 f */ BOOST_CC_CTRL, /* DLE 16 10 */ BOOST_CC_CTRL, /* DC1 17 11 */ BOOST_CC_CTRL, /* DC2 18 12 */ BOOST_CC_CTRL, /* DC3 19 13 */ BOOST_CC_CTRL, /* DC4 20 14 */ BOOST_CC_CTRL, /* NAK 21 15 */ BOOST_CC_CTRL, /* SYN 22 16 */ BOOST_CC_CTRL, /* ETB 23 17 */ BOOST_CC_CTRL, /* CAN 24 18 */ BOOST_CC_CTRL, /* EM 25 19 */ BOOST_CC_CTRL, /* SUB 26 1a */ BOOST_CC_CTRL, /* ESC 27 1b */ BOOST_CC_CTRL, /* FS 28 1c */ BOOST_CC_CTRL, /* GS 29 1d */ BOOST_CC_CTRL, /* RS 30 1e */ BOOST_CC_CTRL, /* US 31 1f */ BOOST_CC_CTRL, /* SP 32 20 */ BOOST_CC_SPACE, /* ! 33 21 */ BOOST_CC_PUNCT, /* " 34 22 */ BOOST_CC_PUNCT, /* # 35 23 */ BOOST_CC_PUNCT, /* $ 36 24 */ BOOST_CC_PUNCT, /* % 37 25 */ BOOST_CC_PUNCT, /* & 38 26 */ BOOST_CC_PUNCT, /* ' 39 27 */ BOOST_CC_PUNCT, /* ( 40 28 */ BOOST_CC_PUNCT, /* ) 41 29 */ BOOST_CC_PUNCT, /* * 42 2a */ BOOST_CC_PUNCT, /* + 43 2b */ BOOST_CC_PUNCT, /* , 44 2c */ BOOST_CC_PUNCT, /* - 45 2d */ BOOST_CC_PUNCT, /* . 46 2e */ BOOST_CC_PUNCT, /* / 47 2f */ BOOST_CC_PUNCT, /* 0 48 30 */ BOOST_CC_DIGIT|BOOST_CC_XDIGIT, /* 1 49 31 */ BOOST_CC_DIGIT|BOOST_CC_XDIGIT, /* 2 50 32 */ BOOST_CC_DIGIT|BOOST_CC_XDIGIT, /* 3 51 33 */ BOOST_CC_DIGIT|BOOST_CC_XDIGIT, /* 4 52 34 */ BOOST_CC_DIGIT|BOOST_CC_XDIGIT, /* 5 53 35 */ BOOST_CC_DIGIT|BOOST_CC_XDIGIT, /* 6 54 36 */ BOOST_CC_DIGIT|BOOST_CC_XDIGIT, /* 7 55 37 */ BOOST_CC_DIGIT|BOOST_CC_XDIGIT, /* 8 56 38 */ BOOST_CC_DIGIT|BOOST_CC_XDIGIT, /* 9 57 39 */ BOOST_CC_DIGIT|BOOST_CC_XDIGIT, /* : 58 3a */ BOOST_CC_PUNCT, /* ; 59 3b */ BOOST_CC_PUNCT, /* < 60 3c */ BOOST_CC_PUNCT, /* = 61 3d */ BOOST_CC_PUNCT, /* > 62 3e */ BOOST_CC_PUNCT, /* ? 63 3f */ BOOST_CC_PUNCT, /* @ 64 40 */ BOOST_CC_PUNCT, /* A 65 41 */ BOOST_CC_ALPHA|BOOST_CC_XDIGIT|BOOST_CC_UPPER, /* B 66 42 */ BOOST_CC_ALPHA|BOOST_CC_XDIGIT|BOOST_CC_UPPER, /* C 67 43 */ BOOST_CC_ALPHA|BOOST_CC_XDIGIT|BOOST_CC_UPPER, /* D 68 44 */ BOOST_CC_ALPHA|BOOST_CC_XDIGIT|BOOST_CC_UPPER, /* E 69 45 */ BOOST_CC_ALPHA|BOOST_CC_XDIGIT|BOOST_CC_UPPER, /* F 70 46 */ BOOST_CC_ALPHA|BOOST_CC_XDIGIT|BOOST_CC_UPPER, /* G 71 47 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* H 72 48 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* I 73 49 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* J 74 4a */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* K 75 4b */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* L 76 4c */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* M 77 4d */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* N 78 4e */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* O 79 4f */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* P 80 50 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Q 81 51 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* R 82 52 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* S 83 53 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* T 84 54 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* U 85 55 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* V 86 56 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* W 87 57 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* X 88 58 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Y 89 59 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Z 90 5a */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* [ 91 5b */ BOOST_CC_PUNCT, /* \ 92 5c */ BOOST_CC_PUNCT, /* ] 93 5d */ BOOST_CC_PUNCT, /* ^ 94 5e */ BOOST_CC_PUNCT, /* _ 95 5f */ BOOST_CC_PUNCT, /* ` 96 60 */ BOOST_CC_PUNCT, /* a 97 61 */ BOOST_CC_ALPHA|BOOST_CC_XDIGIT|BOOST_CC_LOWER, /* b 98 62 */ BOOST_CC_ALPHA|BOOST_CC_XDIGIT|BOOST_CC_LOWER, /* c 99 63 */ BOOST_CC_ALPHA|BOOST_CC_XDIGIT|BOOST_CC_LOWER, /* d 100 64 */ BOOST_CC_ALPHA|BOOST_CC_XDIGIT|BOOST_CC_LOWER, /* e 101 65 */ BOOST_CC_ALPHA|BOOST_CC_XDIGIT|BOOST_CC_LOWER, /* f 102 66 */ BOOST_CC_ALPHA|BOOST_CC_XDIGIT|BOOST_CC_LOWER, /* g 103 67 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* h 104 68 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* i 105 69 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* j 106 6a */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* k 107 6b */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* l 108 6c */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* m 109 6d */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* n 110 6e */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* o 111 6f */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* p 112 70 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* q 113 71 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* r 114 72 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* s 115 73 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* t 116 74 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* u 117 75 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* v 118 76 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* w 119 77 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* x 120 78 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* y 121 79 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* z 122 7a */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* { 123 7b */ BOOST_CC_PUNCT, /* | 124 7c */ BOOST_CC_PUNCT, /* } 125 7d */ BOOST_CC_PUNCT, /* ~ 126 7e */ BOOST_CC_PUNCT, /* DEL 127 7f */ BOOST_CC_CTRL, /* -- 128 80 */ BOOST_CC_CTRL, /* -- 129 81 */ BOOST_CC_CTRL, /* -- 130 82 */ BOOST_CC_CTRL, /* -- 131 83 */ BOOST_CC_CTRL, /* -- 132 84 */ BOOST_CC_CTRL, /* -- 133 85 */ BOOST_CC_CTRL, /* -- 134 86 */ BOOST_CC_CTRL, /* -- 135 87 */ BOOST_CC_CTRL, /* -- 136 88 */ BOOST_CC_CTRL, /* -- 137 89 */ BOOST_CC_CTRL, /* -- 138 8a */ BOOST_CC_CTRL, /* -- 139 8b */ BOOST_CC_CTRL, /* -- 140 8c */ BOOST_CC_CTRL, /* -- 141 8d */ BOOST_CC_CTRL, /* -- 142 8e */ BOOST_CC_CTRL, /* -- 143 8f */ BOOST_CC_CTRL, /* -- 144 90 */ BOOST_CC_CTRL, /* -- 145 91 */ BOOST_CC_CTRL, /* -- 146 92 */ BOOST_CC_CTRL, /* -- 147 93 */ BOOST_CC_CTRL, /* -- 148 94 */ BOOST_CC_CTRL, /* -- 149 95 */ BOOST_CC_CTRL, /* -- 150 96 */ BOOST_CC_CTRL, /* -- 151 97 */ BOOST_CC_CTRL, /* -- 152 98 */ BOOST_CC_CTRL, /* -- 153 99 */ BOOST_CC_CTRL, /* -- 154 9a */ BOOST_CC_CTRL, /* -- 155 9b */ BOOST_CC_CTRL, /* -- 156 9c */ BOOST_CC_CTRL, /* -- 157 9d */ BOOST_CC_CTRL, /* -- 158 9e */ BOOST_CC_CTRL, /* -- 159 9f */ BOOST_CC_CTRL, /* 160 a0 */ BOOST_CC_SPACE, /* ¡ 161 a1 */ BOOST_CC_PUNCT, /* ¢ 162 a2 */ BOOST_CC_PUNCT, /* £ 163 a3 */ BOOST_CC_PUNCT, /* ¤ 164 a4 */ BOOST_CC_PUNCT, /* ¥ 165 a5 */ BOOST_CC_PUNCT, /* ¦ 166 a6 */ BOOST_CC_PUNCT, /* § 167 a7 */ BOOST_CC_PUNCT, /* ¨ 168 a8 */ BOOST_CC_PUNCT, /* © 169 a9 */ BOOST_CC_PUNCT, /* ª 170 aa */ BOOST_CC_PUNCT, /* « 171 ab */ BOOST_CC_PUNCT, /* ¬ 172 ac */ BOOST_CC_PUNCT, /* ­ 173 ad */ BOOST_CC_PUNCT, /* ® 174 ae */ BOOST_CC_PUNCT, /* ¯ 175 af */ BOOST_CC_PUNCT, /* ° 176 b0 */ BOOST_CC_PUNCT, /* ± 177 b1 */ BOOST_CC_PUNCT, /* ² 178 b2 */ BOOST_CC_DIGIT|BOOST_CC_PUNCT, /* ³ 179 b3 */ BOOST_CC_DIGIT|BOOST_CC_PUNCT, /* ´ 180 b4 */ BOOST_CC_PUNCT, /* µ 181 b5 */ BOOST_CC_PUNCT, /* ¶ 182 b6 */ BOOST_CC_PUNCT, /* · 183 b7 */ BOOST_CC_PUNCT, /* ¸ 184 b8 */ BOOST_CC_PUNCT, /* ¹ 185 b9 */ BOOST_CC_DIGIT|BOOST_CC_PUNCT, /* º 186 ba */ BOOST_CC_PUNCT, /* » 187 bb */ BOOST_CC_PUNCT, /* ¼ 188 bc */ BOOST_CC_PUNCT, /* ½ 189 bd */ BOOST_CC_PUNCT, /* ¾ 190 be */ BOOST_CC_PUNCT, /* ¿ 191 bf */ BOOST_CC_PUNCT, /* À 192 c0 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Á 193 c1 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Â 194 c2 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Ã 195 c3 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Ä 196 c4 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Å 197 c5 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Æ 198 c6 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Ç 199 c7 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* È 200 c8 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* É 201 c9 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Ê 202 ca */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Ë 203 cb */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Ì 204 cc */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Í 205 cd */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Î 206 ce */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Ï 207 cf */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Ð 208 d0 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Ñ 209 d1 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Ò 210 d2 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Ó 211 d3 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Ô 212 d4 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Õ 213 d5 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Ö 214 d6 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* × 215 d7 */ BOOST_CC_PUNCT, /* Ø 216 d8 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Ù 217 d9 */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Ú 218 da */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Û 219 db */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Ü 220 dc */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Ý 221 dd */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* Þ 222 de */ BOOST_CC_ALPHA|BOOST_CC_UPPER, /* ß 223 df */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* à 224 e0 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* á 225 e1 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* â 226 e2 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ã 227 e3 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ä 228 e4 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* å 229 e5 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* æ 230 e6 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ç 231 e7 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* è 232 e8 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* é 233 e9 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ê 234 ea */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ë 235 eb */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ì 236 ec */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* í 237 ed */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* î 238 ee */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ï 239 ef */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ð 240 f0 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ñ 241 f1 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ò 242 f2 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ó 243 f3 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ô 244 f4 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* õ 245 f5 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ö 246 f6 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ÷ 247 f7 */ BOOST_CC_PUNCT, /* ø 248 f8 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ù 249 f9 */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ú 250 fa */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* û 251 fb */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ü 252 fc */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ý 253 fd */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* þ 254 fe */ BOOST_CC_ALPHA|BOOST_CC_LOWER, /* ÿ 255 ff */ BOOST_CC_ALPHA|BOOST_CC_LOWER, }; /////////////////////////////////////////////////////////////////////////// // ISO 8859-1 character conversion table /////////////////////////////////////////////////////////////////////////// const unsigned char iso8859_1_char_conversion[] = { /* NUL 0 0 */ '\0', /* SOH 1 1 */ '\0', /* STX 2 2 */ '\0', /* ETX 3 3 */ '\0', /* EOT 4 4 */ '\0', /* ENQ 5 5 */ '\0', /* ACK 6 6 */ '\0', /* BEL 7 7 */ '\0', /* BS 8 8 */ '\0', /* HT 9 9 */ '\0', /* NL 10 a */ '\0', /* VT 11 b */ '\0', /* NP 12 c */ '\0', /* CR 13 d */ '\0', /* SO 14 e */ '\0', /* SI 15 f */ '\0', /* DLE 16 10 */ '\0', /* DC1 17 11 */ '\0', /* DC2 18 12 */ '\0', /* DC3 19 13 */ '\0', /* DC4 20 14 */ '\0', /* NAK 21 15 */ '\0', /* SYN 22 16 */ '\0', /* ETB 23 17 */ '\0', /* CAN 24 18 */ '\0', /* EM 25 19 */ '\0', /* SUB 26 1a */ '\0', /* ESC 27 1b */ '\0', /* FS 28 1c */ '\0', /* GS 29 1d */ '\0', /* RS 30 1e */ '\0', /* US 31 1f */ '\0', /* SP 32 20 */ '\0', /* ! 33 21 */ '\0', /* " 34 22 */ '\0', /* # 35 23 */ '\0', /* $ 36 24 */ '\0', /* % 37 25 */ '\0', /* & 38 26 */ '\0', /* ' 39 27 */ '\0', /* ( 40 28 */ '\0', /* ) 41 29 */ '\0', /* * 42 2a */ '\0', /* + 43 2b */ '\0', /* , 44 2c */ '\0', /* - 45 2d */ '\0', /* . 46 2e */ '\0', /* / 47 2f */ '\0', /* 0 48 30 */ '\0', /* 1 49 31 */ '\0', /* 2 50 32 */ '\0', /* 3 51 33 */ '\0', /* 4 52 34 */ '\0', /* 5 53 35 */ '\0', /* 6 54 36 */ '\0', /* 7 55 37 */ '\0', /* 8 56 38 */ '\0', /* 9 57 39 */ '\0', /* : 58 3a */ '\0', /* ; 59 3b */ '\0', /* < 60 3c */ '\0', /* = 61 3d */ '\0', /* > 62 3e */ '\0', /* ? 63 3f */ '\0', /* @ 64 40 */ '\0', /* A 65 41 */ 'a', /* B 66 42 */ 'b', /* C 67 43 */ 'c', /* D 68 44 */ 'd', /* E 69 45 */ 'e', /* F 70 46 */ 'f', /* G 71 47 */ 'g', /* H 72 48 */ 'h', /* I 73 49 */ 'i', /* J 74 4a */ 'j', /* K 75 4b */ 'k', /* L 76 4c */ 'l', /* M 77 4d */ 'm', /* N 78 4e */ 'n', /* O 79 4f */ 'o', /* P 80 50 */ 'p', /* Q 81 51 */ 'q', /* R 82 52 */ 'r', /* S 83 53 */ 's', /* T 84 54 */ 't', /* U 85 55 */ 'u', /* V 86 56 */ 'v', /* W 87 57 */ 'w', /* X 88 58 */ 'x', /* Y 89 59 */ 'y', /* Z 90 5a */ 'z', /* [ 91 5b */ '\0', /* \ 92 5c */ '\0', /* ] 93 5d */ '\0', /* ^ 94 5e */ '\0', /* _ 95 5f */ '\0', /* ` 96 60 */ '\0', /* a 97 61 */ 'A', /* b 98 62 */ 'B', /* c 99 63 */ 'C', /* d 100 64 */ 'D', /* e 101 65 */ 'E', /* f 102 66 */ 'F', /* g 103 67 */ 'G', /* h 104 68 */ 'H', /* i 105 69 */ 'I', /* j 106 6a */ 'J', /* k 107 6b */ 'K', /* l 108 6c */ 'L', /* m 109 6d */ 'M', /* n 110 6e */ 'N', /* o 111 6f */ 'O', /* p 112 70 */ 'P', /* q 113 71 */ 'Q', /* r 114 72 */ 'R', /* s 115 73 */ 'S', /* t 116 74 */ 'T', /* u 117 75 */ 'U', /* v 118 76 */ 'V', /* w 119 77 */ 'W', /* x 120 78 */ 'X', /* y 121 79 */ 'Y', /* z 122 7a */ 'Z', /* { 123 7b */ '\0', /* | 124 7c */ '\0', /* } 125 7d */ '\0', /* ~ 126 7e */ '\0', /* DEL 127 7f */ '\0', /* -- 128 80 */ '\0', /* -- 129 81 */ '\0', /* -- 130 82 */ '\0', /* -- 131 83 */ '\0', /* -- 132 84 */ '\0', /* -- 133 85 */ '\0', /* -- 134 86 */ '\0', /* -- 135 87 */ '\0', /* -- 136 88 */ '\0', /* -- 137 89 */ '\0', /* -- 138 8a */ '\0', /* -- 139 8b */ '\0', /* -- 140 8c */ '\0', /* -- 141 8d */ '\0', /* -- 142 8e */ '\0', /* -- 143 8f */ '\0', /* -- 144 90 */ '\0', /* -- 145 91 */ '\0', /* -- 146 92 */ '\0', /* -- 147 93 */ '\0', /* -- 148 94 */ '\0', /* -- 149 95 */ '\0', /* -- 150 96 */ '\0', /* -- 151 97 */ '\0', /* -- 152 98 */ '\0', /* -- 153 99 */ '\0', /* -- 154 9a */ '\0', /* -- 155 9b */ '\0', /* -- 156 9c */ '\0', /* -- 157 9d */ '\0', /* -- 158 9e */ '\0', /* -- 159 9f */ '\0', /* 160 a0 */ '\0', /* ¡ 161 a1 */ '\0', /* ¢ 162 a2 */ '\0', /* £ 163 a3 */ '\0', /* ¤ 164 a4 */ '\0', /* ¥ 165 a5 */ '\0', /* ¦ 166 a6 */ '\0', /* § 167 a7 */ '\0', /* ¨ 168 a8 */ '\0', /* © 169 a9 */ '\0', /* ª 170 aa */ '\0', /* « 171 ab */ '\0', /* ¬ 172 ac */ '\0', /* ­ 173 ad */ '\0', /* ® 174 ae */ '\0', /* ¯ 175 af */ '\0', /* ° 176 b0 */ '\0', /* ± 177 b1 */ '\0', /* ² 178 b2 */ '\0', /* ³ 179 b3 */ '\0', /* ´ 180 b4 */ '\0', /* µ 181 b5 */ '\0', /* ¶ 182 b6 */ '\0', /* · 183 b7 */ '\0', /* ¸ 184 b8 */ '\0', /* ¹ 185 b9 */ '\0', /* º 186 ba */ '\0', /* » 187 bb */ '\0', /* ¼ 188 bc */ '\0', /* ½ 189 bd */ '\0', /* ¾ 190 be */ '\0', /* ¿ 191 bf */ '\0', /* à 192 c0 */ 0xe0, /* á 193 c1 */ 0xe1, /* â 194 c2 */ 0xe2, /* ã 195 c3 */ 0xe3, /* ä 196 c4 */ 0xe4, /* å 197 c5 */ 0xe5, /* æ 198 c6 */ 0xe6, /* ç 199 c7 */ 0xe7, /* è 200 c8 */ 0xe8, /* é 201 c9 */ 0xe9, /* ê 202 ca */ 0xea, /* ë 203 cb */ 0xeb, /* ì 204 cc */ 0xec, /* í 205 cd */ 0xed, /* î 206 ce */ 0xee, /* ï 207 cf */ 0xef, /* ð 208 d0 */ 0xf0, /* ñ 209 d1 */ 0xf1, /* ò 210 d2 */ 0xf2, /* ó 211 d3 */ 0xf3, /* ô 212 d4 */ 0xf4, /* õ 213 d5 */ 0xf5, /* ö 214 d6 */ 0xf6, /* × 215 d7 */ '\0', /* ø 216 d8 */ 0xf8, /* ù 217 d9 */ 0xf9, /* ú 218 da */ 0xfa, /* û 219 db */ 0xfb, /* ü 220 dc */ 0xfc, /* ý 221 dd */ 0xfd, /* þ 222 de */ 0xfe, /* ß 223 df */ '\0', /* À 224 e0 */ 0xc0, /* Á 225 e1 */ 0xc1, /* Â 226 e2 */ 0xc2, /* Ã 227 e3 */ 0xc3, /* Ä 228 e4 */ 0xc4, /* Å 229 e5 */ 0xc5, /* Æ 230 e6 */ 0xc6, /* Ç 231 e7 */ 0xc7, /* È 232 e8 */ 0xc8, /* É 233 e9 */ 0xc9, /* Ê 234 ea */ 0xca, /* Ë 235 eb */ 0xcb, /* Ì 236 ec */ 0xcc, /* Í 237 ed */ 0xcd, /* Î 238 ee */ 0xce, /* Ï 239 ef */ 0xcf, /* Ð 240 f0 */ 0xd0, /* Ñ 241 f1 */ 0xd1, /* Ò 242 f2 */ 0xd2, /* Ó 243 f3 */ 0xd3, /* Ô 244 f4 */ 0xd4, /* Õ 245 f5 */ 0xd5, /* Ö 246 f6 */ 0xd6, /* ÷ 247 f7 */ '\0', /* Ø 248 f8 */ 0xd8, /* Ù 249 f9 */ 0xd9, /* Ú 250 fa */ 0xda, /* Û 251 fb */ 0xdb, /* Ü 252 fc */ 0xdc, /* Ý 253 fd */ 0xdd, /* Þ 254 fe */ 0xde, /* ÿ 255 ff */ '\0', }; /////////////////////////////////////////////////////////////////////////// // Test characters for specified conditions (using iso8859-1) /////////////////////////////////////////////////////////////////////////// struct iso8859_1 { typedef unsigned char char_type; static bool isascii_(int ch) { return 0 == (ch & ~0x7f); } static bool ischar(int ch) { // iso8859.1 uses all 8 bits // we have to watch out for sign extensions return (0 == (ch & ~0xff) || ~0 == (ch | 0xff)) ? true : false; } static int isalnum(int ch) { BOOST_ASSERT(0 == (ch & ~UCHAR_MAX)); return (iso8859_1_char_types[ch] & BOOST_CC_ALPHA) || (iso8859_1_char_types[ch] & BOOST_CC_DIGIT); } static int isalpha(int ch) { BOOST_ASSERT(0 == (ch & ~UCHAR_MAX)); return (iso8859_1_char_types[ch] & BOOST_CC_ALPHA); } static int isdigit(int ch) { BOOST_ASSERT(0 == (ch & ~UCHAR_MAX)); return (iso8859_1_char_types[ch] & BOOST_CC_DIGIT); } static int isxdigit(int ch) { BOOST_ASSERT(0 == (ch & ~UCHAR_MAX)); return (iso8859_1_char_types[ch] & BOOST_CC_XDIGIT); } static int iscntrl(int ch) { BOOST_ASSERT(0 == (ch & ~UCHAR_MAX)); return (iso8859_1_char_types[ch] & BOOST_CC_CTRL); } static int isgraph(int ch) { return ('\x21' <= ch && ch <= '\x7e') || ('\xa1' <= ch && ch <= '\xff'); } static int islower(int ch) { BOOST_ASSERT(0 == (ch & ~UCHAR_MAX)); return (iso8859_1_char_types[ch] & BOOST_CC_LOWER); } static int isprint(int ch) { return ('\x20' <= ch && ch <= '\x7e') || ('\xa0' <= ch && ch <= '\xff'); } static int ispunct(int ch) { BOOST_ASSERT(0 == (ch & ~UCHAR_MAX)); return (iso8859_1_char_types[ch] & BOOST_CC_PUNCT); } static int isspace(int ch) { BOOST_ASSERT(0 == (ch & ~UCHAR_MAX)); return (iso8859_1_char_types[ch] & BOOST_CC_SPACE); } static int isblank BOOST_PREVENT_MACRO_SUBSTITUTION (int ch) { return ('\x09' == ch || '\x20' == ch || '\xa0' == ch); } static int isupper(int ch) { BOOST_ASSERT(0 == (ch & ~UCHAR_MAX)); return (iso8859_1_char_types[ch] & BOOST_CC_UPPER); } /////////////////////////////////////////////////////////////////////////// // Simple character conversions /////////////////////////////////////////////////////////////////////////// static int tolower(int ch) { return isupper(ch) && '\0' != iso8859_1_char_conversion[ch] ? iso8859_1_char_conversion[ch] : ch; } static int toupper(int ch) { return islower(ch) && '\0' != iso8859_1_char_conversion[ch] ? iso8859_1_char_conversion[ch] : ch; } static ::boost::uint32_t toucs4(int ch) { // The first 256 characters in Unicode and the UCS are // identical to those in ISO/IEC-8859-1. return ch; } }; }}} /////////////////////////////////////////////////////////////////////////////// // undefine macros /////////////////////////////////////////////////////////////////////////////// #undef BOOST_CC_DIGIT #undef BOOST_CC_XDIGIT #undef BOOST_CC_ALPHA #undef BOOST_CC_CTRL #undef BOOST_CC_LOWER #undef BOOST_CC_UPPER #undef BOOST_CC_PUNCT #undef BOOST_CC_SPACE #endif