| 1 | /****************************************************************************
|
|---|
| 2 | **
|
|---|
| 3 | ** Copyright (C) 2010 Nokia Corporation and/or its subsidiary(-ies).
|
|---|
| 4 | ** All rights reserved.
|
|---|
| 5 | ** Contact: Nokia Corporation ([email protected])
|
|---|
| 6 | **
|
|---|
| 7 | ** This file is part of the tools applications of the Qt Toolkit.
|
|---|
| 8 | **
|
|---|
| 9 | ** $QT_BEGIN_LICENSE:LGPL$
|
|---|
| 10 | ** Commercial Usage
|
|---|
| 11 | ** Licensees holding valid Qt Commercial licenses may use this file in
|
|---|
| 12 | ** accordance with the Qt Commercial License Agreement provided with the
|
|---|
| 13 | ** Software or, alternatively, in accordance with the terms contained in
|
|---|
| 14 | ** a written agreement between you and Nokia.
|
|---|
| 15 | **
|
|---|
| 16 | ** GNU Lesser General Public License Usage
|
|---|
| 17 | ** Alternatively, this file may be used under the terms of the GNU Lesser
|
|---|
| 18 | ** General Public License version 2.1 as published by the Free Software
|
|---|
| 19 | ** Foundation and appearing in the file LICENSE.LGPL included in the
|
|---|
| 20 | ** packaging of this file. Please review the following information to
|
|---|
| 21 | ** ensure the GNU Lesser General Public License version 2.1 requirements
|
|---|
| 22 | ** will be met: http://www.gnu.org/licenses/old-licenses/lgpl-2.1.html.
|
|---|
| 23 | **
|
|---|
| 24 | ** In addition, as a special exception, Nokia gives you certain additional
|
|---|
| 25 | ** rights. These rights are described in the Nokia Qt LGPL Exception
|
|---|
| 26 | ** version 1.1, included in the file LGPL_EXCEPTION.txt in this package.
|
|---|
| 27 | **
|
|---|
| 28 | ** GNU General Public License Usage
|
|---|
| 29 | ** Alternatively, this file may be used under the terms of the GNU
|
|---|
| 30 | ** General Public License version 3.0 as published by the Free Software
|
|---|
| 31 | ** Foundation and appearing in the file LICENSE.GPL included in the
|
|---|
| 32 | ** packaging of this file. Please review the following information to
|
|---|
| 33 | ** ensure the GNU General Public License version 3.0 requirements will be
|
|---|
| 34 | ** met: http://www.gnu.org/copyleft/gpl.html.
|
|---|
| 35 | **
|
|---|
| 36 | ** If you have questions regarding the use of this file, please contact
|
|---|
| 37 | ** Nokia at [email protected].
|
|---|
| 38 | ** $QT_END_LICENSE$
|
|---|
| 39 | **
|
|---|
| 40 | ****************************************************************************/
|
|---|
| 41 |
|
|---|
| 42 | #include "preprocessor.h"
|
|---|
| 43 | #include "utils.h"
|
|---|
| 44 | #include <QStringList>
|
|---|
| 45 | #include <QFile>
|
|---|
| 46 | #include <QDir>
|
|---|
| 47 | #include <QFileInfo>
|
|---|
| 48 |
|
|---|
| 49 | QT_BEGIN_NAMESPACE
|
|---|
| 50 |
|
|---|
| 51 | #include "ppkeywords.cpp"
|
|---|
| 52 | #include "keywords.cpp"
|
|---|
| 53 |
|
|---|
| 54 | // transform \r\n into \n
|
|---|
| 55 | // \r into \n (os9 style)
|
|---|
| 56 | // backslash-newlines into newlines
|
|---|
| 57 | static QByteArray cleaned(const QByteArray &input)
|
|---|
| 58 | {
|
|---|
| 59 | QByteArray result;
|
|---|
| 60 | result.reserve(input.size());
|
|---|
| 61 | const char *data = input;
|
|---|
| 62 | char *output = result.data();
|
|---|
| 63 |
|
|---|
| 64 | int newlines = 0;
|
|---|
| 65 | while (*data) {
|
|---|
| 66 | while (*data && is_space(*data))
|
|---|
| 67 | ++data;
|
|---|
| 68 | bool takeLine = (*data == '#');
|
|---|
| 69 | if (*data == '%' && *(data+1) == ':') {
|
|---|
| 70 | takeLine = true;
|
|---|
| 71 | ++data;
|
|---|
| 72 | }
|
|---|
| 73 | if (takeLine) {
|
|---|
| 74 | *output = '#';
|
|---|
| 75 | ++output;
|
|---|
| 76 | do ++data; while (*data && is_space(*data));
|
|---|
| 77 | }
|
|---|
| 78 | while (*data) {
|
|---|
| 79 | // handle \\\n, \\\r\n and \\\r
|
|---|
| 80 | if (*data == '\\') {
|
|---|
| 81 | if (*(data + 1) == '\r') {
|
|---|
| 82 | ++data;
|
|---|
| 83 | }
|
|---|
| 84 | if (*data && (*(data + 1) == '\n' || (*data) == '\r')) {
|
|---|
| 85 | ++newlines;
|
|---|
| 86 | data += 1;
|
|---|
| 87 | if (*data != '\r')
|
|---|
| 88 | data += 1;
|
|---|
| 89 | continue;
|
|---|
| 90 | }
|
|---|
| 91 | } else if (*data == '\r' && *(data + 1) == '\n') { // reduce \r\n to \n
|
|---|
| 92 | ++data;
|
|---|
| 93 | }
|
|---|
| 94 |
|
|---|
| 95 | char ch = *data;
|
|---|
| 96 | if (ch == '\r') // os9: replace \r with \n
|
|---|
| 97 | ch = '\n';
|
|---|
| 98 | *output = ch;
|
|---|
| 99 | ++output;
|
|---|
| 100 |
|
|---|
| 101 | if (*data == '\n') {
|
|---|
| 102 | // output additional newlines to keep the correct line-numbering
|
|---|
| 103 | // for the lines following the backslash-newline sequence(s)
|
|---|
| 104 | while (newlines) {
|
|---|
| 105 | *output = '\n';
|
|---|
| 106 | ++output;
|
|---|
| 107 | --newlines;
|
|---|
| 108 | }
|
|---|
| 109 | ++data;
|
|---|
| 110 | break;
|
|---|
| 111 | }
|
|---|
| 112 | ++data;
|
|---|
| 113 | }
|
|---|
| 114 | }
|
|---|
| 115 | result.resize(output - result.constData());
|
|---|
| 116 | return result;
|
|---|
| 117 | }
|
|---|
| 118 |
|
|---|
| 119 | bool Preprocessor::preprocessOnly = false;
|
|---|
| 120 | void Preprocessor::skipUntilEndif()
|
|---|
| 121 | {
|
|---|
| 122 | while(index < symbols.size() - 1 && symbols.at(index).token != PP_ENDIF){
|
|---|
| 123 | switch (symbols.at(index).token) {
|
|---|
| 124 | case PP_IF:
|
|---|
| 125 | case PP_IFDEF:
|
|---|
| 126 | case PP_IFNDEF:
|
|---|
| 127 | ++index;
|
|---|
| 128 | skipUntilEndif();
|
|---|
| 129 | break;
|
|---|
| 130 | default:
|
|---|
| 131 | ;
|
|---|
| 132 | }
|
|---|
| 133 | ++index;
|
|---|
| 134 | }
|
|---|
| 135 | }
|
|---|
| 136 |
|
|---|
| 137 | bool Preprocessor::skipBranch()
|
|---|
| 138 | {
|
|---|
| 139 | while (index < symbols.size() - 1
|
|---|
| 140 | && (symbols.at(index).token != PP_ENDIF
|
|---|
| 141 | && symbols.at(index).token != PP_ELIF
|
|---|
| 142 | && symbols.at(index).token != PP_ELSE)
|
|---|
| 143 | ){
|
|---|
| 144 | switch (symbols.at(index).token) {
|
|---|
| 145 | case PP_IF:
|
|---|
| 146 | case PP_IFDEF:
|
|---|
| 147 | case PP_IFNDEF:
|
|---|
| 148 | ++index;
|
|---|
| 149 | skipUntilEndif();
|
|---|
| 150 | break;
|
|---|
| 151 | default:
|
|---|
| 152 | ;
|
|---|
| 153 | }
|
|---|
| 154 | ++index;
|
|---|
| 155 | }
|
|---|
| 156 | return (index < symbols.size() - 1);
|
|---|
| 157 | }
|
|---|
| 158 |
|
|---|
| 159 |
|
|---|
| 160 | enum TokenizeMode { TokenizeCpp, TokenizePreprocessor, PreparePreprocessorStatement, TokenizePreprocessorStatement, TokenizeInclude };
|
|---|
| 161 | static Symbols tokenize(const QByteArray &input, int lineNum = 1, TokenizeMode mode = TokenizeCpp)
|
|---|
| 162 | {
|
|---|
| 163 | Symbols symbols;
|
|---|
| 164 | const char *begin = input;
|
|---|
| 165 | const char *data = begin;
|
|---|
| 166 | while (*data) {
|
|---|
| 167 | if (mode == TokenizeCpp) {
|
|---|
| 168 | int column = 0;
|
|---|
| 169 |
|
|---|
| 170 | const char *lexem = data;
|
|---|
| 171 | int state = 0;
|
|---|
| 172 | Token token = NOTOKEN;
|
|---|
| 173 | for (;;) {
|
|---|
| 174 | if (static_cast<signed char>(*data) < 0) {
|
|---|
| 175 | ++data;
|
|---|
| 176 | continue;
|
|---|
| 177 | }
|
|---|
| 178 | int nextindex = keywords[state].next;
|
|---|
| 179 | int next = 0;
|
|---|
| 180 | if (*data == keywords[state].defchar)
|
|---|
| 181 | next = keywords[state].defnext;
|
|---|
| 182 | else if (!state || nextindex)
|
|---|
| 183 | next = keyword_trans[nextindex][(int)*data];
|
|---|
| 184 | if (!next)
|
|---|
| 185 | break;
|
|---|
| 186 | state = next;
|
|---|
| 187 | token = keywords[state].token;
|
|---|
| 188 | ++data;
|
|---|
| 189 | }
|
|---|
| 190 |
|
|---|
| 191 | // suboptimal, is_ident_char should use a table
|
|---|
| 192 | if (keywords[state].ident && is_ident_char(*data))
|
|---|
| 193 | token = keywords[state].ident;
|
|---|
| 194 |
|
|---|
| 195 | if (token == NOTOKEN) {
|
|---|
| 196 | // an error really
|
|---|
| 197 | ++data;
|
|---|
| 198 | continue;
|
|---|
| 199 | }
|
|---|
| 200 |
|
|---|
| 201 | ++column;
|
|---|
| 202 |
|
|---|
| 203 | if (token > SPECIAL_TREATMENT_MARK) {
|
|---|
| 204 | switch (token) {
|
|---|
| 205 | case QUOTE:
|
|---|
| 206 | data = skipQuote(data);
|
|---|
| 207 | token = STRING_LITERAL;
|
|---|
| 208 | // concatenate multi-line strings for easier
|
|---|
| 209 | // STRING_LITERAAL handling in moc
|
|---|
| 210 | if (!Preprocessor::preprocessOnly
|
|---|
| 211 | && !symbols.isEmpty()
|
|---|
| 212 | && symbols.last().token == STRING_LITERAL) {
|
|---|
| 213 |
|
|---|
| 214 | QByteArray newString = symbols.last().unquotedLexem();
|
|---|
| 215 | newString += input.mid(lexem - begin + 1, data - lexem - 2);
|
|---|
| 216 | newString.prepend('\"');
|
|---|
| 217 | newString.append('\"');
|
|---|
| 218 | symbols.last() = Symbol(symbols.last().lineNum,
|
|---|
| 219 | STRING_LITERAL,
|
|---|
| 220 | newString);
|
|---|
| 221 | continue;
|
|---|
| 222 | }
|
|---|
| 223 | break;
|
|---|
| 224 | case SINGLEQUOTE:
|
|---|
| 225 | while (*data && (*data != '\''
|
|---|
| 226 | || (*(data-1)=='\\'
|
|---|
| 227 | && *(data-2)!='\\')))
|
|---|
| 228 | ++data;
|
|---|
| 229 | if (*data)
|
|---|
| 230 | ++data;
|
|---|
| 231 | token = CHARACTER_LITERAL;
|
|---|
| 232 | break;
|
|---|
| 233 | case LANGLE_SCOPE:
|
|---|
| 234 | // split <:: into two tokens, < and ::
|
|---|
| 235 | token = LANGLE;
|
|---|
| 236 | data -= 2;
|
|---|
| 237 | break;
|
|---|
| 238 | case DIGIT:
|
|---|
| 239 | while (is_digit_char(*data))
|
|---|
| 240 | ++data;
|
|---|
| 241 | if (!*data || *data != '.') {
|
|---|
| 242 | token = INTEGER_LITERAL;
|
|---|
| 243 | if (data - lexem == 1 &&
|
|---|
| 244 | (*data == 'x' || *data == 'X')
|
|---|
| 245 | && *lexem == '0') {
|
|---|
| 246 | ++data;
|
|---|
| 247 | while (is_hex_char(*data))
|
|---|
| 248 | ++data;
|
|---|
| 249 | }
|
|---|
| 250 | break;
|
|---|
| 251 | }
|
|---|
| 252 | token = FLOATING_LITERAL;
|
|---|
| 253 | ++data;
|
|---|
| 254 | // fall through
|
|---|
| 255 | case FLOATING_LITERAL:
|
|---|
| 256 | while (is_digit_char(*data))
|
|---|
| 257 | ++data;
|
|---|
| 258 | if (*data == '+' || *data == '-')
|
|---|
| 259 | ++data;
|
|---|
| 260 | if (*data == 'e' || *data == 'E') {
|
|---|
| 261 | ++data;
|
|---|
| 262 | while (is_digit_char(*data))
|
|---|
| 263 | ++data;
|
|---|
| 264 | }
|
|---|
| 265 | if (*data == 'f' || *data == 'F'
|
|---|
| 266 | || *data == 'l' || *data == 'L')
|
|---|
| 267 | ++data;
|
|---|
| 268 | break;
|
|---|
| 269 | case HASH:
|
|---|
| 270 | if (column == 1) {
|
|---|
| 271 | mode = PreparePreprocessorStatement;
|
|---|
| 272 | while (*data && (*data == ' ' || *data == '\t'))
|
|---|
| 273 | ++data;
|
|---|
| 274 | if (is_ident_char(*data))
|
|---|
| 275 | mode = TokenizePreprocessorStatement;
|
|---|
| 276 | continue;
|
|---|
| 277 | }
|
|---|
| 278 | break;
|
|---|
| 279 | case NEWLINE:
|
|---|
| 280 | ++lineNum;
|
|---|
| 281 | continue;
|
|---|
| 282 | case BACKSLASH:
|
|---|
| 283 | {
|
|---|
| 284 | const char *rewind = data;
|
|---|
| 285 | while (*data && (*data == ' ' || *data == '\t'))
|
|---|
| 286 | ++data;
|
|---|
| 287 | if (*data && *data == '\n') {
|
|---|
| 288 | ++data;
|
|---|
| 289 | continue;
|
|---|
| 290 | }
|
|---|
| 291 | data = rewind;
|
|---|
| 292 | } break;
|
|---|
| 293 | case CHARACTER:
|
|---|
| 294 | while (is_ident_char(*data))
|
|---|
| 295 | ++data;
|
|---|
| 296 | token = IDENTIFIER;
|
|---|
| 297 | break;
|
|---|
| 298 | case C_COMMENT:
|
|---|
| 299 | if (*data) {
|
|---|
| 300 | if (*data == '\n')
|
|---|
| 301 | ++lineNum;
|
|---|
| 302 | ++data;
|
|---|
| 303 | if (*data) {
|
|---|
| 304 | if (*data == '\n')
|
|---|
| 305 | ++lineNum;
|
|---|
| 306 | ++data;
|
|---|
| 307 | }
|
|---|
| 308 | }
|
|---|
| 309 | while (*data && (*(data-1) != '/' || *(data-2) != '*')) {
|
|---|
| 310 | if (*data == '\n')
|
|---|
| 311 | ++lineNum;
|
|---|
| 312 | ++data;
|
|---|
| 313 | }
|
|---|
| 314 | token = WHITESPACE; // one comment, one whitespace
|
|---|
| 315 | // fall through;
|
|---|
| 316 | case WHITESPACE:
|
|---|
| 317 | if (column == 1)
|
|---|
| 318 | column = 0;
|
|---|
| 319 | while (*data && (*data == ' ' || *data == '\t'))
|
|---|
| 320 | ++data;
|
|---|
| 321 | if (Preprocessor::preprocessOnly) // tokenize whitespace
|
|---|
| 322 | break;
|
|---|
| 323 | continue;
|
|---|
| 324 | case CPP_COMMENT:
|
|---|
| 325 | while (*data && *data != '\n')
|
|---|
| 326 | ++data;
|
|---|
| 327 | continue; // ignore safely, the newline is a separator
|
|---|
| 328 | default:
|
|---|
| 329 | continue; //ignore
|
|---|
| 330 | }
|
|---|
| 331 | }
|
|---|
| 332 | #ifdef USE_LEXEM_STORE
|
|---|
| 333 | if (!Preprocessor::preprocessOnly
|
|---|
| 334 | && token != IDENTIFIER
|
|---|
| 335 | && token != STRING_LITERAL
|
|---|
| 336 | && token != FLOATING_LITERAL
|
|---|
| 337 | && token != INTEGER_LITERAL)
|
|---|
| 338 | symbols += Symbol(lineNum, token);
|
|---|
| 339 | else
|
|---|
| 340 | #endif
|
|---|
| 341 | symbols += Symbol(lineNum, token, input, lexem-begin, data-lexem);
|
|---|
| 342 |
|
|---|
| 343 | } else { // Preprocessor
|
|---|
| 344 |
|
|---|
| 345 | const char *lexem = data;
|
|---|
| 346 | int state = 0;
|
|---|
| 347 | Token token = NOTOKEN;
|
|---|
| 348 | if (mode == TokenizePreprocessorStatement) {
|
|---|
| 349 | state = pp_keyword_trans[0][(int)'#'];
|
|---|
| 350 | mode = TokenizePreprocessor;
|
|---|
| 351 | }
|
|---|
| 352 | for (;;) {
|
|---|
| 353 | if (static_cast<signed char>(*data) < 0) {
|
|---|
| 354 | ++data;
|
|---|
| 355 | continue;
|
|---|
| 356 | }
|
|---|
| 357 |
|
|---|
| 358 | int nextindex = pp_keywords[state].next;
|
|---|
| 359 | int next = 0;
|
|---|
| 360 | if (*data == pp_keywords[state].defchar)
|
|---|
| 361 | next = pp_keywords[state].defnext;
|
|---|
| 362 | else if (!state || nextindex)
|
|---|
| 363 | next = pp_keyword_trans[nextindex][(int)*data];
|
|---|
| 364 | if (!next)
|
|---|
| 365 | break;
|
|---|
| 366 | state = next;
|
|---|
| 367 | token = pp_keywords[state].token;
|
|---|
| 368 | ++data;
|
|---|
| 369 | }
|
|---|
| 370 | // suboptimal, is_ident_char should use a table
|
|---|
| 371 | if (pp_keywords[state].ident && is_ident_char(*data))
|
|---|
| 372 | token = pp_keywords[state].ident;
|
|---|
| 373 |
|
|---|
| 374 | switch (token) {
|
|---|
| 375 | case NOTOKEN:
|
|---|
| 376 | ++data;
|
|---|
| 377 | break;
|
|---|
| 378 | case PP_IFDEF:
|
|---|
| 379 | symbols += Symbol(lineNum, PP_IF);
|
|---|
| 380 | symbols += Symbol(lineNum, PP_DEFINED);
|
|---|
| 381 | continue;
|
|---|
| 382 | case PP_IFNDEF:
|
|---|
| 383 | symbols += Symbol(lineNum, PP_IF);
|
|---|
| 384 | symbols += Symbol(lineNum, PP_NOT);
|
|---|
| 385 | symbols += Symbol(lineNum, PP_DEFINED);
|
|---|
| 386 | continue;
|
|---|
| 387 | case PP_INCLUDE:
|
|---|
| 388 | mode = TokenizeInclude;
|
|---|
| 389 | break;
|
|---|
| 390 | case PP_QUOTE:
|
|---|
| 391 | data = skipQuote(data);
|
|---|
| 392 | token = PP_STRING_LITERAL;
|
|---|
| 393 | break;
|
|---|
| 394 | case PP_SINGLEQUOTE:
|
|---|
| 395 | while (*data && (*data != '\''
|
|---|
| 396 | || (*(data-1)=='\\'
|
|---|
| 397 | && *(data-2)!='\\')))
|
|---|
| 398 | ++data;
|
|---|
| 399 | if (*data)
|
|---|
| 400 | ++data;
|
|---|
| 401 | token = PP_CHARACTER_LITERAL;
|
|---|
| 402 | break;
|
|---|
| 403 | case PP_DIGIT:
|
|---|
| 404 | while (is_digit_char(*data))
|
|---|
| 405 | ++data;
|
|---|
| 406 | if (!*data || *data != '.') {
|
|---|
| 407 | token = PP_INTEGER_LITERAL;
|
|---|
| 408 | if (data - lexem == 1 &&
|
|---|
| 409 | (*data == 'x' || *data == 'X')
|
|---|
| 410 | && *lexem == '0') {
|
|---|
| 411 | ++data;
|
|---|
| 412 | while (is_hex_char(*data))
|
|---|
| 413 | ++data;
|
|---|
| 414 | }
|
|---|
| 415 | break;
|
|---|
| 416 | }
|
|---|
| 417 | token = PP_FLOATING_LITERAL;
|
|---|
| 418 | ++data;
|
|---|
| 419 | // fall through
|
|---|
| 420 | case PP_FLOATING_LITERAL:
|
|---|
| 421 | while (is_digit_char(*data))
|
|---|
| 422 | ++data;
|
|---|
| 423 | if (*data == '+' || *data == '-')
|
|---|
| 424 | ++data;
|
|---|
| 425 | if (*data == 'e' || *data == 'E') {
|
|---|
| 426 | ++data;
|
|---|
| 427 | while (is_digit_char(*data))
|
|---|
| 428 | ++data;
|
|---|
| 429 | }
|
|---|
| 430 | if (*data == 'f' || *data == 'F'
|
|---|
| 431 | || *data == 'l' || *data == 'L')
|
|---|
| 432 | ++data;
|
|---|
| 433 | break;
|
|---|
| 434 | case PP_CHARACTER:
|
|---|
| 435 | if (mode == PreparePreprocessorStatement) {
|
|---|
| 436 | // rewind entire token to begin
|
|---|
| 437 | data = lexem;
|
|---|
| 438 | mode = TokenizePreprocessorStatement;
|
|---|
| 439 | continue;
|
|---|
| 440 | }
|
|---|
| 441 | while (is_ident_char(*data))
|
|---|
| 442 | ++data;
|
|---|
| 443 | token = PP_IDENTIFIER;
|
|---|
| 444 | break;
|
|---|
| 445 | case PP_C_COMMENT:
|
|---|
| 446 | if (*data) {
|
|---|
| 447 | if (*data == '\n')
|
|---|
| 448 | ++lineNum;
|
|---|
| 449 | ++data;
|
|---|
| 450 | if (*data) {
|
|---|
| 451 | if (*data == '\n')
|
|---|
| 452 | ++lineNum;
|
|---|
| 453 | ++data;
|
|---|
| 454 | }
|
|---|
| 455 | }
|
|---|
| 456 | while (*data && (*(data-1) != '/' || *(data-2) != '*')) {
|
|---|
| 457 | if (*data == '\n')
|
|---|
| 458 | ++lineNum;
|
|---|
| 459 | ++data;
|
|---|
| 460 | }
|
|---|
| 461 | token = PP_WHITESPACE; // one comment, one whitespace
|
|---|
| 462 | // fall through;
|
|---|
| 463 | case PP_WHITESPACE:
|
|---|
| 464 | while (*data && (*data == ' ' || *data == '\t'))
|
|---|
| 465 | ++data;
|
|---|
| 466 | continue; // the preprocessor needs no whitespace
|
|---|
| 467 | case PP_CPP_COMMENT:
|
|---|
| 468 | while (*data && *data != '\n')
|
|---|
| 469 | ++data;
|
|---|
| 470 | continue; // ignore safely, the newline is a separator
|
|---|
| 471 | case PP_NEWLINE:
|
|---|
| 472 | ++lineNum;
|
|---|
| 473 | mode = TokenizeCpp;
|
|---|
| 474 | break;
|
|---|
| 475 | case PP_BACKSLASH:
|
|---|
| 476 | {
|
|---|
| 477 | const char *rewind = data;
|
|---|
| 478 | while (*data && (*data == ' ' || *data == '\t'))
|
|---|
| 479 | ++data;
|
|---|
| 480 | if (*data && *data == '\n') {
|
|---|
| 481 | ++data;
|
|---|
| 482 | continue;
|
|---|
| 483 | }
|
|---|
| 484 | data = rewind;
|
|---|
| 485 | } break;
|
|---|
| 486 | case PP_LANGLE:
|
|---|
| 487 | if (mode != TokenizeInclude)
|
|---|
| 488 | break;
|
|---|
| 489 | token = PP_STRING_LITERAL;
|
|---|
| 490 | while (*data && *data != '\n' && *(data-1) != '>')
|
|---|
| 491 | ++data;
|
|---|
| 492 | break;
|
|---|
| 493 | default:
|
|---|
| 494 | break;
|
|---|
| 495 | }
|
|---|
| 496 | if (mode == PreparePreprocessorStatement)
|
|---|
| 497 | continue;
|
|---|
| 498 | #ifdef USE_LEXEM_STORE
|
|---|
| 499 | if (token != PP_IDENTIFIER
|
|---|
| 500 | && token != PP_STRING_LITERAL
|
|---|
| 501 | && token != PP_FLOATING_LITERAL
|
|---|
| 502 | && token != PP_INTEGER_LITERAL)
|
|---|
| 503 | symbols += Symbol(lineNum, token);
|
|---|
| 504 | else
|
|---|
| 505 | #endif
|
|---|
| 506 | symbols += Symbol(lineNum, token, input, lexem-begin, data-lexem);
|
|---|
| 507 | }
|
|---|
| 508 | }
|
|---|
| 509 | symbols += Symbol(); // eof symbol
|
|---|
| 510 | return symbols;
|
|---|
| 511 | }
|
|---|
| 512 |
|
|---|
| 513 | void Preprocessor::substituteMacro(const MacroName ¯o, Symbols &substituted, MacroSafeSet safeset)
|
|---|
| 514 | {
|
|---|
| 515 | Symbols saveSymbols = symbols;
|
|---|
| 516 | int saveIndex = index;
|
|---|
| 517 |
|
|---|
| 518 | symbols = macros.value(macro).symbols;
|
|---|
| 519 | index = 0;
|
|---|
| 520 |
|
|---|
| 521 | safeset += macro;
|
|---|
| 522 | substituteUntilNewline(substituted, safeset);
|
|---|
| 523 |
|
|---|
| 524 | symbols = saveSymbols;
|
|---|
| 525 | index = saveIndex;
|
|---|
| 526 | }
|
|---|
| 527 |
|
|---|
| 528 |
|
|---|
| 529 |
|
|---|
| 530 | void Preprocessor::substituteUntilNewline(Symbols &substituted, MacroSafeSet safeset)
|
|---|
| 531 | {
|
|---|
| 532 | while (hasNext()) {
|
|---|
| 533 | Token token = next();
|
|---|
| 534 | if (token == PP_IDENTIFIER) {
|
|---|
| 535 | MacroName macro = symbol();
|
|---|
| 536 | if (macros.contains(macro) && !safeset.contains(macro)) {
|
|---|
| 537 | substituteMacro(macro, substituted, safeset);
|
|---|
| 538 | continue;
|
|---|
| 539 | }
|
|---|
| 540 | } else if (token == PP_DEFINED) {
|
|---|
| 541 | test(PP_LPAREN);
|
|---|
| 542 | next(PP_IDENTIFIER);
|
|---|
| 543 | Symbol definedOrNotDefined = symbol();
|
|---|
| 544 | definedOrNotDefined.token = macros.contains(definedOrNotDefined)? PP_MOC_TRUE : PP_MOC_FALSE;
|
|---|
| 545 | substituted += definedOrNotDefined;
|
|---|
| 546 | test(PP_RPAREN);
|
|---|
| 547 | continue;
|
|---|
| 548 | } else if (token == PP_NEWLINE) {
|
|---|
| 549 | substituted += symbol();
|
|---|
| 550 | break;
|
|---|
| 551 | }
|
|---|
| 552 | substituted += symbol();
|
|---|
| 553 | }
|
|---|
| 554 | }
|
|---|
| 555 |
|
|---|
| 556 |
|
|---|
| 557 | class PP_Expression : public Parser
|
|---|
| 558 | {
|
|---|
| 559 | public:
|
|---|
| 560 | int value() { index = 0; return unary_expression_lookup() ? conditional_expression() : 0; }
|
|---|
| 561 |
|
|---|
| 562 | int conditional_expression();
|
|---|
| 563 | int logical_OR_expression();
|
|---|
| 564 | int logical_AND_expression();
|
|---|
| 565 | int inclusive_OR_expression();
|
|---|
| 566 | int exclusive_OR_expression();
|
|---|
| 567 | int AND_expression();
|
|---|
| 568 | int equality_expression();
|
|---|
| 569 | int relational_expression();
|
|---|
| 570 | int shift_expression();
|
|---|
| 571 | int additive_expression();
|
|---|
| 572 | int multiplicative_expression();
|
|---|
| 573 | int unary_expression();
|
|---|
| 574 | bool unary_expression_lookup();
|
|---|
| 575 | int primary_expression();
|
|---|
| 576 | bool primary_expression_lookup();
|
|---|
| 577 | };
|
|---|
| 578 |
|
|---|
| 579 | int PP_Expression::conditional_expression()
|
|---|
| 580 | {
|
|---|
| 581 | int value = logical_OR_expression();
|
|---|
| 582 | if (test(PP_QUESTION)) {
|
|---|
| 583 | int alt1 = conditional_expression();
|
|---|
| 584 | int alt2 = test(PP_COLON) ? conditional_expression() : 0;
|
|---|
| 585 | return value ? alt1 : alt2;
|
|---|
| 586 | }
|
|---|
| 587 | return value;
|
|---|
| 588 | }
|
|---|
| 589 |
|
|---|
| 590 | int PP_Expression::logical_OR_expression()
|
|---|
| 591 | {
|
|---|
| 592 | int value = logical_AND_expression();
|
|---|
| 593 | if (test(PP_OROR))
|
|---|
| 594 | return logical_OR_expression() || value;
|
|---|
| 595 | return value;
|
|---|
| 596 | }
|
|---|
| 597 |
|
|---|
| 598 | int PP_Expression::logical_AND_expression()
|
|---|
| 599 | {
|
|---|
| 600 | int value = inclusive_OR_expression();
|
|---|
| 601 | if (test(PP_ANDAND))
|
|---|
| 602 | return logical_AND_expression() && value;
|
|---|
| 603 | return value;
|
|---|
| 604 | }
|
|---|
| 605 |
|
|---|
| 606 | int PP_Expression::inclusive_OR_expression()
|
|---|
| 607 | {
|
|---|
| 608 | int value = exclusive_OR_expression();
|
|---|
| 609 | if (test(PP_OR))
|
|---|
| 610 | return value | inclusive_OR_expression();
|
|---|
| 611 | return value;
|
|---|
| 612 | }
|
|---|
| 613 |
|
|---|
| 614 | int PP_Expression::exclusive_OR_expression()
|
|---|
| 615 | {
|
|---|
| 616 | int value = AND_expression();
|
|---|
| 617 | if (test(PP_HAT))
|
|---|
| 618 | return value ^ exclusive_OR_expression();
|
|---|
| 619 | return value;
|
|---|
| 620 | }
|
|---|
| 621 |
|
|---|
| 622 | int PP_Expression::AND_expression()
|
|---|
| 623 | {
|
|---|
| 624 | int value = equality_expression();
|
|---|
| 625 | if (test(PP_AND))
|
|---|
| 626 | return value & AND_expression();
|
|---|
| 627 | return value;
|
|---|
| 628 | }
|
|---|
| 629 |
|
|---|
| 630 | int PP_Expression::equality_expression()
|
|---|
| 631 | {
|
|---|
| 632 | int value = relational_expression();
|
|---|
| 633 | switch (next()) {
|
|---|
| 634 | case PP_EQEQ:
|
|---|
| 635 | return value == equality_expression();
|
|---|
| 636 | case PP_NE:
|
|---|
| 637 | return value != equality_expression();
|
|---|
| 638 | default:
|
|---|
| 639 | prev();
|
|---|
| 640 | return value;
|
|---|
| 641 | }
|
|---|
| 642 | }
|
|---|
| 643 |
|
|---|
| 644 | int PP_Expression::relational_expression()
|
|---|
| 645 | {
|
|---|
| 646 | int value = shift_expression();
|
|---|
| 647 | switch (next()) {
|
|---|
| 648 | case PP_LANGLE:
|
|---|
| 649 | return value < relational_expression();
|
|---|
| 650 | case PP_RANGLE:
|
|---|
| 651 | return value > relational_expression();
|
|---|
| 652 | case PP_LE:
|
|---|
| 653 | return value <= relational_expression();
|
|---|
| 654 | case PP_GE:
|
|---|
| 655 | return value >= relational_expression();
|
|---|
| 656 | default:
|
|---|
| 657 | prev();
|
|---|
| 658 | return value;
|
|---|
| 659 | }
|
|---|
|
|---|