Qt
Internal/Contributor docs for the Qt SDK. Note: These are NOT official API docs; those are found at https://doc.qt.io/
Loading...
Searching...
No Matches
tokenizer.cpp
Go to the documentation of this file.
1// Copyright (C) 2021 The Qt Company Ltd.
2// SPDX-License-Identifier: LicenseRef-Qt-Commercial OR GPL-3.0-only WITH Qt-GPL-exception-1.0
3
4#include "tokenizer.h"
5
6#include "config.h"
7#include "generator.h"
8
9#include <QtCore/qfile.h>
10#include <QtCore/qhash.h>
11#include <QtCore/qregularexpression.h>
12#include <QtCore/qstring.h>
13#include <QtCore/qstringconverter.h>
14
15#include <cctype>
16#include <cstring>
17#include <utility>
18
20
21#define LANGUAGE_CPP "Cpp"
22
23/* qmake ignore Q_OBJECT */
24
/*
  Spellings of the keywords the tokenizer recognizes. Entry i is reported as
  token Tok_FirstKeyword + i, so the order here must match the keyword
  tokens declared in tokenizer.h. Keep the two in sync.
*/
static const char *kwords[] = {
    // Language keywords, built-in type names and contextual specifiers.
    "char", "class", "const", "double", "enum", "explicit", "friend", "inline",
    "int", "long", "namespace", "operator", "private", "protected", "public", "short",
    "signals", "signed", "slots", "static", "struct", "template", "typedef", "typename",
    "union", "unsigned", "using", "virtual", "void", "volatile", "__int64",
    "default", "delete", "final", "override",

    // Qt macros.
    "Q_OBJECT", "Q_OVERRIDE", "Q_PROPERTY", "Q_PRIVATE_PROPERTY",
    "Q_DECLARE_SEQUENTIAL_ITERATOR", "Q_DECLARE_MUTABLE_SEQUENTIAL_ITERATOR",
    "Q_DECLARE_ASSOCIATIVE_ITERATOR", "Q_DECLARE_MUTABLE_ASSOCIATIVE_ITERATOR",
    "Q_DECLARE_FLAGS", "Q_SIGNALS", "Q_SLOTS",
    "QT_COMPAT", "QT_COMPAT_CONSTRUCTOR", "QT_DEPRECATED", "QT_MOC_COMPAT", "QT_MODULE",
    "QT3_SUPPORT", "QT3_SUPPORT_CONSTRUCTOR", "QT3_MOC_SUPPORT",
    "QDOC_PROPERTY", "QPrivateSignal"
};
84
85static const int KwordHashTableSize = 4096;
87
89
/*
  File-wide regular expressions. They start out as nullptr; the patterns are
  assigned with new elsewhere in this file and the objects are later deleted
  and reset to nullptr.
*/
// Matches a C or C++ comment; used to strip comments from the text that
// follows a preprocessor directive.
90static QRegularExpression *comment = nullptr;
// Matches a line naming the configured version symbol followed by a quoted
// string; the quoted text is captured and stored as the version.
91static QRegularExpression *versionX = nullptr;
// Matches "defined(X)" / "defined X" in a condition and captures X.
92static QRegularExpression *definedX = nullptr;
93
// Anchored alternation of the configured defines plus "qdoc".
94static QRegularExpression *defines = nullptr;
// Anchored alternation of the configured falsehoods; a condition that
// matches it evaluates as false.
95static QRegularExpression *falsehoods = nullptr;
96
98
99/*
100 This function is a perfect hash function for the 37 keywords of C99
101 (with a hash table size of 512). It should perform well on our
102 Qt-enhanced C++ subset.
103*/
104static int hashKword(const char *s, int len)
105{
106 return (((uchar)s[0]) + (((uchar)s[2]) << 5) + (((uchar)s[len - 1]) << 3)) % KwordHashTableSize;
107}
108
109static void insertKwordIntoHash(const char *s, int number)
110{
111 int k = hashKword(s, int(strlen(s)));
112 while (kwordHashTable[k]) {
113 if (++k == KwordHashTableSize)
114 k = 0;
115 }
116 kwordHashTable[k] = number;
117}
118
119Tokenizer::Tokenizer(const Location &loc, QFile &in)
120{
121 init();
122 m_in = in.readAll();
123 m_pos = 0;
124 start(loc);
125}
126
127Tokenizer::Tokenizer(const Location &loc, QByteArray in) : m_in(std::move(in))
128{
129 init();
130 m_pos = 0;
131 start(loc);
132}
133
135{
136 delete[] m_lexBuf1;
137 delete[] m_lexBuf2;
138}
139
141{
142 token_too_long_warning_was_issued = false;
143
144 char *t = m_prevLex;
145 m_prevLex = m_lex;
146 m_lex = t;
147
148 while (m_ch != EOF) {
149 m_tokLoc = m_curLoc;
150 m_lexLen = 0;
151
152 if (isspace(m_ch)) {
153 do {
154 m_ch = getChar();
155 } while (isspace(m_ch));
156 } else if (isalpha(m_ch) || m_ch == '_') {
157 do {
158 m_ch = getChar();
159 } while (isalnum(m_ch) || m_ch == '_');
160
161 int k = hashKword(m_lex, int(m_lexLen));
162 for (;;) {
163 int i = kwordHashTable[k];
164 if (i == 0) {
165 return Tok_Ident;
166 } else if (i == -1) {
167 if (!m_parsingMacro && ignoredTokensAndDirectives->contains(m_lex)) {
168 if (ignoredTokensAndDirectives->value(m_lex)) { // it's a directive
169 int parenDepth = 0;
170 while (m_ch != EOF && (m_ch != ')' || parenDepth > 1)) {
171 if (m_ch == '(')
172 ++parenDepth;
173 else if (m_ch == ')')
174 --parenDepth;
175 m_ch = getChar();
176 }
177 if (m_ch == ')')
178 m_ch = getChar();
179 }
180 break;
181 }
182 } else if (strcmp(m_lex, kwords[i - 1]) == 0) {
183 int ret = (int)Tok_FirstKeyword + i - 1;
184 if (ret != Tok_typename)
185 return ret;
186 break;
187 }
188
189 if (++k == KwordHashTableSize)
190 k = 0;
191 }
192 } else if (isdigit(m_ch)) {
193 do {
194 m_ch = getChar();
195 } while (isalnum(m_ch) || m_ch == '.' || m_ch == '+' || m_ch == '-');
196 return Tok_Number;
197 } else {
198 switch (m_ch) {
199 case '!':
200 case '%':
201 m_ch = getChar();
202 if (m_ch == '=')
203 m_ch = getChar();
204 return Tok_SomeOperator;
205 case '"':
206 m_ch = getChar();
207
208 while (m_ch != EOF && m_ch != '"') {
209 if (m_ch == '\\')
210 m_ch = getChar();
211 m_ch = getChar();
212 }
213 m_ch = getChar();
214
215 if (m_ch == EOF)
216 m_tokLoc.warning(
217 QStringLiteral("Unterminated C++ string literal"),
218 QStringLiteral("Maybe you forgot '/*!' at the beginning of the file?"));
219 else
220 return Tok_String;
221 break;
222 case '#':
223 return getTokenAfterPreprocessor();
224 case '&':
225 m_ch = getChar();
226 /*
227 Removed check for '&&', only interpret '&=' as an operator.
228 '&&' is also used for an rvalue reference. QTBUG-32675
229 */
230 if (m_ch == '=') {
231 m_ch = getChar();
232 return Tok_SomeOperator;
233 } else {
234 return Tok_Ampersand;
235 }
236 case '\'':
237 m_ch = getChar();
238 /*
239 Allow empty character literal. QTBUG-25775
240 */
241 if (m_ch == '\'') {
242 m_ch = getChar();
243 break;
244 }
245 if (m_ch == '\\')
246 m_ch = getChar();
247 do {
248 m_ch = getChar();
249 } while (m_ch != EOF && m_ch != '\'');
250
251 if (m_ch == EOF) {
252 m_tokLoc.warning(QStringLiteral("Unterminated C++ character literal"));
253 } else {
254 m_ch = getChar();
255 return Tok_Number;
256 }
257 break;
258 case '(':
259 m_ch = getChar();
260 if (m_numPreprocessorSkipping == 0)
261 m_parenDepth++;
262 if (isspace(m_ch)) {
263 do {
264 m_ch = getChar();
265 } while (isspace(m_ch));
266 m_lexLen = 1;
267 m_lex[1] = '\0';
268 }
269 if (m_ch == '*') {
270 m_ch = getChar();
271 return Tok_LeftParenAster;
272 }
273 return Tok_LeftParen;
274 case ')':
275 m_ch = getChar();
276 if (m_numPreprocessorSkipping == 0)
277 m_parenDepth--;
278 return Tok_RightParen;
279 case '*':
280 m_ch = getChar();
281 if (m_ch == '=') {
282 m_ch = getChar();
283 return Tok_SomeOperator;
284 } else {
285 return Tok_Aster;
286 }
287 case '^':
288 m_ch = getChar();
289 if (m_ch == '=') {
290 m_ch = getChar();
291 return Tok_SomeOperator;
292 } else {
293 return Tok_Caret;
294 }
295 case '+':
296 m_ch = getChar();
297 if (m_ch == '+' || m_ch == '=')
298 m_ch = getChar();
299 return Tok_SomeOperator;
300 case ',':
301 m_ch = getChar();
302 return Tok_Comma;
303 case '-':
304 m_ch = getChar();
305 if (m_ch == '-' || m_ch == '=') {
306 m_ch = getChar();
307 } else if (m_ch == '>') {
308 m_ch = getChar();
309 if (m_ch == '*')
310 m_ch = getChar();
311 }
312 return Tok_SomeOperator;
313 case '.':
314 m_ch = getChar();
315 if (m_ch == '*') {
316 m_ch = getChar();
317 } else if (m_ch == '.') {
318 do {
319 m_ch = getChar();
320 } while (m_ch == '.');
321 return Tok_Ellipsis;
322 } else if (isdigit(m_ch)) {
323 do {
324 m_ch = getChar();
325 } while (isalnum(m_ch) || m_ch == '.' || m_ch == '+' || m_ch == '-');
326 return Tok_Number;
327 }
328 return Tok_SomeOperator;
329 case '/':
330 m_ch = getChar();
331 if (m_ch == '/') {
332 do {
333 m_ch = getChar();
334 } while (m_ch != EOF && m_ch != '\n');
335 } else if (m_ch == '*') {
336 bool metDoc = false; // empty doc is no doc
337 bool metSlashAsterBang = false;
338 bool metAster = false;
339 bool metAsterSlash = false;
340
341 m_ch = getChar();
342 if (m_ch == '!')
343 metSlashAsterBang = true;
344
345 while (!metAsterSlash) {
346 if (m_ch == EOF) {
347 m_tokLoc.warning(QStringLiteral("Unterminated C++ comment"));
348 break;
349 } else {
350 if (m_ch == '*') {
351 metAster = true;
352 } else if (metAster && m_ch == '/') {
353 metAsterSlash = true;
354 } else {
355 metAster = false;
356 if (isgraph(m_ch))
357 metDoc = true;
358 }
359 }
360 m_ch = getChar();
361 }
362 if (metSlashAsterBang && metDoc)
363 return Tok_Doc;
364 else if (m_parenDepth > 0)
365 return Tok_Comment;
366 } else {
367 if (m_ch == '=')
368 m_ch = getChar();
369 return Tok_SomeOperator;
370 }
371 break;
372 case ':':
373 m_ch = getChar();
374 if (m_ch == ':') {
375 m_ch = getChar();
376 return Tok_Gulbrandsen;
377 } else {
378 return Tok_Colon;
379 }
380 case ';':
381 m_ch = getChar();
382 return Tok_Semicolon;
383 case '<':
384 m_ch = getChar();
385 if (m_ch == '<') {
386 m_ch = getChar();
387 if (m_ch == '=')
388 m_ch = getChar();
389 return Tok_SomeOperator;
390 } else if (m_ch == '=') {
391 m_ch = getChar();
392 return Tok_SomeOperator;
393 } else {
394 return Tok_LeftAngle;
395 }
396 case '=':
397 m_ch = getChar();
398 if (m_ch == '=') {
399 m_ch = getChar();
400 return Tok_SomeOperator;
401 } else {
402 return Tok_Equal;
403 }
404 case '>':
405 m_ch = getChar();
406 if (m_ch == '>') {
407 m_ch = getChar();
408 if (m_ch == '=')
409 m_ch = getChar();
410 return Tok_SomeOperator;
411 } else if (m_ch == '=') {
412 m_ch = getChar();
413 return Tok_SomeOperator;
414 } else {
415 return Tok_RightAngle;
416 }
417 case '?':
418 m_ch = getChar();
419 return Tok_SomeOperator;
420 case '[':
421 m_ch = getChar();
422 if (m_numPreprocessorSkipping == 0)
423 m_bracketDepth++;
424 return Tok_LeftBracket;
425 case '\\':
426 m_ch = getChar();
427 m_ch = getChar(); // skip one character
428 break;
429 case ']':
430 m_ch = getChar();
431 if (m_numPreprocessorSkipping == 0)
432 m_bracketDepth--;
433 return Tok_RightBracket;
434 case '{':
435 m_ch = getChar();
436 if (m_numPreprocessorSkipping == 0)
437 m_braceDepth++;
438 return Tok_LeftBrace;
439 case '}':
440 m_ch = getChar();
441 if (m_numPreprocessorSkipping == 0)
442 m_braceDepth--;
443 return Tok_RightBrace;
444 case '|':
445 m_ch = getChar();
446 if (m_ch == '|' || m_ch == '=')
447 m_ch = getChar();
448 return Tok_SomeOperator;
449 case '~':
450 m_ch = getChar();
451 return Tok_Tilde;
452 case '@':
453 m_ch = getChar();
454 return Tok_At;
455 default:
456 // ### We should really prevent qdoc from looking at snippet files rather than
457 // ### suppress warnings when reading them.
458 if (m_numPreprocessorSkipping == 0
459 && !(m_tokLoc.fileName().endsWith(".qdoc")
460 || m_tokLoc.fileName().endsWith(".js"))) {
461 m_tokLoc.warning(QStringLiteral("Hostile character 0x%1 in C++ source")
462 .arg((uchar)m_ch, 1, 16));
463 }
464 m_ch = getChar();
465 }
466 }
467 }
468
469 if (m_preprocessorSkipping.size() > 1) {
470 m_tokLoc.warning(QStringLiteral("Expected #endif before end of file"));
471 // clear it out or we get an infinite loop!
472 while (!m_preprocessorSkipping.isEmpty()) {
473 popSkipping();
474 }
475 }
476
477 strcpy(m_lex, "end-of-input");
478 m_lexLen = strlen(m_lex);
479 return Tok_Eoi;
480}
481
483{
484 Config &config = Config::instance();
485 QString versionSym = config.get(CONFIG_VERSIONSYM).asString();
486 const QLatin1String defaultEncoding("UTF-8");
487
488 QString sourceEncoding = config.get(CONFIG_SOURCEENCODING).asString(defaultEncoding);
489 if (!QStringConverter::encodingForName(sourceEncoding.toUtf8().constData())) {
490 Location().warning(QStringLiteral("Source encoding '%1' not supported, using '%2' as default.")
491 .arg(sourceEncoding, defaultEncoding));
492 sourceEncoding = defaultEncoding;
493 }
494 sourceDecoder = QStringDecoder(sourceEncoding.toUtf8().constData());
495 Q_ASSERT(sourceDecoder.isValid());
496
497 comment = new QRegularExpression("/(?:\\*.*\\*/|/.*\n|/[^\n]*$)", QRegularExpression::InvertedGreedinessOption);
498 versionX = new QRegularExpression("$cannot possibly match^");
499 if (!versionSym.isEmpty())
500 versionX->setPattern("^[ \t]*(?:" + QRegularExpression::escape(versionSym)
501 + ")[ \t]+\"([^\"]*)\"[ \t]*$");
502 definedX = new QRegularExpression("^defined ?\\‍(?([A-Z_0-9a-z]+) ?\\‍)?$");
503
504 QStringList d{config.get(CONFIG_DEFINES).asStringList()};
505 d += "qdoc";
506 defines = new QRegularExpression(QRegularExpression::anchoredPattern(d.join('|')));
507 falsehoods = new QRegularExpression(QRegularExpression::anchoredPattern(
508 config.get(CONFIG_FALSEHOODS).asStringList().join('|')));
509
510 /*
511 The keyword hash table is always cleared before any words are inserted.
512 */
513 memset(kwordHashTable, 0, sizeof(kwordHashTable));
514 for (int i = 0; i < Tok_LastKeyword - Tok_FirstKeyword + 1; i++)
515 insertKwordIntoHash(kwords[i], i + 1);
516
517 ignoredTokensAndDirectives = new QHash<QByteArray, bool>;
518
519 const QStringList tokens{config.get(LANGUAGE_CPP
520 + Config::dot
521 + CONFIG_IGNORETOKENS).asStringList()};
522 for (const auto &token : tokens) {
523 const QByteArray tb = token.toLatin1();
524 ignoredTokensAndDirectives->insert(tb, false);
525 insertKwordIntoHash(tb.data(), -1);
526 }
527
528 const QStringList directives{config.get(LANGUAGE_CPP
529 + Config::dot
530 + CONFIG_IGNOREDIRECTIVES).asStringList()};
531 for (const auto &directive : directives) {
532 const QByteArray db = directive.toLatin1();
533 ignoredTokensAndDirectives->insert(db, true);
534 insertKwordIntoHash(db.data(), -1);
535 }
536}
537
538/*!
539 The heap allocated variables are freed here. The keyword
540 hash table is not cleared here, but it is cleared in the
541 initialize() function, before any keywords are inserted.
542 */
544{
545 delete comment;
546 comment = nullptr;
547 delete versionX;
548 versionX = nullptr;
549 delete definedX;
550 definedX = nullptr;
551 delete defines;
552 defines = nullptr;
553 delete falsehoods;
554 falsehoods = nullptr;
555 delete ignoredTokensAndDirectives;
557}
558
559void Tokenizer::init()
560{
561 m_lexBuf1 = new char[(int)yyLexBufSize];
562 m_lexBuf2 = new char[(int)yyLexBufSize];
563 m_prevLex = m_lexBuf1;
564 m_prevLex[0] = '\0';
565 m_lex = m_lexBuf2;
566 m_lex[0] = '\0';
567 m_lexLen = 0;
568 m_preprocessorSkipping.push(false);
569 m_numPreprocessorSkipping = 0;
570 m_braceDepth = 0;
571 m_parenDepth = 0;
572 m_bracketDepth = 0;
573 m_ch = '\0';
574 m_parsingMacro = false;
575}
576
577void Tokenizer::start(const Location &loc)
578{
579 m_tokLoc = loc;
580 m_curLoc = loc;
581 m_curLoc.start();
582 strcpy(m_prevLex, "beginning-of-input");
583 strcpy(m_lex, "beginning-of-input");
584 m_lexLen = strlen(m_lex);
585 m_braceDepth = 0;
586 m_parenDepth = 0;
587 m_bracketDepth = 0;
588 m_ch = '\0';
589 m_ch = getChar();
590}
591
592/*
593 Returns the next token, if # was met. This function interprets the
594 preprocessor directive, skips over any #ifdef'd out tokens, and returns the
595 token after all of that.
596*/
597int Tokenizer::getTokenAfterPreprocessor()
598{
599 m_ch = getChar();
600 while (isspace(m_ch) && m_ch != '\n')
601 m_ch = getChar();
602
603 /*
604 #directive condition
605 */
606 QString directive;
607 QString condition;
608
609 while (isalpha(m_ch)) {
610 directive += QChar(m_ch);
611 m_ch = getChar();
612 }
613 if (!directive.isEmpty()) {
614 while (m_ch != EOF && m_ch != '\n') {
615 if (m_ch == '\\') {
616 m_ch = getChar();
617 if (m_ch == '\r')
618 m_ch = getChar();
619 }
620 condition += QChar(m_ch);
621 m_ch = getChar();
622 }
623 condition.remove(*comment);
624 condition = condition.simplified();
625
626 /*
627 The #if, #ifdef, #ifndef, #elif, #else, and #endif
628 directives have an effect on the skipping stack. For
629 instance, if the code processed so far is
630
631 #if 1
632 #if 0
633 #if 1
634 // ...
635 #else
636
637 the skipping stack contains, from bottom to top, false true
638 true (assuming 0 is false and 1 is true). If at least one
639 entry of the stack is true, the tokens are skipped.
640
641 This mechanism is simple yet hard to understand.
642 */
643 if (directive[0] == QChar('i')) {
644 if (directive == QString("if"))
645 pushSkipping(!isTrue(condition));
646 else if (directive == QString("ifdef"))
647 pushSkipping(!defines->match(condition).hasMatch());
648 else if (directive == QString("ifndef"))
649 pushSkipping(defines->match(condition).hasMatch());
650 } else if (directive[0] == QChar('e')) {
651 if (directive == QString("elif")) {
652 bool old = popSkipping();
653 if (old)
654 pushSkipping(!isTrue(condition));
655 else
656 pushSkipping(true);
657 } else if (directive == QString("else")) {
658 pushSkipping(!popSkipping());
659 } else if (directive == QString("endif")) {
660 popSkipping();
661 }
662 } else if (directive == QString("define")) {
663 auto match = versionX->match(condition);
664 if (match.hasMatch())
665 m_version = match.captured(1);
666 }
667 }
668
669 int tok;
670 do {
671 /*
672 We set yyLex now, and after getToken() this will be
673 yyPrevLex. This way, we skip over the preprocessor
674 directive.
675 */
676 qstrcpy(m_lex, m_prevLex);
677
678 /*
679 If getToken() meets another #, it will call
680 getTokenAfterPreprocessor() once again, which could in turn
681 call getToken() again, etc. Unless there are 10,000 or so
682 preprocessor directives in a row, this shouldn't overflow
683 the stack.
684 */
685 tok = getToken();
686 } while (m_numPreprocessorSkipping > 0 && tok != Tok_Eoi);
687 return tok;
688}
689
690/*
691 Pushes a new skipping value onto the stack. This corresponds to entering a
692 new #if block.
693*/
694void Tokenizer::pushSkipping(bool skip)
695{
696 m_preprocessorSkipping.push(skip);
697 if (skip)
698 m_numPreprocessorSkipping++;
699}
700
701/*
702 Pops a skipping value from the stack. This corresponds to reaching a #endif.
703*/
704bool Tokenizer::popSkipping()
705{
706 if (m_preprocessorSkipping.isEmpty()) {
707 m_tokLoc.warning(QStringLiteral("Unexpected #elif, #else or #endif"));
708 return true;
709 }
710
711 bool skip = m_preprocessorSkipping.pop();
712 if (skip)
713 m_numPreprocessorSkipping--;
714 return skip;
715}
716
717/*
718 Returns \c true if the condition evaluates as true, otherwise false. The
719 condition is represented by a string. Unsophisticated parsing techniques are
720 used. The preprocessing method could be named StriNg-Oriented PreProcessing,
721 as SNOBOL stands for StriNg-Oriented symBOlic Language.
722*/
723bool Tokenizer::isTrue(const QString &condition)
724{
725 int firstOr = -1;
726 int firstAnd = -1;
727 int parenDepth = 0;
728
729 /*
730 Find the first logical operator at top level, but be careful
731 about precedence. Examples:
732
733 X || Y // the or
734 X || Y || Z // the leftmost or
735 X || Y && Z // the or
736 X && Y || Z // the or
737 (X || Y) && Z // the and
738 */
739 for (int i = 0; i < condition.size() - 1; i++) {
740 QChar ch = condition[i];
741 if (ch == QChar('(')) {
742 parenDepth++;
743 } else if (ch == QChar(')')) {
744 parenDepth--;
745 } else if (parenDepth == 0) {
746 if (condition[i + 1] == ch) {
747 if (ch == QChar('|')) {
748 firstOr = i;
749 break;
750 } else if (ch == QChar('&')) {
751 if (firstAnd == -1)
752 firstAnd = i;
753 }
754 }
755 }
756 }
757 if (firstOr != -1)
758 return isTrue(condition.left(firstOr)) || isTrue(condition.mid(firstOr + 2));
759 if (firstAnd != -1)
760 return isTrue(condition.left(firstAnd)) && isTrue(condition.mid(firstAnd + 2));
761
762 QString t = condition.simplified();
763 if (t.isEmpty())
764 return true;
765
766 if (t[0] == QChar('!'))
767 return !isTrue(t.mid(1));
768 if (t[0] == QChar('(') && t.endsWith(QChar(')')))
769 return isTrue(t.mid(1, t.size() - 2));
770
771 auto match = definedX->match(t);
772 if (match.hasMatch())
773 return defines->match(match.captured(1)).hasMatch();
774 else
775 return !falsehoods->match(t).hasMatch();
776}
777
779{
780 return sourceDecoder(m_lex);
781}
782
784{
785 return sourceDecoder(m_prevLex);
786}
787
788QT_END_NAMESPACE
The Config class contains the configuration variables for controlling how qdoc produces documentation...
Definition config.h:84
The Location class provides a way to mark a location in a file.
Definition location.h:15
Location()
Constructs an empty location.
Definition location.cpp:40
QString previousLexeme() const
int getToken()
QString lexeme() const
static void terminate()
The heap allocated variables are freed here.
Tokenizer(const Location &loc, QFile &file)
static void initialize()
Tokenizer(const Location &loc, QByteArray in)
#define CONFIG_FALSEHOODS
Definition config.h:343
#define CONFIG_IGNOREDIRECTIVES
Definition config.h:351
#define CONFIG_DEFINES
Definition config.h:331
#define CONFIG_VERSIONSYM
Definition config.h:395
#define CONFIG_IGNORETOKENS
Definition config.h:353
#define CONFIG_SOURCEENCODING
Definition config.h:383
#define LANGUAGE_CPP
Definition tokenizer.cpp:21
static int kwordHashTable[KwordHashTableSize]
Definition tokenizer.cpp:86
static QHash< QByteArray, bool > * ignoredTokensAndDirectives
Definition tokenizer.cpp:88
static QRegularExpression * defines
Definition tokenizer.cpp:94
static const int KwordHashTableSize
Definition tokenizer.cpp:85
static QRegularExpression * falsehoods
Definition tokenizer.cpp:95
static const char * kwords[]
Definition tokenizer.cpp:28
static QRegularExpression * definedX
Definition tokenizer.cpp:92
static QRegularExpression * comment
Definition tokenizer.cpp:90
static QStringDecoder sourceDecoder
Definition tokenizer.cpp:97
static int hashKword(const char *s, int len)
static void insertKwordIntoHash(const char *s, int number)
static QRegularExpression * versionX
Definition tokenizer.cpp:91
@ Tok_Eoi
Definition tokenizer.h:24
@ Tok_LastKeyword
Definition tokenizer.h:67
@ Tok_RightParen
Definition tokenizer.h:29
@ Tok_Tilde
Definition tokenizer.h:43
@ Tok_SomeOperator
Definition tokenizer.h:44
@ Tok_Doc
Definition tokenizer.h:47
@ Tok_String
Definition tokenizer.h:46
@ Tok_Ellipsis
Definition tokenizer.h:39
@ Tok_Gulbrandsen
Definition tokenizer.h:40
@ Tok_Equal
Definition tokenizer.h:31
@ Tok_At
Definition tokenizer.h:50
@ Tok_Caret
Definition tokenizer.h:27
@ Tok_LeftBracket
Definition tokenizer.h:41
@ Tok_LeftAngle
Definition tokenizer.h:36
@ Tok_Comma
Definition tokenizer.h:38
@ Tok_LeftBrace
Definition tokenizer.h:32
@ Tok_Ident
Definition tokenizer.h:49
@ Tok_LeftParenAster
Definition tokenizer.h:30
@ Tok_typename
Definition tokenizer.h:60
@ Tok_LeftParen
Definition tokenizer.h:28
@ Tok_RightAngle
Definition tokenizer.h:37
@ Tok_RightBrace
Definition tokenizer.h:33
@ Tok_Ampersand
Definition tokenizer.h:25
@ Tok_RightBracket
Definition tokenizer.h:42
@ Tok_Aster
Definition tokenizer.h:26
@ Tok_Semicolon
Definition tokenizer.h:34
@ Tok_FirstKeyword
Definition tokenizer.h:66
@ Tok_Number
Definition tokenizer.h:45
@ Tok_Comment
Definition tokenizer.h:48
@ Tok_Colon
Definition tokenizer.h:35