forked from qt-creator/qt-creator
		
	Change-Id: I5195fc43e8a6653bf52c0eaa6cddb8dfd25b6217 Reviewed-on: http://codereview.qt.nokia.com/319 Reviewed-by: Qt Sanity Bot <qt_sanity_bot@ovi.com> Reviewed-by: Joerg Bornemann <joerg.bornemann@nokia.com>
		
			
				
	
	
		
			437 lines
		
	
	
		
			13 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			437 lines
		
	
	
		
			13 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /**************************************************************************
 | |
| **
 | |
| ** This file is part of Qt Creator
 | |
| **
 | |
| ** Copyright (c) 2011 Nokia Corporation and/or its subsidiary(-ies).
 | |
| **
 | |
| ** Contact: Nokia Corporation (info@qt.nokia.com)
 | |
| **
 | |
| **
 | |
| ** GNU Lesser General Public License Usage
 | |
| **
 | |
| ** This file may be used under the terms of the GNU Lesser General Public
 | |
| ** License version 2.1 as published by the Free Software Foundation and
 | |
| ** appearing in the file LICENSE.LGPL included in the packaging of this file.
 | |
| ** Please review the following information to ensure the GNU Lesser General
 | |
| ** Public License version 2.1 requirements will be met:
 | |
| ** http://www.gnu.org/licenses/old-licenses/lgpl-2.1.html.
 | |
| **
 | |
| ** In addition, as a special exception, Nokia gives you certain additional
 | |
| ** rights. These rights are described in the Nokia Qt LGPL Exception
 | |
| ** version 1.1, included in the file LGPL_EXCEPTION.txt in this package.
 | |
| **
 | |
| ** Other Usage
 | |
| **
 | |
| ** Alternatively, this file may be used in accordance with the terms and
 | |
| ** conditions contained in a signed written agreement between you and Nokia.
 | |
| **
 | |
| ** If you have questions regarding the use of this file, please contact
 | |
| ** Nokia at info@qt.nokia.com.
 | |
| **
 | |
| **************************************************************************/
 | |
| 
 | |
| #include <qmljs/qmljsscanner.h>
 | |
| 
 | |
| #include <QtGui/QTextCharFormat>
 | |
| 
 | |
| using namespace QmlJS;
 | |
| 
 | |
| namespace {
 | |
| QString js_keywords[] = {
 | |
|     QLatin1String("break"),
 | |
|     QString::fromLatin1("case"),
 | |
|     QString::fromLatin1("catch"),
 | |
|     QString::fromLatin1("continue"),
 | |
|     QString::fromLatin1("debugger"),
 | |
|     QString::fromLatin1("default"),
 | |
|     QString::fromLatin1("delete"),
 | |
|     QString::fromLatin1("do"),
 | |
|     QString::fromLatin1("else"),
 | |
|     QString::fromLatin1("finally"),
 | |
|     QString::fromLatin1("for"),
 | |
|     QString::fromLatin1("function"),
 | |
|     QString::fromLatin1("if"),
 | |
|     QString::fromLatin1("in"),
 | |
|     QString::fromLatin1("instanceof"),
 | |
|     QString::fromLatin1("new"),
 | |
|     QString::fromLatin1("return"),
 | |
|     QString::fromLatin1("switch"),
 | |
|     QString::fromLatin1("this"),
 | |
|     QString::fromLatin1("throw"),
 | |
|     QString::fromLatin1("try"),
 | |
|     QString::fromLatin1("typeof"),
 | |
|     QString::fromLatin1("var"),
 | |
|     QString::fromLatin1("void"),
 | |
|     QString::fromLatin1("while"),
 | |
|     QString::fromLatin1("with")
 | |
| };
 | |
| } // end of anonymous namespace
 | |
| 
 | |
// Returns a pointer to the first element of the C array a.
// T is the element type and N the number of elements; both are deduced
// from the array reference.
template <typename T, int N>
const T *begin(const T (&a)[N])
{
    return a;
}
 | |
| 
 | |
// Returns a pointer one past the last element of the C array a.
// T is the element type and N the number of elements; both are deduced
// from the array reference.
template <typename T, int N>
const T *end(const T (&a)[N])
{
    return a + N;
}
 | |
| 
 | |
| Scanner::Scanner()
 | |
|     : _state(Normal),
 | |
|       _scanComments(true)
 | |
| {
 | |
| }
 | |
| 
 | |
| Scanner::~Scanner()
 | |
| {
 | |
| }
 | |
| 
 | |
| bool Scanner::scanComments() const
 | |
| {
 | |
|     return _scanComments;
 | |
| }
 | |
| 
 | |
| void Scanner::setScanComments(bool scanComments)
 | |
| {
 | |
|     _scanComments = scanComments;
 | |
| }
 | |
| 
 | |
| static bool isIdentifierChar(QChar ch)
 | |
| {
 | |
|     switch (ch.unicode()) {
 | |
|     case '$': case '_':
 | |
|         return true;
 | |
| 
 | |
|     default:
 | |
|         return ch.isLetterOrNumber();
 | |
|     }
 | |
| }
 | |
| 
 | |
| static bool isNumberChar(QChar ch)
 | |
| {
 | |
|     switch (ch.unicode()) {
 | |
|     case '.':
 | |
|     case 'e':
 | |
|     case 'E': // ### more...
 | |
|         return true;
 | |
| 
 | |
|     default:
 | |
|         return ch.isLetterOrNumber();
 | |
|     }
 | |
| }
 | |
| 
 | |
| static int findRegExpEnd(const QString &text, int start)
 | |
| {
 | |
|     if (start >= text.size() || text.at(start) != QLatin1Char('/'))
 | |
|         return start;
 | |
| 
 | |
|     // find the second /
 | |
|     int index = start + 1;
 | |
|     for (; index < text.length(); ++index) {
 | |
|         const QChar ch = text.at(index);
 | |
| 
 | |
|         if (ch == QLatin1Char('\\')) {
 | |
|             ++index;
 | |
|         } else if (ch == QLatin1Char('[')) {
 | |
|             // find closing ]
 | |
|             for (; index < text.length(); ++index) {
 | |
|                 const QChar ch2 = text.at(index);
 | |
|                 if (ch2 == QLatin1Char('\\')) {
 | |
|                     ++index;
 | |
|                 } else if (ch2 == QLatin1Char(']'))
 | |
|                     break;
 | |
|             }
 | |
|             if (index >= text.size())
 | |
|                 return text.size();
 | |
|         } else if (ch == QLatin1Char('/'))
 | |
|             break;
 | |
|     }
 | |
|     if (index >= text.size())
 | |
|         return text.size();
 | |
|     ++index;
 | |
| 
 | |
|     // find end of reg exp flags
 | |
|     for (; index < text.size(); ++index) {
 | |
|         const QChar ch = text.at(index);
 | |
|         if (!isIdentifierChar(ch))
 | |
|             break;
 | |
|     }
 | |
| 
 | |
|     return index;
 | |
| }
 | |
| 
 | |
| 
 | |
| static inline int multiLineState(int state)
 | |
| {
 | |
|     return state & Scanner::MultiLineMask;
 | |
| }
 | |
| 
 | |
| static inline void setMultiLineState(int *state, int s)
 | |
| {
 | |
|     *state = s | (*state & ~Scanner::MultiLineMask);
 | |
| }
 | |
| 
 | |
| static inline bool regexpMayFollow(int state)
 | |
| {
 | |
|     return state & Scanner::RegexpMayFollow;
 | |
| }
 | |
| 
 | |
| static inline void setRegexpMayFollow(int *state, bool on)
 | |
| {
 | |
|     *state = (on ? Scanner::RegexpMayFollow : 0) | (*state & ~Scanner::RegexpMayFollow);
 | |
| }
 | |
| 
 | |
| QList<Token> Scanner::operator()(const QString &text, int startState)
 | |
| {
 | |
|     _state = startState;
 | |
|     QList<Token> tokens;
 | |
| 
 | |
|     int index = 0;
 | |
| 
 | |
|     if (multiLineState(_state) == MultiLineComment) {
 | |
|         int start = -1;
 | |
|         while (index < text.length()) {
 | |
|             const QChar ch = text.at(index);
 | |
| 
 | |
|             if (start == -1 && !ch.isSpace())
 | |
|                 start = index;
 | |
| 
 | |
|             QChar la;
 | |
|             if (index + 1 < text.length())
 | |
|                 la = text.at(index + 1);
 | |
| 
 | |
|             if (ch == QLatin1Char('*') && la == QLatin1Char('/')) {
 | |
|                 setMultiLineState(&_state, Normal);
 | |
|                 index += 2;
 | |
|                 break;
 | |
|             } else {
 | |
|                 ++index;
 | |
|             }
 | |
|         }
 | |
| 
 | |
|         if (_scanComments && start != -1)
 | |
|             tokens.append(Token(start, index - start, Token::Comment));
 | |
|     } else if (multiLineState(_state) == MultiLineStringDQuote || multiLineState(_state) == MultiLineStringSQuote) {
 | |
|         const QChar quote = (_state == MultiLineStringDQuote ? QLatin1Char('"') : QLatin1Char('\''));
 | |
|         const int start = index;
 | |
|         while (index < text.length()) {
 | |
|             const QChar ch = text.at(index);
 | |
| 
 | |
|             if (ch == quote)
 | |
|                 break;
 | |
|             else if (index + 1 < text.length() && ch == QLatin1Char('\\'))
 | |
|                 index += 2;
 | |
|             else
 | |
|                 ++index;
 | |
|         }
 | |
|         if (index < text.length()) {
 | |
|             ++index;
 | |
|             setMultiLineState(&_state, Normal);
 | |
|         }
 | |
|         if (start < index)
 | |
|             tokens.append(Token(start, index - start, Token::String));
 | |
|         setRegexpMayFollow(&_state, false);
 | |
|     }
 | |
| 
 | |
|     while (index < text.length()) {
 | |
|         const QChar ch = text.at(index);
 | |
| 
 | |
|         QChar la; // lookahead char
 | |
|         if (index + 1 < text.length())
 | |
|             la = text.at(index + 1);
 | |
| 
 | |
|         switch (ch.unicode()) {
 | |
|         case '/':
 | |
|             if (la == QLatin1Char('/')) {
 | |
|                 if (_scanComments)
 | |
|                     tokens.append(Token(index, text.length() - index, Token::Comment));
 | |
|                 index = text.length();
 | |
|             } else if (la == QLatin1Char('*')) {
 | |
|                 const int start = index;
 | |
|                 index += 2;
 | |
|                 setMultiLineState(&_state, MultiLineComment);
 | |
|                 while (index < text.length()) {
 | |
|                     const QChar ch = text.at(index);
 | |
|                     QChar la;
 | |
|                     if (index + 1 < text.length())
 | |
|                         la = text.at(index + 1);
 | |
| 
 | |
|                     if (ch == QLatin1Char('*') && la == QLatin1Char('/')) {
 | |
|                         setMultiLineState(&_state, Normal);
 | |
|                         index += 2;
 | |
|                         break;
 | |
|                     } else {
 | |
|                         ++index;
 | |
|                     }
 | |
|                 }
 | |
|                 if (_scanComments)
 | |
|                     tokens.append(Token(start, index - start, Token::Comment));
 | |
|             } else if (regexpMayFollow(_state)) {
 | |
|                 const int end = findRegExpEnd(text, index);
 | |
|                 tokens.append(Token(index, end - index, Token::RegExp));
 | |
|                 index = end;
 | |
|                 setRegexpMayFollow(&_state, false);
 | |
|             } else {
 | |
|                 tokens.append(Token(index++, 1, Token::Delimiter));
 | |
|                 setRegexpMayFollow(&_state, true);
 | |
|             }
 | |
|             break;
 | |
| 
 | |
|         case '\'':
 | |
|         case '"': {
 | |
|             const QChar quote = ch;
 | |
|             const int start = index;
 | |
|             ++index;
 | |
|             while (index < text.length()) {
 | |
|                 const QChar ch = text.at(index);
 | |
| 
 | |
|                 if (ch == quote)
 | |
|                     break;
 | |
|                 else if (index + 1 < text.length() && ch == QLatin1Char('\\'))
 | |
|                     index += 2;
 | |
|                 else
 | |
|                     ++index;
 | |
|             }
 | |
| 
 | |
|             if (index < text.length()) {
 | |
|                 ++index;
 | |
|                 // good one
 | |
|             } else {
 | |
|                 if (quote.unicode() == '"')
 | |
|                     setMultiLineState(&_state, MultiLineStringDQuote);
 | |
|                 else
 | |
|                     setMultiLineState(&_state, MultiLineStringSQuote);
 | |
|             }
 | |
| 
 | |
|             tokens.append(Token(start, index - start, Token::String));
 | |
|             setRegexpMayFollow(&_state, false);
 | |
|         } break;
 | |
| 
 | |
|         case '.':
 | |
|             if (la.isDigit()) {
 | |
|                 const int start = index;
 | |
|                 do {
 | |
|                     ++index;
 | |
|                 } while (index < text.length() && isNumberChar(text.at(index)));
 | |
|                 tokens.append(Token(start, index - start, Token::Number));
 | |
|                 break;
 | |
|             }
 | |
|             tokens.append(Token(index++, 1, Token::Dot));
 | |
|             setRegexpMayFollow(&_state, false);
 | |
|             break;
 | |
| 
 | |
|          case '(':
 | |
|             tokens.append(Token(index++, 1, Token::LeftParenthesis));
 | |
|             setRegexpMayFollow(&_state, true);
 | |
|             break;
 | |
| 
 | |
|          case ')':
 | |
|             tokens.append(Token(index++, 1, Token::RightParenthesis));
 | |
|             setRegexpMayFollow(&_state, false);
 | |
|             break;
 | |
| 
 | |
|          case '[':
 | |
|             tokens.append(Token(index++, 1, Token::LeftBracket));
 | |
|             setRegexpMayFollow(&_state, true);
 | |
|             break;
 | |
| 
 | |
|          case ']':
 | |
|             tokens.append(Token(index++, 1, Token::RightBracket));
 | |
|             setRegexpMayFollow(&_state, false);
 | |
|             break;
 | |
| 
 | |
|          case '{':
 | |
|             tokens.append(Token(index++, 1, Token::LeftBrace));
 | |
|             setRegexpMayFollow(&_state, true);
 | |
|             break;
 | |
| 
 | |
|          case '}':
 | |
|             tokens.append(Token(index++, 1, Token::RightBrace));
 | |
|             setRegexpMayFollow(&_state, false);
 | |
|             break;
 | |
| 
 | |
|          case ';':
 | |
|             tokens.append(Token(index++, 1, Token::Semicolon));
 | |
|             setRegexpMayFollow(&_state, true);
 | |
|             break;
 | |
| 
 | |
|          case ':':
 | |
|             tokens.append(Token(index++, 1, Token::Colon));
 | |
|             setRegexpMayFollow(&_state, true);
 | |
|             break;
 | |
| 
 | |
|          case ',':
 | |
|             tokens.append(Token(index++, 1, Token::Comma));
 | |
|             setRegexpMayFollow(&_state, true);
 | |
|             break;
 | |
| 
 | |
|         case '+':
 | |
|         case '-':
 | |
|             if (la == ch) {
 | |
|                 tokens.append(Token(index, 2, Token::Delimiter));
 | |
|                 index += 2;
 | |
|             } else {
 | |
|                 tokens.append(Token(index++, 1, Token::Delimiter));
 | |
|             }
 | |
|             setRegexpMayFollow(&_state, true);
 | |
|             break;
 | |
| 
 | |
|         default:
 | |
|             if (ch.isSpace()) {
 | |
|                 do {
 | |
|                     ++index;
 | |
|                 } while (index < text.length() && text.at(index).isSpace());
 | |
|             } else if (ch.isNumber()) {
 | |
|                 const int start = index;
 | |
|                 do {
 | |
|                     ++index;
 | |
|                 } while (index < text.length() && isNumberChar(text.at(index)));
 | |
|                 tokens.append(Token(start, index - start, Token::Number));
 | |
|                 setRegexpMayFollow(&_state, false);
 | |
|             } else if (ch.isLetter() || ch == QLatin1Char('_') || ch == QLatin1Char('$')) {
 | |
|                 const int start = index;
 | |
|                 do {
 | |
|                     ++index;
 | |
|                 } while (index < text.length() && isIdentifierChar(text.at(index)));
 | |
| 
 | |
|                 if (isKeyword(text.mid(start, index - start)))
 | |
|                     tokens.append(Token(start, index - start, Token::Keyword)); // ### fixme
 | |
|                 else
 | |
|                     tokens.append(Token(start, index - start, Token::Identifier));
 | |
|                 setRegexpMayFollow(&_state, false);
 | |
|             } else {
 | |
|                 tokens.append(Token(index++, 1, Token::Delimiter));
 | |
|                 setRegexpMayFollow(&_state, true);
 | |
|             }
 | |
|         } // end of switch
 | |
|     }
 | |
| 
 | |
|     return tokens;
 | |
| }
 | |
| 
 | |
| int Scanner::state() const
 | |
| {
 | |
|     return _state;
 | |
| }
 | |
| 
 | |
| bool Scanner::isKeyword(const QString &text) const
 | |
| {
 | |
|     if (qBinaryFind(begin(js_keywords), end(js_keywords), text) != end(js_keywords))
 | |
|         return true;
 | |
| 
 | |
|     return false;
 | |
| }
 | |
| 
 | |
| QStringList Scanner::keywords()
 | |
| {
 | |
|     static QStringList words;
 | |
|     if (words.isEmpty()) {
 | |
|         for (const QString *word = begin(js_keywords); word != end(js_keywords); ++word)
 | |
|             words.append(*word);
 | |
|     }
 | |
|     return words;
 | |
| }
 |