// blob: 5f680900c7c3f390d390b088da211e31dd991638 [file] [log] [blame]
/****************************************************************************
**
** Copyright (C) 2001-2004 Roberto Raggi
** Copyright (C) 2011 Nokia Corporation and/or its subsidiary(-ies).
** All rights reserved.
** Contact: Nokia Corporation (qt-info@nokia.com)
**
** This file is part of the qt3to4 porting application of the Qt Toolkit.
**
** $QT_BEGIN_LICENSE:LGPL$
** GNU Lesser General Public License Usage
** This file may be used under the terms of the GNU Lesser General Public
** License version 2.1 as published by the Free Software Foundation and
** appearing in the file LICENSE.LGPL included in the packaging of this
** file. Please review the following information to ensure the GNU Lesser
** General Public License version 2.1 requirements will be met:
** http://www.gnu.org/licenses/old-licenses/lgpl-2.1.html.
**
** In addition, as a special exception, Nokia gives you certain additional
** rights. These rights are described in the Nokia Qt LGPL Exception
** version 1.1, included in the file LGPL_EXCEPTION.txt in this package.
**
** GNU General Public License Usage
** Alternatively, this file may be used under the terms of the GNU General
** Public License version 3.0 as published by the Free Software Foundation
** and appearing in the file LICENSE.GPL included in the packaging of this
** file. Please review the following information to ensure the GNU General
** Public License version 3.0 requirements will be met:
** http://www.gnu.org/copyleft/gpl.html.
**
** Other Usage
** Alternatively, this file may be used in accordance with the terms and
** conditions contained in a signed written agreement between you and Nokia.
**
**
**
**
**
** $QT_END_LICENSE$
**
****************************************************************************/
#include "rpplexer.h"
#include <QChar>
#include <ctype.h>
QT_BEGIN_NAMESPACE
using namespace TokenEngine;
namespace Rpp {
/*
    Creates a lexer with no buffer attached (buffer pointer, position and
    length all zero) and fills the character dispatch tables.
*/
RppLexer::RppLexer()
    : m_buffer(0),
      m_ptr(0),
      m_len(0)
{
    setupScanTable();
}
/*
    Fills the two lookup tables used to classify a token by its first byte.

    s_scan_table maps each ASCII value (0..127) to the member function that
    classifies a token starting with that byte; slot 128 is the shared entry
    used for every byte >= 128.

    s_attr_table receives the A_Whitespace / A_Alpha / A_Digit flags. Only
    bytes that reach the default branch are flagged, so '\r' and '\n' (which
    have their own case) are not marked A_Whitespace.
*/
void RppLexer::setupScanTable()
{
    // Reset all 256 entries one by one. Unlike a memset with a byte count of
    // 256, this clears the whole table whatever integral element type the
    // header declares for it.
    for (int i = 0; i < 256; ++i)
        s_attr_table[i] = 0;

    for (int i = 0; i < 128; ++i) {
        switch (i) {
        case ':':
        case '*':
        case '%':
        case '^':
        case '=':
        case '!':
        case '&':
        case '|':
        case '+':
        case '<':
        case '>':
        case '-':
        case '.':
            s_scan_table[i] = &RppLexer::scanOperator;
            break;
        case '\r':
        case '\n':
            s_scan_table[i] = &RppLexer::scanNewline;
            break;
        case '\'':
            s_scan_table[i] = &RppLexer::scanCharLiteral;
            break;
        case '"':
            s_scan_table[i] = &RppLexer::scanStringLiteral;
            break;
        case '#':
            s_scan_table[i] = &RppLexer::scanPreprocessor;
            break;
        case '/':
            // '/' may start a comment or an operator; scanComment decides.
            s_scan_table[i] = &RppLexer::scanComment;
            break;
        default:
            if (isspace(i)) {
                s_scan_table[i] = &RppLexer::scanWhiteSpaces;
                s_attr_table[i] |= A_Whitespace;
            } else if (isalpha(i) || i == '_') {
                s_scan_table[i] = &RppLexer::scanKeyword;
                s_attr_table[i] |= A_Alpha;
            } else if (isdigit(i)) {
                s_scan_table[i] = &RppLexer::scanNumberLiteral;
                s_attr_table[i] |= A_Digit;
            } else {
                // Any other ASCII byte is reported as itself.
                s_scan_table[i] = &RppLexer::scanChar;
            }
            break;
        }
    }

    // Shared slot for all non-ASCII bytes (see the index clamp in indentify()).
    s_scan_table[128] = &RppLexer::scanUnicodeChar;
}
/*
    Classifies every token of tokenContainer and returns the resulting types,
    one entry per token, in token order.

    m_buffer is pointed at the local copy of the container's full text, so it
    is only meaningful while this function is running.
*/
QVector<Type> RppLexer::lex(const TokenContainer &tokenContainer)
{
    QVector<Type> tokenTypes;
    const int numTokens = tokenContainer.count();
    tokenTypes.reserve(numTokens);

    // The byte array must stay alive for the whole loop: indentify() and the
    // scan functions read through m_buffer.
    const QByteArray text = tokenContainer.fullText();
    m_buffer = text.constData();

    int index = 0;
    while (index < numTokens) {
        const TokenEngine::Token current = tokenContainer.token(index);
        const Type type = indentify(current.start, current.length);
        tokenTypes.push_back(type);
        ++index;
    }

    return tokenTypes;
}
/*
    Classifies the token that starts at offset pos in m_buffer and is length
    bytes long. The first byte selects the scan function; that function
    writes the token kind, which is returned converted to Type.

    length must be greater than zero (asserted).
*/
Type RppLexer::indentify(int pos, int length)
{
    Q_ASSERT(length > 0);

    m_ptr = pos;
    m_len = length;

    // Bytes >= 128 all share the extra table slot at index 128.
    const unsigned char first = m_buffer[pos];
    const int slot = (first < 128) ? first : 128;

    int kind = 0;
    (this->*s_scan_table[slot])(&kind);
    return static_cast<Type>(kind);
}
/*
    Fallback for ASCII bytes that have no dedicated scanner: the token kind
    is the value of the byte at the current position.
*/
void RppLexer::scanChar(int *kind)
{
    const char current = m_buffer[m_ptr];
    *kind = current;
}
/*
    Reports Token_whitespaces and advances m_ptr past the run of bytes
    flagged A_Whitespace. The walk stops at the first byte without that flag
    or at a zero byte; it does not consult m_len.
*/
void RppLexer::scanWhiteSpaces(int *kind)
{
    *kind = Token_whitespaces;

    for (;;) {
        const unsigned char current = m_buffer[m_ptr];
        if (current == 0 || !(s_attr_table[current] & A_Whitespace))
            return;
        ++m_ptr;
    }
}
/*
    Installed for both '\r' and '\n'; the reported kind is always '\n'.
*/
void RppLexer::scanNewline(int *kind)
{
    int &tokenKind = *kind;
    tokenKind = '\n';
}
/*
    Installed in the shared table slot for bytes >= 128: the token kind is
    the value of the byte at the current position, converted to int.
*/
void RppLexer::scanUnicodeChar(int *kind)
{
    const char current = m_buffer[m_ptr];
    *kind = current;
}
/*
    Selected for tokens whose first byte is a single quote; reports
    Token_char_literal without inspecting the rest of the token.
*/
void RppLexer::scanCharLiteral(int *kind)
{
    int &tokenKind = *kind;
    tokenKind = Token_char_literal;
}
/*
    Selected for tokens whose first byte is a double quote; reports
    Token_string_literal without inspecting the rest of the token.
*/
void RppLexer::scanStringLiteral(int *kind)
{
    int &tokenKind = *kind;
    tokenKind = Token_string_literal;
}
/*
    Reports Token_identifier unconditionally. setupScanTable() in this file
    does not install this function; alphabetic and '_' tokens are routed to
    scanKeyword() instead.
*/
void RppLexer::scanIdentifier(int *kind)
{
    int &tokenKind = *kind;
    tokenKind = Token_identifier;
}
/*
    Selected for tokens whose first byte is a digit; reports
    Token_number_literal without inspecting the rest of the token.
*/
void RppLexer::scanNumberLiteral(int *kind)
{
    int &tokenKind = *kind;
    tokenKind = Token_number_literal;
}
/*
    Selected for tokens whose first byte is '#'; reports Token_preproc.
*/
void RppLexer::scanPreprocessor(int *kind)
{
    int &tokenKind = *kind;
    tokenKind = Token_preproc;
}
/*
    Selected for tokens whose first byte is '/'. The byte after it decides
    the kind: "//" is a line comment, a slash followed by '*' is a multi-line
    comment, and anything else is handed to scanOperator().
*/
void RppLexer::scanComment(int *kind)
{
    const char following = m_buffer[m_ptr + 1];

    if (following == '/') {
        *kind = Token_line_comment;
    } else if (following == '*') {
        *kind = Token_multiline_comment;
    } else {
        scanOperator(kind);
    }
}
/*
    Classifies an operator token by looking at up to three bytes starting at
    the current position. Multi-character operators get a dedicated Token_*
    kind (all compound assignments share Token_assign; both "->*" and ".*"
    yield Token_ptrmem). If no multi-character operator matches, the kind is
    the first byte itself and m_ptr is advanced by one.

    Lookahead bytes are read straight from the buffer and are not limited to
    m_len. The third byte is only read after the second one has matched.
*/
void RppLexer::scanOperator(int *kind)
{
    const char *const op = m_buffer + m_ptr;

    switch (op[0]) {
    case ':':
        if (op[1] == ':') {
            *kind = Token_scope;
            return;
        }
        break;

    case '*':
    case '/':
    case '%':
    case '^':
        if (op[1] == '=') {
            *kind = Token_assign;
            return;
        }
        break;

    case '=':
        if (op[1] == '=') {
            *kind = Token_eq;
            return;
        }
        break;

    case '!':
        if (op[1] == '=') {
            *kind = Token_not_eq;
            return;
        }
        break;

    case '&':
        switch (op[1]) {
        case '&':
            *kind = Token_and;
            return;
        case '=':
            *kind = Token_assign;
            return;
        default:
            break;
        }
        break;

    case '|':
        switch (op[1]) {
        case '|':
            *kind = Token_or;
            return;
        case '=':
            *kind = Token_assign;
            return;
        default:
            break;
        }
        break;

    case '+':
        switch (op[1]) {
        case '+':
            *kind = Token_incr;
            return;
        case '=':
            *kind = Token_assign;
            return;
        default:
            break;
        }
        break;

    case '<':
        switch (op[1]) {
        case '<':
            // "<<=" is an assignment, plain "<<" a shift.
            *kind = (op[2] == '=') ? Token_assign : Token_left_shift;
            return;
        case '=':
            *kind = Token_leq;
            return;
        default:
            break;
        }
        break;

    case '>':
        switch (op[1]) {
        case '>':
            // ">>=" is an assignment, plain ">>" a shift.
            *kind = (op[2] == '=') ? Token_assign : Token_right_shift;
            return;
        case '=':
            *kind = Token_geq;
            return;
        default:
            break;
        }
        break;

    case '-':
        switch (op[1]) {
        case '>':
            // "->*" is pointer-to-member access, plain "->" an arrow.
            *kind = (op[2] == '*') ? Token_ptrmem : Token_arrow;
            return;
        case '-':
            *kind = Token_decr;
            return;
        case '=':
            *kind = Token_assign;
            return;
        default:
            break;
        }
        break;

    case '.':
        if (op[1] == '.' && op[2] == '.') {
            *kind = Token_ellipsis;
            return;
        }
        if (op[1] == '*') {
            *kind = Token_ptrmem;
            return;
        }
        break;
    }

    // Single-character operator: report the byte itself and step past it.
    *kind = op[0];
    ++m_ptr;
}
/*
    Returns true when the current token is exactly the len bytes at buf:
    the token length (m_len) must equal len and every byte from the current
    position must be identical.
*/
bool RppLexer::match(const char *buf, int len)
{
    if (m_len != len)
        return false;

    const char *candidate = m_buffer + m_ptr;
    int remaining = len;
    while (remaining-- > 0) {
        if (*candidate++ != *buf++)
            return false;
    }
    return true;
}
void RppLexer::scanKeyword(int *kind)
{
if(match("if", 2))
*kind = Token_directive_if;
else if(match("elif", 4))
*kind = Token_directive_elif;
else if(match("else", 4))
*kind = Token_directive_else;
else if(match("line", 4))
*kind = Token_directive_line;
else if(match("else", 4))
*kind = Token_directive_else;
else if(match("line", 4))
*kind = Token_directive_line;
else if(match("endif", 5))
*kind = Token_directive_endif;
else if(match("ifdef", 5))
*kind = Token_directive_ifdef;
else if(match("error", 5))
*kind = Token_directive_error;
else if(match("undef", 5))
*kind = Token_directive_undef;
else if(match("pragma", 6))
*kind = Token_directive_pragma;
else if(match("ifndef", 6))
*kind = Token_directive_ifndef;
else if(match("define", 6))
*kind = Token_directive_define;
else if(match("include", 7))
*kind = Token_directive_include;
else if(match("defined", 7))
*kind = Token_defined;
else
*kind = Token_identifier;
}
} //namespace Rpp
QT_END_NAMESPACE