Windows-4.7.4/tools/porting/src/rpplexer.cpp - platform/external/qt - Git at Google

 /****************************************************************************
 **
 ** Copyright (C) 2001-2004 Roberto Raggi
 ** Copyright (C) 2011 Nokia Corporation and/or its subsidiary(-ies).
 ** All rights reserved.
 ** Contact: Nokia Corporation (qt-info@nokia.com)
 **
 ** This file is part of the qt3to4 porting application of the Qt Toolkit.
 **
 ** $QT_BEGIN_LICENSE:LGPL$
 ** GNU Lesser General Public License Usage
 ** This file may be used under the terms of the GNU Lesser General Public
 ** License version 2.1 as published by the Free Software Foundation and
 ** appearing in the file LICENSE.LGPL included in the packaging of this
 ** file. Please review the following information to ensure the GNU Lesser
 ** General Public License version 2.1 requirements will be met:
 ** http://www.gnu.org/licenses/old-licenses/lgpl-2.1.html.
 **
 ** In addition, as a special exception, Nokia gives you certain additional
 ** rights. These rights are described in the Nokia Qt LGPL Exception
 ** version 1.1, included in the file LGPL_EXCEPTION.txt in this package.
 **
 ** GNU General Public License Usage
 ** Alternatively, this file may be used under the terms of the GNU General
 ** Public License version 3.0 as published by the Free Software Foundation
 ** and appearing in the file LICENSE.GPL included in the packaging of this
 ** file. Please review the following information to ensure the GNU General
 ** Public License version 3.0 requirements will be met:
 ** http://www.gnu.org/copyleft/gpl.html.
 **
 ** Other Usage
 ** Alternatively, this file may be used in accordance with the terms and
 ** conditions contained in a signed written agreement between you and Nokia.
 **
 **
 **
 **
 **
 ** $QT_END_LICENSE$
 **
 ****************************************************************************/

 #include "rpplexer.h"
 #include <QChar>
 #include <ctype.h>

 QT_BEGIN_NAMESPACE

 using namespace TokenEngine;

 namespace Rpp {
 RppLexer::RppLexer()
     : m_buffer(0), m_ptr(0), m_len(0)
 {
     setupScanTable();
 }

 void RppLexer::setupScanTable()
 {
     memset(s_attr_table, 0, 256);

     for (int i=0; i<128; ++i) {
         switch (i) {
         case ':':
         case '*':
         case '%':
         case '^':
         case '=':
         case '!':
         case '&':
         case '|':
         case '+':
         case '<':
         case '>':
         case '-':
         case '.':
             s_scan_table[i] = &RppLexer::scanOperator;
             break;

         case '\r':
 		case '\n':
             s_scan_table[i] = &RppLexer::scanNewline;
             break;

         case '\'':
             s_scan_table[i] = &RppLexer::scanCharLiteral;
             break;

         case '"':
             s_scan_table[i] = &RppLexer::scanStringLiteral;
             break;
         case '#':
             s_scan_table[i] = &RppLexer::scanPreprocessor;
             break;

         case '/':
             s_scan_table[i] = &RppLexer::scanComment;
             break;

         default:
             if (isspace(i)) {
                 s_scan_table[i] = &RppLexer::scanWhiteSpaces;
                 s_attr_table[i] |= A_Whitespace;
             } else if (isalpha(i) || i == '_') {
                 s_scan_table[i] = &RppLexer::scanKeyword;
                 s_attr_table[i] |= A_Alpha;
             } else if (isdigit(i)) {
                 s_scan_table[i] = &RppLexer::scanNumberLiteral;
                 s_attr_table[i] |= A_Digit;
             } else
                 s_scan_table[i] = &RppLexer::scanChar;
         }
     }

     s_scan_table[128] = &RppLexer::scanUnicodeChar;
 }

 QVector<Type> RppLexer::lex(const TokenContainer &tokenContainer)
 {
     QVector<Type> tokenTypes;
     const int numTokens = tokenContainer.count();
     tokenTypes.reserve(numTokens);
     QByteArray text = tokenContainer.fullText();
     m_buffer = text.constData();
     for(int t=0; t<numTokens; ++t) {
         TokenEngine::Token token = tokenContainer.token(t);
         tokenTypes.append(indentify(token.start, token.length));
     }
     return tokenTypes;
 }

 Type RppLexer::indentify(int pos, int length)
 {
     Q_ASSERT(length > 0);
     m_ptr = pos;
     m_len = length;
     int kind = 0;
     const unsigned char ch = m_buffer[pos];
     (this->*s_scan_table[ch < 128 ? ch : 128])(&kind);
     return (Type)kind;
 }

 void RppLexer::scanChar(int *kind)
 {
     *kind = m_buffer[m_ptr];
 }

 void RppLexer::scanWhiteSpaces(int *kind)
 {
     *kind = Token_whitespaces;

     while (unsigned char ch = m_buffer[m_ptr]) {
         if (s_attr_table[ch] & A_Whitespace)
             ++m_ptr;
         else
             break;
     }
 }

 void RppLexer::scanNewline(int *kind)
 {
     *kind = '\n';
 }

 void RppLexer::scanUnicodeChar(int *kind)
 {
     *kind = m_buffer[m_ptr];
 }

 void RppLexer::scanCharLiteral(int *kind)
 {
     *kind = Token_char_literal;
 }

 void RppLexer::scanStringLiteral(int *kind)
 {
     *kind = Token_string_literal;
 }

 void RppLexer::scanIdentifier(int *kind)
 {
     *kind = Token_identifier;
 }

 void RppLexer::scanNumberLiteral(int *kind)
 {
     *kind = Token_number_literal;
 }

 void RppLexer::scanPreprocessor(int *kind)
 {
     *kind = Token_preproc;
 }

 void RppLexer::scanComment(int *kind)
 {
     switch(m_buffer[m_ptr + 1]) {
     case '/':
         *kind = Token_line_comment;
         break;
     case '*':
         *kind = Token_multiline_comment;
         break;
     default:
         scanOperator(kind);
     }
 }

 void RppLexer::scanOperator(int *kind)
 {
     switch (m_buffer[m_ptr]) {
     case ':':
         if (m_buffer[m_ptr+1] == ':') {
             *kind = Token_scope;
             return;
         }
         break;

     case '*':
     case '/':
     case '%':
     case '^':
         if (m_buffer[m_ptr+1] == '=') {
             *kind = Token_assign;
             return;
         }
         break;

     case '=':
        if (m_buffer[m_ptr+1] == '=') {
             *kind = Token_eq;
             return;
         }
         break;
     case '!':
        if (m_buffer[m_ptr+1] == '=') {
             *kind = Token_not_eq;
             return;
         }
         break;

     case '&':
         if (m_buffer[m_ptr+1] == '&') {
             *kind = Token_and;
             return;
         } else if (m_buffer[m_ptr+1] == '=') {
             *kind = Token_assign;
             return;
         }
         break;

     case '|':
         if (m_buffer[m_ptr+1] == '|' ) {
             *kind = Token_or;
             return;
         } else if (m_buffer[m_ptr+1] == '=') {
             *kind = Token_assign;
             return;
         }
         break;

     case '+':
         if (m_buffer[m_ptr+1] == '+' ) {
             *kind = Token_incr;
             return;
         } else if (m_buffer[m_ptr+1] == '=') {
             *kind = Token_assign;
             return;
         }
         break;

     case '<':
         if (m_buffer[m_ptr+1] == '<') {
             if (m_buffer[m_ptr+2] == '=') {
                 *kind = Token_assign;
                 return;
             }
             *kind = Token_left_shift;
             return;
         } else if (m_buffer[m_ptr+1] == '=') {
             *kind = Token_leq;
             return;
         }
         break;

     case '>':
         if (m_buffer[m_ptr+1] == '>') {
             if (m_buffer[m_ptr+2] == '=') {
                 *kind = Token_assign;
                 return;
             }
             *kind = Token_right_shift;
             return;
         } else if (m_buffer[m_ptr+1] == '=') {
             *kind = Token_geq;
             return;
         }
         break;

     case '-':
         if (m_buffer[m_ptr+1] == '>') {
             if (m_buffer[m_ptr+2] == '*') {
                 *kind = Token_ptrmem;
                 return;
             }
             *kind = Token_arrow;
             return;
         } else if (m_buffer[m_ptr+1] == '-') {
             *kind = Token_decr;
             return;
         } else if (m_buffer[m_ptr+1] == '=') {
             *kind = Token_assign;
             return;
         }
         break;

     case '.':
         if (m_buffer[m_ptr+1] == '.' && m_buffer[m_ptr+2] == '.') {
             *kind = Token_ellipsis;
             return;
         } else if (m_buffer[m_ptr+1] == '*') {
             *kind = Token_ptrmem;
             return;
         }
         break;

     }

     *kind = m_buffer[m_ptr++];
 }

 bool RppLexer::match(const char *buf, int len)
 {
     if (m_len != len)
         return false;
     for (int i = 0; i < len; ++i) {
         if(m_buffer[m_ptr + i] != buf[i])
             return false;
     }
     return true;
 }

 void RppLexer::scanKeyword(int *kind)
 {
     if(match("if", 2))
         *kind = Token_directive_if;
     else if(match("elif", 4))
         *kind = Token_directive_elif;
     else if(match("else", 4))
         *kind = Token_directive_else;
     else if(match("line", 4))
         *kind = Token_directive_line;
     else if(match("else", 4))
         *kind = Token_directive_else;
     else if(match("line", 4))
         *kind = Token_directive_line;
     else if(match("endif", 5))
         *kind = Token_directive_endif;
     else if(match("ifdef", 5))
         *kind = Token_directive_ifdef;
     else if(match("error", 5))
         *kind = Token_directive_error;
     else if(match("undef", 5))
         *kind = Token_directive_undef;
     else if(match("pragma", 6))
         *kind = Token_directive_pragma;
     else if(match("ifndef", 6))
         *kind = Token_directive_ifndef;
     else if(match("define", 6))
         *kind = Token_directive_define;
     else if(match("include", 7))
         *kind = Token_directive_include;
     else if(match("defined", 7))
         *kind = Token_defined;
     else
         *kind = Token_identifier;
 }

 } //namespace Rpp

 QT_END_NAMESPACE
	/****************************************************************************
	**
	** Copyright (C) 2001-2004 Roberto Raggi
	** Copyright (C) 2011 Nokia Corporation and/or its subsidiary(-ies).
	** All rights reserved.
	** Contact: Nokia Corporation (qt-info@nokia.com)
	**
	** This file is part of the qt3to4 porting application of the Qt Toolkit.
	**
	** $QT_BEGIN_LICENSE:LGPL$
	** GNU Lesser General Public License Usage
	** This file may be used under the terms of the GNU Lesser General Public
	** License version 2.1 as published by the Free Software Foundation and
	** appearing in the file LICENSE.LGPL included in the packaging of this
	** file. Please review the following information to ensure the GNU Lesser
	** General Public License version 2.1 requirements will be met:
	** http://www.gnu.org/licenses/old-licenses/lgpl-2.1.html.
	**
	** In addition, as a special exception, Nokia gives you certain additional
	** rights. These rights are described in the Nokia Qt LGPL Exception
	** version 1.1, included in the file LGPL_EXCEPTION.txt in this package.
	**
	** GNU General Public License Usage
	** Alternatively, this file may be used under the terms of the GNU General
	** Public License version 3.0 as published by the Free Software Foundation
	** and appearing in the file LICENSE.GPL included in the packaging of this
	** file. Please review the following information to ensure the GNU General
	** Public License version 3.0 requirements will be met:
	** http://www.gnu.org/copyleft/gpl.html.
	**
	** Other Usage
	** Alternatively, this file may be used in accordance with the terms and
	** conditions contained in a signed written agreement between you and Nokia.
	**
	**
	**
	**
	**
	** $QT_END_LICENSE$
	**
	****************************************************************************/

	#include "rpplexer.h"
	#include <QChar>
	#include <ctype.h>

	QT_BEGIN_NAMESPACE

	using namespace TokenEngine;

	namespace Rpp {
	RppLexer::RppLexer()
	: m_buffer(0), m_ptr(0), m_len(0)
	{
	setupScanTable();
	}

	void RppLexer::setupScanTable()
	{
	memset(s_attr_table, 0, 256);

	for (int i=0; i<128; ++i) {
	switch (i) {
	case ':':
	case '*':
	case '%':
	case '^':
	case '=':
	case '!':
	case '&':
	case '\|':
	case '+':
	case '<':
	case '>':
	case '-':
	case '.':
	s_scan_table[i] = &RppLexer::scanOperator;
	break;

	case '\r':
	case '\n':
	s_scan_table[i] = &RppLexer::scanNewline;
	break;

	case '\'':
	s_scan_table[i] = &RppLexer::scanCharLiteral;
	break;

	case '"':
	s_scan_table[i] = &RppLexer::scanStringLiteral;
	break;
	case '#':
	s_scan_table[i] = &RppLexer::scanPreprocessor;
	break;

	case '/':
	s_scan_table[i] = &RppLexer::scanComment;
	break;

	default:
	if (isspace(i)) {
	s_scan_table[i] = &RppLexer::scanWhiteSpaces;
	s_attr_table[i] \|= A_Whitespace;
	} else if (isalpha(i) \|\| i == '_') {
	s_scan_table[i] = &RppLexer::scanKeyword;
	s_attr_table[i] \|= A_Alpha;
	} else if (isdigit(i)) {
	s_scan_table[i] = &RppLexer::scanNumberLiteral;
	s_attr_table[i] \|= A_Digit;
	} else
	s_scan_table[i] = &RppLexer::scanChar;
	}
	}

	s_scan_table[128] = &RppLexer::scanUnicodeChar;
	}

	QVector<Type> RppLexer::lex(const TokenContainer &tokenContainer)
	{
	QVector<Type> tokenTypes;
	const int numTokens = tokenContainer.count();
	tokenTypes.reserve(numTokens);
	QByteArray text = tokenContainer.fullText();
	m_buffer = text.constData();
	for(int t=0; t<numTokens; ++t) {
	TokenEngine::Token token = tokenContainer.token(t);
	tokenTypes.append(indentify(token.start, token.length));
	}
	return tokenTypes;
	}

	Type RppLexer::indentify(int pos, int length)
	{
	Q_ASSERT(length > 0);
	m_ptr = pos;
	m_len = length;
	int kind = 0;
	const unsigned char ch = m_buffer[pos];
	(this->*s_scan_table[ch < 128 ? ch : 128])(&kind);
	return (Type)kind;
	}

	void RppLexer::scanChar(int *kind)
	{
	*kind = m_buffer[m_ptr];
	}

	void RppLexer::scanWhiteSpaces(int *kind)
	{
	*kind = Token_whitespaces;

	while (unsigned char ch = m_buffer[m_ptr]) {
	if (s_attr_table[ch] & A_Whitespace)
	++m_ptr;
	else
	break;
	}
	}

	void RppLexer::scanNewline(int *kind)
	{
	*kind = '\n';
	}

	void RppLexer::scanUnicodeChar(int *kind)
	{
	*kind = m_buffer[m_ptr];
	}

	void RppLexer::scanCharLiteral(int *kind)
	{
	*kind = Token_char_literal;
	}

	void RppLexer::scanStringLiteral(int *kind)
	{
	*kind = Token_string_literal;
	}

	void RppLexer::scanIdentifier(int *kind)
	{
	*kind = Token_identifier;
	}

	void RppLexer::scanNumberLiteral(int *kind)
	{
	*kind = Token_number_literal;
	}

	void RppLexer::scanPreprocessor(int *kind)
	{
	*kind = Token_preproc;
	}

	void RppLexer::scanComment(int *kind)
	{
	switch(m_buffer[m_ptr + 1]) {
	case '/':
	*kind = Token_line_comment;
	break;
	case '*':
	*kind = Token_multiline_comment;
	break;
	default:
	scanOperator(kind);
	}
	}

	void RppLexer::scanOperator(int *kind)
	{
	switch (m_buffer[m_ptr]) {
	case ':':
	if (m_buffer[m_ptr+1] == ':') {
	*kind = Token_scope;
	return;
	}
	break;

	case '*':
	case '/':
	case '%':
	case '^':
	if (m_buffer[m_ptr+1] == '=') {
	*kind = Token_assign;
	return;
	}
	break;

	case '=':
	if (m_buffer[m_ptr+1] == '=') {
	*kind = Token_eq;
	return;
	}
	break;
	case '!':
	if (m_buffer[m_ptr+1] == '=') {
	*kind = Token_not_eq;
	return;
	}
	break;

	case '&':
	if (m_buffer[m_ptr+1] == '&') {
	*kind = Token_and;
	return;
	} else if (m_buffer[m_ptr+1] == '=') {
	*kind = Token_assign;
	return;
	}
	break;

	case '\|':
	if (m_buffer[m_ptr+1] == '\|' ) {
	*kind = Token_or;
	return;
	} else if (m_buffer[m_ptr+1] == '=') {
	*kind = Token_assign;
	return;
	}
	break;

	case '+':
	if (m_buffer[m_ptr+1] == '+' ) {
	*kind = Token_incr;
	return;
	} else if (m_buffer[m_ptr+1] == '=') {
	*kind = Token_assign;
	return;
	}
	break;

	case '<':
	if (m_buffer[m_ptr+1] == '<') {
	if (m_buffer[m_ptr+2] == '=') {
	*kind = Token_assign;
	return;
	}
	*kind = Token_left_shift;
	return;
	} else if (m_buffer[m_ptr+1] == '=') {
	*kind = Token_leq;
	return;
	}
	break;

	case '>':
	if (m_buffer[m_ptr+1] == '>') {
	if (m_buffer[m_ptr+2] == '=') {
	*kind = Token_assign;
	return;
	}
	*kind = Token_right_shift;
	return;
	} else if (m_buffer[m_ptr+1] == '=') {
	*kind = Token_geq;
	return;
	}
	break;

	case '-':
	if (m_buffer[m_ptr+1] == '>') {
	if (m_buffer[m_ptr+2] == '*') {
	*kind = Token_ptrmem;
	return;
	}
	*kind = Token_arrow;
	return;
	} else if (m_buffer[m_ptr+1] == '-') {
	*kind = Token_decr;
	return;
	} else if (m_buffer[m_ptr+1] == '=') {
	*kind = Token_assign;
	return;
	}
	break;

	case '.':
	if (m_buffer[m_ptr+1] == '.' && m_buffer[m_ptr+2] == '.') {
	*kind = Token_ellipsis;
	return;
	} else if (m_buffer[m_ptr+1] == '*') {
	*kind = Token_ptrmem;
	return;
	}
	break;

	}

	*kind = m_buffer[m_ptr++];
	}

	bool RppLexer::match(const char *buf, int len)
	{
	if (m_len != len)
	return false;
	for (int i = 0; i < len; ++i) {
	if(m_buffer[m_ptr + i] != buf[i])
	return false;
	}
	return true;
	}

	void RppLexer::scanKeyword(int *kind)
	{
	if(match("if", 2))
	*kind = Token_directive_if;
	else if(match("elif", 4))
	*kind = Token_directive_elif;
	else if(match("else", 4))
	*kind = Token_directive_else;
	else if(match("line", 4))
	*kind = Token_directive_line;
	else if(match("else", 4))
	*kind = Token_directive_else;
	else if(match("line", 4))
	*kind = Token_directive_line;
	else if(match("endif", 5))
	*kind = Token_directive_endif;
	else if(match("ifdef", 5))
	*kind = Token_directive_ifdef;
	else if(match("error", 5))
	*kind = Token_directive_error;
	else if(match("undef", 5))
	*kind = Token_directive_undef;
	else if(match("pragma", 6))
	*kind = Token_directive_pragma;
	else if(match("ifndef", 6))
	*kind = Token_directive_ifndef;
	else if(match("define", 6))
	*kind = Token_directive_define;
	else if(match("include", 7))
	*kind = Token_directive_include;
	else if(match("defined", 7))
	*kind = Token_defined;
	else
	*kind = Token_identifier;
	}

	} //namespace Rpp

	QT_END_NAMESPACE