blob: 868136605e5abe59209fdc5518dfcead45bde8c5 [file] [log] [blame]
/****************************************************************************
**
** Copyright (C) 2011 Nokia Corporation and/or its subsidiary(-ies).
** All rights reserved.
** Contact: Nokia Corporation (qt-info@nokia.com)
**
** This file is part of the QtCore module of the Qt Toolkit.
**
** $QT_BEGIN_LICENSE:LGPL$
** GNU Lesser General Public License Usage
** This file may be used under the terms of the GNU Lesser General Public
** License version 2.1 as published by the Free Software Foundation and
** appearing in the file LICENSE.LGPL included in the packaging of this
** file. Please review the following information to ensure the GNU Lesser
** General Public License version 2.1 requirements will be met:
** http://www.gnu.org/licenses/old-licenses/lgpl-2.1.html.
**
** In addition, as a special exception, Nokia gives you certain additional
** rights. These rights are described in the Nokia Qt LGPL Exception
** version 1.1, included in the file LGPL_EXCEPTION.txt in this package.
**
** GNU General Public License Usage
** Alternatively, this file may be used under the terms of the GNU General
** Public License version 3.0 as published by the Free Software Foundation
** and appearing in the file LICENSE.GPL included in the packaging of this
** file. Please review the following information to ensure the GNU General
** Public License version 3.0 requirements will be met:
** http://www.gnu.org/copyleft/gpl.html.
**
** Other Usage
** Alternatively, this file may be used in accordance with the terms and
** conditions contained in a signed written agreement between you and Nokia.
**
**
**
**
**
** $QT_END_LICENSE$
**
****************************************************************************/
// Most of the code here was originally written by Hans Petter Bieker,
// and is included in Qt with the author's permission, and the grateful
// thanks of the Qt team.
#include "qtsciicodec_p.h"
#include "qlist.h"
#ifndef QT_NO_CODECS
QT_BEGIN_NAMESPACE
// Looks up the TSCII byte for a sequence of up to three UTF-16 code units.
// Unused trailing positions are passed as 0; the result is 0 when the
// sequence has no entry in the lookup table.
static unsigned char qt_UnicodeToTSCII(ushort u1, ushort u2, ushort u3);
// Stores the code units that TSCII byte `code` expands to in `s` (which must
// have room for three entries) and returns how many of them are in use.
static unsigned int qt_TSCIIToUnicode(unsigned int code, uint *s);
// True for byte values in 0x80..0xfd, the range covered by the TSCII-to-Unicode
// table in this file. The argument is evaluated twice.
#define IsTSCIIChar(c) (((c) >= 0x80) && ((c) <= 0xfd))
/*! \class QTsciiCodec
\reentrant
\internal
*/
/*!
    Destructor. The codec holds no resources of its own, so there is
    nothing to release here.
*/
QTsciiCodec::~QTsciiCodec() {}
/*!
    Converts the first \a len characters in \a uc from Unicode to this
    encoding, and returns the result in a byte array.

    Code units below 0x80 are copied through unchanged. For everything
    else the longest matching sequence (three, then two, then one code
    unit) is looked up and emitted as a single TSCII byte. Input that has
    no mapping is written as '?' (or as a null byte when \a state has
    ConvertInvalidToNull set) and counted in \c{state->invalidChars}.

    The look-ahead never reads at or beyond \c{uc[len]}.
*/
QByteArray QTsciiCodec::convertFromUnicode(const QChar *uc, int len, ConverterState *state) const
{
    char replacement = '?';
    if (state) {
        if (state->flags & ConvertInvalidToNull)
            replacement = 0;
    }
    int invalid = 0;

    // One output byte per input code unit is the upper bound; the array is
    // shrunk to the real size after the loop.
    QByteArray rstr(len, Qt::Uninitialized);
    uchar *cursor = reinterpret_cast<uchar *>(rstr.data());
    for (int i = 0; i < len; i++) {
        const ushort u1 = uc[i].unicode();
        // Look-ahead units, clamped to the input length. A value of 0 means
        // "nothing usable here": either the input ends, or the unit is a real
        // U+0000, which is never part of a combined sequence and must not be
        // consumed together with the current character.
        const ushort u2 = (i + 1 < len) ? uc[i + 1].unicode() : 0;
        const ushort u3 = (u2 && i + 2 < len) ? uc[i + 2].unicode() : 0;

        uchar j = 0;
        if (u1 < 0x80) {
            // ASCII
            j = uchar(u1);
        } else if (u2 && u3 && (j = qt_UnicodeToTSCII(u1, u2, u3))) {
            // We have to check the combined chars first!
            i += 2;
        } else if (u2 && (j = qt_UnicodeToTSCII(u1, u2, 0))) {
            i++;
        } else if ((j = qt_UnicodeToTSCII(u1, 0, 0))) {
            // Single code unit mapping; nothing extra to consume.
        } else {
            // Error
            j = replacement;
            ++invalid;
        }
        *cursor++ = j;
    }
    rstr.resize(int(cursor - reinterpret_cast<const uchar *>(rstr.constData())));

    if (state) {
        state->invalidChars += invalid;
    }
    return rstr;
}
/*!
    Converts the first \a len characters in \a chars from this encoding
    to Unicode, and returns the result in a QString.

    Bytes below 0x80 are taken as ASCII. Bytes in the TSCII range expand
    to between one and three code units. Bytes outside that range, and
    bytes inside it that have no assigned mapping, produce
    QChar::ReplacementCharacter (or QChar::Null when \a state has
    ConvertInvalidToNull set) and are counted in
    \c{state->invalidChars}.
*/
QString QTsciiCodec::convertToUnicode(const char* chars, int len, ConverterState *state) const
{
    QChar replacement = QChar::ReplacementCharacter;
    if (state) {
        if (state->flags & ConvertInvalidToNull)
            replacement = QChar::Null;
    }
    int invalid = 0;

    QString result;
    for (int i = 0; i < len; i++) {
        uchar ch = chars[i];
        if (ch < 0x80) {
            // ASCII
            result += QLatin1Char(ch);
        } else if (IsTSCIIChar(ch)) {
            // TSCII
            uint s[3];
            const uint count = qt_TSCIIToUnicode(ch, s);
            if (count == 0) {
                // The byte is in range but its table row is empty. Report it
                // like any other invalid byte instead of silently dropping it.
                result += replacement;
                ++invalid;
            }
            for (uint k = 0; k < count; ++k) {
                if (s[k]) {
                    result += QChar(s[k]);
                } else {
                    result += replacement;
                    ++invalid;
                }
            }
        } else {
            // Invalid
            result += replacement;
            ++invalid;
        }
    }

    if (state) {
        state->invalidChars += invalid;
    }
    return result;
}
/*!
    Returns the name under which this codec's encoding is known,
    \c "TSCII".

    \sa QTextCodec::name()
*/
QByteArray QTsciiCodec::name() const
{
    return QByteArray("TSCII");
}
/*!
    Returns the MIB enum value reported for this encoding, 2107.

    \sa QTextCodec::mibEnum()
*/
int QTsciiCodec::mibEnum() const
{
    const int tsciiMib = 2107;
    return tsciiMib;
}
// Unicode -> TSCII lookup table.
//
// Each row holds a sequence of up to three UTF-16 code units (unused
// positions are 0x0000) followed by the TSCII byte that encodes it.
// Rows MUST stay strictly sorted by (FIRST, SECOND, THIRD): the lookup is a
// binary search, so a duplicate or misplaced key makes rows unreachable.
//
// NOTE(review): the sign used in the two-unit "consonant + sign" rows is
// 0x0B82 throughout; confirm against the TSCII specification whether U+0BCD
// was intended. Left unchanged here.
static const ushort UnToTs [][4] = {
    // *Sorted* list of TSCII mapping for unicode chars
    //FIRST  SECOND  THIRD   TSCII
    {0x00A0, 0x0000, 0x0000, 0xA0},
    {0x00A9, 0x0000, 0x0000, 0xA9},
    {0x0B83, 0x0000, 0x0000, 0xB7},
    {0x0B85, 0x0000, 0x0000, 0xAB},
    {0x0B86, 0x0000, 0x0000, 0xAC},
    {0x0B87, 0x0000, 0x0000, 0xAD},
    {0x0B88, 0x0000, 0x0000, 0xAE},
    {0x0B89, 0x0000, 0x0000, 0xAF},
    {0x0B8A, 0x0000, 0x0000, 0xB0},
    {0x0B8E, 0x0000, 0x0000, 0xB1},
    {0x0B8F, 0x0000, 0x0000, 0xB2},
    {0x0B90, 0x0000, 0x0000, 0xB3},
    {0x0B92, 0x0000, 0x0000, 0xB4},
    {0x0B93, 0x0000, 0x0000, 0xB5},
    {0x0B94, 0x0000, 0x0000, 0xB6},
    {0x0B95, 0x0000, 0x0000, 0xB8},
    {0x0B95, 0x0B82, 0x0000, 0xEC},
    {0x0B95, 0x0BC1, 0x0000, 0xCC},
    {0x0B95, 0x0BC2, 0x0000, 0xDC},
    {0x0B99, 0x0000, 0x0000, 0xB9},
    {0x0B99, 0x0B82, 0x0000, 0xED},
    {0x0B99, 0x0BC1, 0x0000, 0x99},
    {0x0B99, 0x0BC2, 0x0000, 0x9B},
    {0x0B9A, 0x0000, 0x0000, 0xBA},
    {0x0B9A, 0x0B82, 0x0000, 0xEE},
    {0x0B9A, 0x0BC1, 0x0000, 0xCD},
    {0x0B9A, 0x0BC2, 0x0000, 0xDD},
    {0x0B9C, 0x0000, 0x0000, 0x83},
    {0x0B9C, 0x0B82, 0x0000, 0x88},
    {0x0B9E, 0x0000, 0x0000, 0xBB},
    {0x0B9E, 0x0B82, 0x0000, 0xEF},
    {0x0B9E, 0x0BC1, 0x0000, 0x9A},
    {0x0B9E, 0x0BC2, 0x0000, 0x9C},
    {0x0B9F, 0x0000, 0x0000, 0xBC},
    {0x0B9F, 0x0B82, 0x0000, 0xF0},
    {0x0B9F, 0x0BBF, 0x0000, 0xCA},
    {0x0B9F, 0x0BC0, 0x0000, 0xCB},
    {0x0B9F, 0x0BC1, 0x0000, 0xCE},
    {0x0B9F, 0x0BC2, 0x0000, 0xDE},
    {0x0BA3, 0x0000, 0x0000, 0xBD},
    {0x0BA3, 0x0B82, 0x0000, 0xF1},
    {0x0BA3, 0x0BC1, 0x0000, 0xCF},
    {0x0BA3, 0x0BC2, 0x0000, 0xDF},
    {0x0BA4, 0x0000, 0x0000, 0xBE},
    // 0xF2 belongs to consonant 0x0BA4 (it sits between the 0x0BA3 and 0x0BA8
    // forms, like 0xBE/0xD0/0xE0); this row used to be keyed on the
    // unassigned code point 0x0BA1.
    {0x0BA4, 0x0B82, 0x0000, 0xF2},
    {0x0BA4, 0x0BC1, 0x0000, 0xD0},
    {0x0BA4, 0x0BC2, 0x0000, 0xE0},
    {0x0BA8, 0x0000, 0x0000, 0xBF},
    {0x0BA8, 0x0B82, 0x0000, 0xF3},
    {0x0BA8, 0x0BC1, 0x0000, 0xD1},
    {0x0BA8, 0x0BC2, 0x0000, 0xE1},
    {0x0BA9, 0x0000, 0x0000, 0xC9},
    {0x0BA9, 0x0B82, 0x0000, 0xFD},
    {0x0BA9, 0x0BC1, 0x0000, 0xDB},
    {0x0BA9, 0x0BC2, 0x0000, 0xEB},
    {0x0BAA, 0x0000, 0x0000, 0xC0},
    {0x0BAA, 0x0B82, 0x0000, 0xF4},
    {0x0BAA, 0x0BC1, 0x0000, 0xD2},
    {0x0BAA, 0x0BC2, 0x0000, 0xE2},
    {0x0BAE, 0x0000, 0x0000, 0xC1},
    {0x0BAE, 0x0B82, 0x0000, 0xF5},
    {0x0BAE, 0x0BC1, 0x0000, 0xD3},
    {0x0BAE, 0x0BC2, 0x0000, 0xE3},
    {0x0BAF, 0x0000, 0x0000, 0xC2},
    {0x0BAF, 0x0B82, 0x0000, 0xF6},
    {0x0BAF, 0x0BC1, 0x0000, 0xD4},
    {0x0BAF, 0x0BC2, 0x0000, 0xE4},
    {0x0BB0, 0x0000, 0x0000, 0xC3},
    {0x0BB0, 0x0B82, 0x0000, 0xF7},
    {0x0BB0, 0x0BC1, 0x0000, 0xD5},
    {0x0BB0, 0x0BC2, 0x0000, 0xE5},
    {0x0BB1, 0x0000, 0x0000, 0xC8},
    {0x0BB1, 0x0B82, 0x0000, 0xFC},
    {0x0BB1, 0x0BC1, 0x0000, 0xDA},
    {0x0BB1, 0x0BC2, 0x0000, 0xEA},
    {0x0BB2, 0x0000, 0x0000, 0xC4},
    {0x0BB2, 0x0B82, 0x0000, 0xF8},
    {0x0BB2, 0x0BC1, 0x0000, 0xD6},
    {0x0BB2, 0x0BC2, 0x0000, 0xE6},
    {0x0BB3, 0x0000, 0x0000, 0xC7},
    {0x0BB3, 0x0B82, 0x0000, 0xFB},
    {0x0BB3, 0x0BC1, 0x0000, 0xD9},
    {0x0BB3, 0x0BC2, 0x0000, 0xE9},
    {0x0BB4, 0x0000, 0x0000, 0xC6},
    {0x0BB4, 0x0B82, 0x0000, 0xFA},
    {0x0BB4, 0x0BC1, 0x0000, 0xD8},
    {0x0BB4, 0x0BC2, 0x0000, 0xE8},
    {0x0BB5, 0x0000, 0x0000, 0xC5},
    {0x0BB5, 0x0B82, 0x0000, 0xF9},
    {0x0BB5, 0x0BC1, 0x0000, 0xD7},
    {0x0BB5, 0x0BC2, 0x0000, 0xE7},
    {0x0BB7, 0x0000, 0x0000, 0x84},
    {0x0BB7, 0x0B82, 0x0000, 0x89},
    {0x0BB8, 0x0000, 0x0000, 0x85},
    {0x0BB8, 0x0B82, 0x0000, 0x8A},
    {0x0BB9, 0x0000, 0x0000, 0x86},
    {0x0BB9, 0x0B82, 0x0000, 0x8B},
    {0x0BBE, 0x0000, 0x0000, 0xA1},
    {0x0BBF, 0x0000, 0x0000, 0xA2},
    {0x0BC0, 0x0000, 0x0000, 0xA3},
    {0x0BC1, 0x0000, 0x0000, 0xA4},
    {0x0BC2, 0x0000, 0x0000, 0xA5},
    {0x0BC6, 0x0000, 0x0000, 0xA6},
    {0x0BC7, 0x0000, 0x0000, 0xA7},
    {0x0BC8, 0x0000, 0x0000, 0xA8},
    {0x0BCC, 0x0000, 0x0000, 0xAA},
    {0x0BE6, 0x0000, 0x0000, 0x80},
    {0x0BE7, 0x0000, 0x0000, 0x81},
    {0x0BE7, 0x0BB7, 0x0000, 0x87},
    {0x0BE7, 0x0BB7, 0x0B82, 0x8C},
    {0x0BE8, 0x0000, 0x0000, 0x8D},
    {0x0BE9, 0x0000, 0x0000, 0x8E},
    {0x0BEA, 0x0000, 0x0000, 0x8F},
    {0x0BEB, 0x0000, 0x0000, 0x90},
    {0x0BEC, 0x0000, 0x0000, 0x95},
    {0x0BED, 0x0000, 0x0000, 0x96},
    {0x0BEE, 0x0000, 0x0000, 0x97},
    {0x0BEF, 0x0000, 0x0000, 0x98},
    {0x0BF0, 0x0000, 0x0000, 0x9D},
    {0x0BF1, 0x0000, 0x0000, 0x9E},
    {0x0BF2, 0x0000, 0x0000, 0x9F},
    {0x2018, 0x0000, 0x0000, 0x91},
    {0x2019, 0x0000, 0x0000, 0x92},
    {0x201C, 0x0000, 0x0000, 0x93},
    // 0x94 is the closing double quote (U+201D). It used to repeat the
    // 0x201C key of the row above, which made it a duplicate search key.
    {0x201D, 0x0000, 0x0000, 0x94}
};
// Index of the last row of UnToTs, derived from the table so it cannot drift
// out of sync when rows are added or removed.
static const int UnToTsLast = int(sizeof(UnToTs) / sizeof(UnToTs[0])) - 1;
// TSCII -> Unicode lookup table.
//
// Row N describes TSCII byte 0x80 + N and covers 0x80..0xFD. Each row holds
// up to three UTF-16 code units; unused trailing positions are 0x0000, and an
// all-zero row marks a byte with no mapping.
static const ushort TsToUn [][3] = {
    // Starting at 0x80
    {0x0BE6, 0x0000, 0x0000}, // 0x80
    {0x0BE7, 0x0000, 0x0000},
    {0x0000, 0x0000, 0x0000}, // unknown
    {0x0B9C, 0x0000, 0x0000},
    {0x0BB7, 0x0000, 0x0000},
    {0x0BB8, 0x0000, 0x0000},
    {0x0BB9, 0x0000, 0x0000},
    {0x0BE7, 0x0BB7, 0x0000},
    {0x0B9C, 0x0B82, 0x0000},
    {0x0BB7, 0x0B82, 0x0000},
    {0x0BB8, 0x0B82, 0x0000},
    {0x0BB9, 0x0B82, 0x0000},
    {0x0BE7, 0x0BB7, 0x0B82},
    {0x0BE8, 0x0000, 0x0000},
    {0x0BE9, 0x0000, 0x0000},
    {0x0BEA, 0x0000, 0x0000},
    {0x0BEB, 0x0000, 0x0000}, // 0x90
    {0x2018, 0x0000, 0x0000},
    {0x2019, 0x0000, 0x0000},
    {0x201C, 0x0000, 0x0000},
    {0x201D, 0x0000, 0x0000}, // 0x94: closing double quote, was a second 0x201C
    {0x0BEC, 0x0000, 0x0000},
    {0x0BED, 0x0000, 0x0000},
    {0x0BEE, 0x0000, 0x0000},
    {0x0BEF, 0x0000, 0x0000},
    {0x0B99, 0x0BC1, 0x0000},
    {0x0B9E, 0x0BC1, 0x0000},
    {0x0B99, 0x0BC2, 0x0000},
    {0x0B9E, 0x0BC2, 0x0000},
    {0x0BF0, 0x0000, 0x0000},
    {0x0BF1, 0x0000, 0x0000},
    {0x0BF2, 0x0000, 0x0000},
    {0x00A0, 0x0000, 0x0000}, // 0xA0
    {0x0BBE, 0x0000, 0x0000},
    {0x0BBF, 0x0000, 0x0000},
    {0x0BC0, 0x0000, 0x0000},
    {0x0BC1, 0x0000, 0x0000},
    {0x0BC2, 0x0000, 0x0000},
    {0x0BC6, 0x0000, 0x0000},
    {0x0BC7, 0x0000, 0x0000},
    {0x0BC8, 0x0000, 0x0000},
    {0x00A9, 0x0000, 0x0000},
    {0x0BCC, 0x0000, 0x0000},
    {0x0B85, 0x0000, 0x0000},
    {0x0B86, 0x0000, 0x0000},
    {0x0B87, 0x0000, 0x0000},
    {0x0B88, 0x0000, 0x0000},
    {0x0B89, 0x0000, 0x0000},
    {0x0B8A, 0x0000, 0x0000}, // 0xB0
    {0x0B8E, 0x0000, 0x0000},
    {0x0B8F, 0x0000, 0x0000},
    {0x0B90, 0x0000, 0x0000},
    {0x0B92, 0x0000, 0x0000},
    {0x0B93, 0x0000, 0x0000},
    {0x0B94, 0x0000, 0x0000},
    {0x0B83, 0x0000, 0x0000},
    {0x0B95, 0x0000, 0x0000},
    {0x0B99, 0x0000, 0x0000},
    {0x0B9A, 0x0000, 0x0000},
    {0x0B9E, 0x0000, 0x0000},
    {0x0B9F, 0x0000, 0x0000},
    {0x0BA3, 0x0000, 0x0000},
    {0x0BA4, 0x0000, 0x0000},
    {0x0BA8, 0x0000, 0x0000},
    {0x0BAA, 0x0000, 0x0000}, // 0xC0
    {0x0BAE, 0x0000, 0x0000},
    {0x0BAF, 0x0000, 0x0000},
    {0x0BB0, 0x0000, 0x0000},
    {0x0BB2, 0x0000, 0x0000},
    {0x0BB5, 0x0000, 0x0000},
    {0x0BB4, 0x0000, 0x0000},
    {0x0BB3, 0x0000, 0x0000},
    {0x0BB1, 0x0000, 0x0000},
    {0x0BA9, 0x0000, 0x0000},
    {0x0B9F, 0x0BBF, 0x0000},
    {0x0B9F, 0x0BC0, 0x0000},
    {0x0B95, 0x0BC1, 0x0000},
    {0x0B9A, 0x0BC1, 0x0000},
    {0x0B9F, 0x0BC1, 0x0000},
    {0x0BA3, 0x0BC1, 0x0000},
    {0x0BA4, 0x0BC1, 0x0000}, // 0xD0
    {0x0BA8, 0x0BC1, 0x0000},
    {0x0BAA, 0x0BC1, 0x0000},
    {0x0BAE, 0x0BC1, 0x0000},
    {0x0BAF, 0x0BC1, 0x0000},
    {0x0BB0, 0x0BC1, 0x0000},
    {0x0BB2, 0x0BC1, 0x0000},
    {0x0BB5, 0x0BC1, 0x0000},
    {0x0BB4, 0x0BC1, 0x0000},
    {0x0BB3, 0x0BC1, 0x0000},
    {0x0BB1, 0x0BC1, 0x0000},
    {0x0BA9, 0x0BC1, 0x0000},
    {0x0B95, 0x0BC2, 0x0000},
    {0x0B9A, 0x0BC2, 0x0000},
    {0x0B9F, 0x0BC2, 0x0000},
    {0x0BA3, 0x0BC2, 0x0000},
    {0x0BA4, 0x0BC2, 0x0000}, // 0xE0
    {0x0BA8, 0x0BC2, 0x0000},
    {0x0BAA, 0x0BC2, 0x0000},
    {0x0BAE, 0x0BC2, 0x0000},
    {0x0BAF, 0x0BC2, 0x0000},
    {0x0BB0, 0x0BC2, 0x0000},
    {0x0BB2, 0x0BC2, 0x0000},
    {0x0BB5, 0x0BC2, 0x0000},
    {0x0BB4, 0x0BC2, 0x0000},
    {0x0BB3, 0x0BC2, 0x0000},
    {0x0BB1, 0x0BC2, 0x0000},
    {0x0BA9, 0x0BC2, 0x0000},
    {0x0B95, 0x0B82, 0x0000},
    {0x0B99, 0x0B82, 0x0000},
    {0x0B9A, 0x0B82, 0x0000},
    {0x0B9E, 0x0B82, 0x0000},
    {0x0B9F, 0x0B82, 0x0000}, // 0xF0
    {0x0BA3, 0x0B82, 0x0000},
    {0x0BA4, 0x0B82, 0x0000}, // 0xF2: consonant 0x0BA4, was the unassigned 0x0BA1
    {0x0BA8, 0x0B82, 0x0000},
    {0x0BAA, 0x0B82, 0x0000},
    {0x0BAE, 0x0B82, 0x0000},
    {0x0BAF, 0x0B82, 0x0000},
    {0x0BB0, 0x0B82, 0x0000},
    {0x0BB2, 0x0B82, 0x0000},
    {0x0BB5, 0x0B82, 0x0000},
    {0x0BB4, 0x0B82, 0x0000},
    {0x0BB3, 0x0B82, 0x0000},
    {0x0BB1, 0x0B82, 0x0000},
    {0x0BA9, 0x0B82, 0x0000}  // 0xFD
};
// Compares the first `len` elements of `s1` and `s2` element by element.
// Returns 0 when they are all equal; otherwise returns the difference
// s1[k] - s2[k] at the first position k where they differ (negative when s1
// sorts first, positive when s2 does).
static int cmp(const ushort *s1, const ushort *s2, size_t len)
{
    for (size_t idx = 0; idx < len; ++idx) {
        const int delta = int(s1[idx]) - int(s2[idx]);
        if (delta != 0)
            return delta;
    }
    return 0;
}
// Returns the TSCII byte that encodes the code unit sequence (u1, u2, u3),
// or 0 when the sequence is not present in UnToTs. Callers pass 0 for the
// positions they do not use.
static unsigned char qt_UnicodeToTSCII(ushort u1, ushort u2, ushort u3)
{
    const ushort key[3] = { u1, u2, u3 };

    // Binary search over the closed row range [lo, hi] of the sorted table.
    int lo = 0;
    int hi = UnToTsLast;
    while (lo <= hi) {
        const int mid = (lo + hi) / 2;
        const int order = cmp(UnToTs[mid], key, 3);
        if (order < 0) {
            // Row sorts before the key: continue in the upper half.
            lo = mid + 1;
        } else if (order > 0) {
            // Row sorts after the key: continue in the lower half.
            hi = mid - 1;
        } else {
            // Exact match; the fourth column is the TSCII byte.
            return UnToTs[mid][3];
        }
    }
    return 0;
}
// Copies the three table entries for TSCII byte `code` into s[0..2] and
// returns the number of leading entries that are in use, i.e. one past the
// position of the last non-zero entry (0 when the whole row is zero).
// The row is selected with `code & 0x7f`, so `code` is expected to lie in the
// range covered by TsToUn.
static unsigned int qt_TSCIIToUnicode(uint code, uint *s)
{
    const ushort *row = TsToUn[code & 0x7f];
    int used = 0;
    for (int k = 0; k < 3; ++k) {
        s[k] = row[k];
        if (row[k] != 0)
            used = k + 1;
    }
    return used;
}
QT_END_NAMESPACE
#endif // QT_NO_CODECS