blob: 2e917ff798f4a39ddab9290ff2cb3375679737e3 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
/*
* $Id: Iconv390TransService.cpp 568078 2007-08-21 11:43:25Z amassari $
*/
// ---------------------------------------------------------------------------
// Includes
// ---------------------------------------------------------------------------
#include "Iconv390TransService.hpp"
#include <xercesc/util/XMLUniDefs.hpp>
#include <xercesc/util/XMLUni.hpp>
#include <xercesc/util/regx/XMLUniCharacter.hpp>
#include <xercesc/framework/MemoryManager.hpp>
#include <wchar.h>
#include <string.h>
#include <stdlib.h>
#include <stdio.h>
#ifdef OS390BATCH
#include <unistd.h>
#endif
#include <ctype.h>
XERCES_CPP_NAMESPACE_BEGIN
//
// Cannot use the OS/390 c/c++ towupper and towlower functions in the
// Unicode environment. We will use mytowupper and mytowlower here.
//
#undef towupper
#undef towlower
#define towupper mytowupper
#define towlower mytowlower
// ---------------------------------------------------------------------------
// Local, const data
// ---------------------------------------------------------------------------
static const int gTempBuffArraySize = 1024;
static const XMLCh gMyServiceId[] =
{
chLatin_I, chLatin_C, chLatin_o, chLatin_n, chLatin_v, chNull
};
// ---------------------------------------------------------------------------
// gUnicodeToIBM037XlatTable
// This is the translation table for Unicode to ibm-037. This table
// contains 255 entries.
// ---------------------------------------------------------------------------
static const XMLByte gUnicodeToIBM037XlatTable[256] =
{
0x00, 0x01, 0x02, 0x03, 0x37, 0x2D, 0x2E, 0x2F
, 0x16, 0x05, 0x25, 0x0B, 0x0C, 0x0D, 0x0E, 0x0F
, 0x10, 0x11, 0x12, 0x13, 0x3C, 0x3D, 0x32, 0x26
, 0x18, 0x19, 0x3F, 0x27, 0x1C, 0x1D, 0x1E, 0x1F
, 0x40, 0x5A, 0x7F, 0x7B, 0x5B, 0x6C, 0x50, 0x7D
, 0x4D, 0x5D, 0x5C, 0x4E, 0x6B, 0x60, 0x4B, 0x61
, 0xF0, 0xF1, 0xF2, 0xF3, 0xF4, 0xF5, 0xF6, 0xF7
, 0xF8, 0xF9, 0x7A, 0x5E, 0x4C, 0x7E, 0x6E, 0x6F
, 0x7C, 0xC1, 0xC2, 0xC3, 0xC4, 0xC5, 0xC6, 0xC7
, 0xC8, 0xC9, 0xD1, 0xD2, 0xD3, 0xD4, 0xD5, 0xD6
, 0xD7, 0xD8, 0xD9, 0xE2, 0xE3, 0xE4, 0xE5, 0xE6
, 0xE7, 0xE8, 0xE9, 0xBA, 0xE0, 0xBB, 0xB0, 0x6D
, 0x79, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87
, 0x88, 0x89, 0x91, 0x92, 0x93, 0x94, 0x95, 0x96
, 0x97, 0x98, 0x99, 0xA2, 0xA3, 0xA4, 0xA5, 0xA6
, 0xA7, 0xA8, 0xA9, 0xC0, 0x4F, 0xD0, 0xA1, 0x07
, 0x20, 0x21, 0x22, 0x23, 0x24, 0x15, 0x06, 0x17
, 0x28, 0x29, 0x2A, 0x2B, 0x2C, 0x09, 0x0A, 0x1B
, 0x30, 0x31, 0x1A, 0x33, 0x34, 0x35, 0x36, 0x08
, 0x38, 0x39, 0x3A, 0x3B, 0x04, 0x14, 0x3E, 0xFF
, 0x41, 0xAA, 0x4A, 0xB1, 0x9F, 0xB2, 0x6A, 0xB5
, 0xBD, 0xB4, 0x9A, 0x8A, 0x5F, 0xCA, 0xAF, 0xBC
, 0x90, 0x8F, 0xEA, 0xFA, 0xBE, 0xA0, 0xB6, 0xB3
, 0x9D, 0xDA, 0x9B, 0x8B, 0xB7, 0xB8, 0xB9, 0xAB
, 0x64, 0x65, 0x62, 0x66, 0x63, 0x67, 0x9E, 0x68
, 0x74, 0x71, 0x72, 0x73, 0x78, 0x75, 0x76, 0x77
, 0xAC, 0x69, 0xED, 0xEE, 0xEB, 0xEF, 0xEC, 0xBF
, 0x80, 0xFD, 0xFE, 0xFB, 0xFC, 0xAD, 0xAE, 0x59
, 0x44, 0x45, 0x42, 0x46, 0x43, 0x47, 0x9C, 0x48
, 0x54, 0x51, 0x52, 0x53, 0x58, 0x55, 0x56, 0x57
, 0x8C, 0x49, 0xCD, 0xCE, 0xCB, 0xCF, 0xCC, 0xE1
, 0x70, 0xDD, 0xDE, 0xDB, 0xDC, 0x8D, 0x8E, 0xDF
};
iconvconverter * converterList;
XMLMutex converterListMutex;
iconvconverter * addConverter(const char* const EncodingName
,XMLTransService::Codes& resValue)
{
XMLMutexLock lockConverterlist(&converterListMutex);
iconvconverter *tconv=converterList;
while ( (tconv) &&
(strcmp(tconv->name,EncodingName)) )
tconv = tconv->nextconverter;
if (tconv) {
tconv->usecount++;
}
else {
tconv = new iconvconverter;
strcpy(tconv->name,EncodingName);
tconv->usecount=1;
tconv->fIconv390Descriptor = iconv_open("UCS-2",EncodingName);
if (tconv->fIconv390Descriptor == (iconv_t)(-1)) {
resValue = XMLTransService::UnsupportedEncoding;
delete tconv;
return 0;
}
tconv->nextconverter = converterList;
converterList = tconv;
}
return tconv;
}
void removeConverter(iconvconverter* const converter)
{
iconvconverter *pconv,*tconv;
tconv = 0;
if (converter) {
XMLMutexLock lockConverterlist(&converterListMutex);
if (--converter->usecount==0) {
tconv = converterList;
pconv = (iconvconverter*)&converterList;
while ( (tconv) && (tconv!=converter) ) {
pconv=tconv;
tconv=tconv->nextconverter;
}
pconv->nextconverter=tconv->nextconverter;
}
}
if (tconv) {
iconv_close(tconv->fIconv390Descriptor);
delete tconv;
}
}
// ---------------------------------------------------------------------------
// Local methods
// ---------------------------------------------------------------------------
static unsigned int getWideCharLength(const XMLCh* const src)
{
if (!src)
return 0;
unsigned int len = 0;
const XMLCh* pTmp = src;
while (*pTmp++)
len++;
return len;
}
// ---------------------------------------------------------------------------
// Iconv390TransService: Constructors and Destructor
// ---------------------------------------------------------------------------
Iconv390TransService::Iconv390TransService()
{
}
Iconv390TransService::~Iconv390TransService()
{
}
// ---------------------------------------------------------------------------
// Iconv390TransService: The virtual transcoding service API
// ---------------------------------------------------------------------------
int Iconv390TransService::compareIString( const XMLCh* const comp1
, const XMLCh* const comp2)
{
const XMLCh* cptr1 = comp1;
const XMLCh* cptr2 = comp2;
while ( (*cptr1 != 0) && (*cptr2 != 0) )
{
wint_t wch1 = towupper(*cptr1);
wint_t wch2 = towupper(*cptr2);
if (wch1 != wch2)
break;
cptr1++;
cptr2++;
}
return (int) ( towupper(*cptr1) - towupper(*cptr2) );
}
int Iconv390TransService::compareNIString( const XMLCh* const comp1
, const XMLCh* const comp2
, const unsigned int maxChars)
{
unsigned int n = 0;
const XMLCh* cptr1 = comp1;
const XMLCh* cptr2 = comp2;
while (true && maxChars)
{
wint_t wch1 = towupper(*cptr1);
wint_t wch2 = towupper(*cptr2);
if (wch1 != wch2)
return (int) (wch1 - wch2);
// If either ended, then both ended, so equal
if (!*cptr1 || !*cptr2)
break;
cptr1++;
cptr2++;
// Bump the count of chars done. If it equals the count then we
// are equal for the requested count, so break out and return
// equal.
n++;
if (n == maxChars)
break;
}
return 0;
}
const XMLCh* Iconv390TransService::getId() const
{
return gMyServiceId;
}
bool Iconv390TransService::isSpace(const XMLCh toCheck) const
{
unsigned short chartype = XMLUniCharacter::getType(toCheck);
if ( (chartype == XMLUniCharacter::SPACE_SEPARATOR) ||
(chartype == XMLUniCharacter::LINE_SEPARATOR) ||
(chartype == XMLUniCharacter::PARAGRAPH_SEPARATOR) )
return true;
else
return false;
}
XMLLCPTranscoder* Iconv390TransService::makeNewLCPTranscoder()
{
XMLTransService::Codes resValue;
// native MVS default code page is IBM-037
iconvconverter *tconv=addConverter("IBM-037",resValue);
if (tconv == 0) {
return 0;
}
return new Iconv390LCPTranscoder(tconv);
}
bool Iconv390TransService::supportsSrcOfs() const
{
return true;
}
// ---------------------------------------------------------------------------
// Iconv390TransService: The protected virtual transcoding service API
// ---------------------------------------------------------------------------
XMLTranscoder*
Iconv390TransService::makeNewXMLTranscoder(const XMLCh* const encodingName
, XMLTransService::Codes& resValue
, const unsigned int
, MemoryManager* const)
{
// This is a minimalist transcoding service, that only supports a local
// default transcoder. All named encodings return zero as a failure,
// which means that only the intrinsic encodings supported by the parser
// itself will work for XML data.
//
resValue = XMLTransService::UnsupportedEncoding;
return 0;
}
void Iconv390TransService::upperCase(XMLCh* const toUpperCase) const
{
XMLCh* outPtr = toUpperCase;
while (*outPtr != 0) {
if ((*outPtr >= 0x61) && (*outPtr <= 0x7A))
*outPtr = *outPtr - 0x20;
outPtr++;
}
}
void Iconv390TransService::lowerCase(XMLCh* const toLowerCase) const
{
XMLCh* outPtr = toLowerCase;
while (*outPtr != 0) {
if ((*outPtr >= 0x41) && (*outPtr <= 0x5A))
*outPtr = *outPtr + 0x20;
outPtr++;
}
}
// ---------------------------------------------------------------------------
unsigned int Iconv390LCPTranscoder::calcRequiredSize(const char* const srcText
, MemoryManager* const manager)
{
if (!srcText)
return 0;
unsigned charLen = ::mblen(srcText, MB_CUR_MAX);
if (charLen == -1)
return 0;
else if (charLen != 0)
charLen = strlen(srcText)/charLen;
if (charLen == -1)
return 0;
return charLen;
}
unsigned int Iconv390LCPTranscoder::calcRequiredSize(const XMLCh* const srcText
, MemoryManager* const manager)
{
if (!srcText)
return 0;
unsigned int wLent = getWideCharLength(srcText);
wchar_t tmpWideCharArr[gTempBuffArraySize];
wchar_t* allocatedArray = 0;
wchar_t* wideCharBuf = 0;
if (wLent >= gTempBuffArraySize)
wideCharBuf = allocatedArray = (wchar_t*) manager->allocate
(
(wLent + 1) * sizeof(wchar_t)
);//new wchar_t[wLent + 1];
else
wideCharBuf = tmpWideCharArr;
for (unsigned int i = 0; i < wLent; i++)
{
wideCharBuf[i] = srcText[i];
}
wideCharBuf[wLent] = 0x00;
const unsigned int retVal = ::wcstombs(NULL, wideCharBuf, 0);
manager->deallocate(allocatedArray);//delete [] allocatedArray;
if (retVal == -1)
return 0;
return retVal;
}
char* Iconv390LCPTranscoder::transcode(const XMLCh* const toTranscode)
{
if (!toTranscode)
return 0;
char* retVal = 0;
if (*toTranscode)
{
unsigned int wLent = getWideCharLength(toTranscode);
//
// Translate the input from Unicode XMLCh format into
// ibm-037 char format via the lookup table.
//
retVal = new char[wLent + 1];
const XMLCh *srcPtr = toTranscode;
char *outPtr = retVal;
while (*srcPtr != 0)
*outPtr++ = gUnicodeToIBM037XlatTable[*srcPtr++];
*outPtr=0;
}
else
{
retVal = new char[1];
retVal[0] = 0;
}
return retVal;
}
char* Iconv390LCPTranscoder::transcode(const XMLCh* const toTranscode,
MemoryManager* const manager)
{
if (!toTranscode)
return 0;
char* retVal = 0;
if (*toTranscode)
{
unsigned int wLent = getWideCharLength(toTranscode);
//
// Translate the input from Unicode XMLCh format into
// ibm-037 char format via the lookup table.
//
retVal = (char*) manager->allocate((wLent + 1) * sizeof(char));//new char[wLent + 1];
const XMLCh *srcPtr = toTranscode;
char *outPtr = retVal;
while (*srcPtr != 0)
*outPtr++ = gUnicodeToIBM037XlatTable[*srcPtr++];
*outPtr=0;
}
else
{
retVal = (char*) manager->allocate(sizeof(char));//new char[1];
retVal[0] = 0;
}
return retVal;
}
bool Iconv390LCPTranscoder::transcode( const XMLCh* const toTranscode
, char* const toFill
, const unsigned int maxBytes
, MemoryManager* const manager)
{
// Watch for a couple of pyscho corner cases
if (!toTranscode || !maxBytes)
{
toFill[0] = 0;
return true;
}
if (!*toTranscode)
{
toFill[0] = 0;
return true;
}
const XMLCh *srcPtr = toTranscode;
char *outPtr = toFill;
int bytectr = maxBytes;
while (bytectr-- && *srcPtr)
*outPtr++ = gUnicodeToIBM037XlatTable[*srcPtr++];
*outPtr=0;
return true;
}
XMLCh* Iconv390LCPTranscoder::transcode(const char* const toTranscode)
{
if (!toTranscode)
return 0;
XMLCh* retVal = 0;
if (*toTranscode)
{
const unsigned int len = calcRequiredSize(toTranscode);
if (len == 0)
{
retVal = new XMLCh[1];
retVal[0] = 0;
return retVal;
}
wchar_t tmpWideCharArr[gTempBuffArraySize];
wchar_t* allocatedArray = 0;
wchar_t* wideCharBuf = 0;
retVal = new XMLCh[len + 1];
size_t retCode;
char *tmpInPtr = (char*) toTranscode;
char *tmpOutPtr = (char*) retVal;
size_t inByteLeft = len;
size_t outByteLeft = len*2;
{
XMLMutexLock lockConverter(&converter->fMutex);
retCode = iconv(converter->fIconv390Descriptor, &tmpInPtr, &inByteLeft, &tmpOutPtr, &outByteLeft);
}
if (retCode == -1) {
delete [] retVal;
return 0;
}
retVal[len] = 0x00;
delete [] allocatedArray;
}
else
{
retVal = new XMLCh[1];
retVal[0] = 0;
}
return retVal;
}
XMLCh* Iconv390LCPTranscoder::transcode(const char* const toTranscode,
MemoryManager* const manager)
{
if (!toTranscode)
return 0;
XMLCh* retVal = 0;
if (*toTranscode)
{
const unsigned int len = calcRequiredSize(toTranscode, manager);
if (len == 0)
{
retVal = (XMLCh*) manager->allocate(sizeof(XMLCh));//new XMLCh[1];
retVal[0] = 0;
return retVal;
}
wchar_t tmpWideCharArr[gTempBuffArraySize];
wchar_t* allocatedArray = 0;
wchar_t* wideCharBuf = 0;
retVal = (XMLCh*) manager->allocate((len + 1) * sizeof(XMLCh));//new XMLCh[len + 1];
size_t retCode;
char *tmpInPtr = (char*) toTranscode;
char *tmpOutPtr = (char*) retVal;
size_t inByteLeft = len;
size_t outByteLeft = len*2;
{
XMLMutexLock lockConverter(&converter->fMutex);
retCode = iconv(converter->fIconv390Descriptor, &tmpInPtr, &inByteLeft, &tmpOutPtr, &outByteLeft);
}
if (retCode == -1) {
manager->deallocate(retVal);//delete [] retVal;
return 0;
}
retVal[len] = 0x00;
manager->deallocate(allocatedArray);//delete [] allocatedArray;
}
else
{
retVal = (XMLCh*) manager->allocate(sizeof(XMLCh));//new XMLCh[1];
retVal[0] = 0;
}
return retVal;
}
bool Iconv390LCPTranscoder::transcode( const char* const toTranscode
, XMLCh* const toFill
, const unsigned int maxChars
, MemoryManager* const manager)
{
// Check for a couple of psycho corner cases
if (!toTranscode || !maxChars)
{
toFill[0] = 0;
return true;
}
if (!*toTranscode)
{
toFill[0] = 0;
return true;
}
size_t retCode;
char *tmpInPtr = (char*) toTranscode;
char *tmpOutPtr = (char*) toFill;
size_t inByteLeft = maxChars;
size_t outByteLeft = maxChars*2;
{
XMLMutexLock lockConverter(&converter->fMutex);
retCode = iconv(converter->fIconv390Descriptor, &tmpInPtr, &inByteLeft, &tmpOutPtr, &outByteLeft);
}
if ( (retCode == -1) && (outByteLeft!=0) ) {
return false;
}
toFill[maxChars] = 0x00;
return true;
}
// ---------------------------------------------------------------------------
// Iconv390LCPTranscoder: Constructors and Destructor
// ---------------------------------------------------------------------------
Iconv390LCPTranscoder::Iconv390LCPTranscoder()
{
}
Iconv390LCPTranscoder::Iconv390LCPTranscoder(iconvconverter_t* const toAdopt) :
converter (toAdopt)
{
}
Iconv390LCPTranscoder::~Iconv390LCPTranscoder()
{
removeConverter(converter);
converter=0;
}
XERCES_CPP_NAMESPACE_END