|
Packit |
1c1d7e |
/****************************************************************************
|
|
Packit |
1c1d7e |
**
|
|
Packit |
1c1d7e |
**
|
|
Packit |
1c1d7e |
** Implementation of QEucCodec class
|
|
Packit |
1c1d7e |
**
|
|
Packit |
1c1d7e |
** Created : 981015
|
|
Packit |
1c1d7e |
**
|
|
Packit |
1c1d7e |
** Copyright (C)1998-2000 Trolltech AS. All rights reserved.
|
|
Packit |
1c1d7e |
**
|
|
Packit |
1c1d7e |
** This file is part of the tools module of the Qt GUI Toolkit.
|
|
Packit |
1c1d7e |
**
|
|
Packit |
1c1d7e |
** This file may be distributed under the terms of the Q Public License
|
|
Packit |
1c1d7e |
** as defined by Trolltech AS of Norway and appearing in the file
|
|
Packit |
1c1d7e |
** LICENSE.QPL included in the packaging of this file.
|
|
Packit |
1c1d7e |
**
|
|
Packit |
1c1d7e |
** This file may be distributed and/or modified under the terms of the
|
|
Packit |
1c1d7e |
** GNU General Public License version 2 as published by the Free Software
|
|
Packit |
1c1d7e |
** Foundation and appearing in the file LICENSE.GPL included in the
|
|
Packit |
1c1d7e |
** packaging of this file.
|
|
Packit |
1c1d7e |
**
|
|
Packit |
1c1d7e |
** Licensees holding valid Qt Enterprise Edition or Qt Professional Edition
|
|
Packit |
1c1d7e |
** licenses may use this file in accordance with the Qt Commercial License
|
|
Packit |
1c1d7e |
** Agreement provided with the Software.
|
|
Packit |
1c1d7e |
**
|
|
Packit |
1c1d7e |
** This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
|
|
Packit |
1c1d7e |
** WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
|
|
Packit |
1c1d7e |
**
|
|
Packit |
1c1d7e |
** See http://www.trolltech.com/pricing.html or email sales@trolltech.com for
|
|
Packit |
1c1d7e |
** information about Qt Commercial License Agreements.
|
|
Packit |
1c1d7e |
** See http://www.trolltech.com/qpl/ for QPL licensing information.
|
|
Packit |
1c1d7e |
** See http://www.trolltech.com/gpl/ for GPL licensing information.
|
|
Packit |
1c1d7e |
**
|
|
Packit |
1c1d7e |
** Contact info@trolltech.com if any conditions of this licensing are
|
|
Packit |
1c1d7e |
** not clear to you.
|
|
Packit |
1c1d7e |
**
|
|
Packit |
1c1d7e |
**********************************************************************/
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
#include "qutfcodec.h"
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
#ifndef QT_NO_TEXTCODEC
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
int QUtf8Codec::mibEnum() const
|
|
Packit |
1c1d7e |
{
|
|
Packit |
1c1d7e |
return 106;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
QCString QUtf8Codec::fromUnicode(const QString& uc, int& len_in_out) const
|
|
Packit |
1c1d7e |
{
|
|
Packit |
1c1d7e |
int l = QMIN((int)uc.length(),len_in_out);
|
|
Packit |
1c1d7e |
int rlen = l*3+1;
|
|
Packit |
1c1d7e |
QCString rstr(rlen);
|
|
Packit |
1c1d7e |
uchar* cursor = (uchar*)rstr.data();
|
|
Packit |
1c1d7e |
for (int i=0; i
|
|
Packit |
1c1d7e |
QChar ch = uc[i];
|
|
Packit |
1c1d7e |
if ( !ch.row() && ch.cell() < 0x80 ) {
|
|
Packit |
1c1d7e |
*cursor++ = ch.cell();
|
|
Packit |
1c1d7e |
} else {
|
|
Packit |
1c1d7e |
uchar b = (ch.row() << 2) | (ch.cell() >> 6);
|
|
Packit |
1c1d7e |
if ( ch.row() < 0x08 ) {
|
|
Packit |
1c1d7e |
*cursor++ = 0xc0 | b;
|
|
Packit |
1c1d7e |
} else {
|
|
Packit |
1c1d7e |
*cursor++ = 0xe0 | (ch.row() >> 4);
|
|
Packit |
1c1d7e |
*cursor++ = 0x80 | (b&0x3f);
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
*cursor++ = 0x80 | (ch.cell()&0x3f);
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
len_in_out = (int)(cursor - (uchar*)rstr.data());
|
|
Packit |
1c1d7e |
rstr.truncate(len_in_out);
|
|
Packit |
1c1d7e |
return rstr;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
const char* QUtf8Codec::name() const
|
|
Packit |
1c1d7e |
{
|
|
Packit |
1c1d7e |
return "UTF-8";
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
int QUtf8Codec::heuristicContentMatch(const char* chars, int len) const
|
|
Packit |
1c1d7e |
{
|
|
Packit |
1c1d7e |
int score = 0;
|
|
Packit |
1c1d7e |
for (int i=0; i
|
|
Packit |
1c1d7e |
uchar ch = chars[i];
|
|
Packit |
1c1d7e |
// No nulls allowed.
|
|
Packit |
1c1d7e |
if ( !ch )
|
|
Packit |
1c1d7e |
return -1;
|
|
Packit |
1c1d7e |
if ( ch < 128 ) {
|
|
Packit |
1c1d7e |
// Inconclusive
|
|
Packit |
1c1d7e |
score++;
|
|
Packit |
1c1d7e |
} else if ( (ch&0xe0) == 0xc0 ) {
|
|
Packit |
1c1d7e |
if ( i < len-1 ) {
|
|
Packit |
1c1d7e |
uchar c2 = chars[++i];
|
|
Packit |
1c1d7e |
if ( (c2&0xc0) != 0x80 )
|
|
Packit |
1c1d7e |
return -1;
|
|
Packit |
1c1d7e |
score+=3;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
} else if ( (ch&0xf0) == 0xe0 ) {
|
|
Packit |
1c1d7e |
if ( i < len-1 ) {
|
|
Packit |
1c1d7e |
uchar c2 = chars[++i];
|
|
Packit |
1c1d7e |
if ( (c2&0xc0) != 0x80 ) {
|
|
Packit |
1c1d7e |
return -1;
|
|
Packit |
1c1d7e |
#if 0
|
|
Packit |
1c1d7e |
if ( i < len-1 ) {
|
|
Packit |
1c1d7e |
uchar c3 = chars[++i];
|
|
Packit |
1c1d7e |
if ( (c3&0xc0) != 0x80 )
|
|
Packit |
1c1d7e |
return -1;
|
|
Packit |
1c1d7e |
score+=3;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
#endif
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
score+=2;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
return score;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
class QUtf8Decoder : public QTextDecoder {
|
|
Packit |
1c1d7e |
ushort uc;
|
|
Packit |
1c1d7e |
int need;
|
|
Packit |
1c1d7e |
public:
|
|
Packit |
1c1d7e |
QUtf8Decoder() : need(0)
|
|
Packit |
1c1d7e |
{
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
QString toUnicode(const char* chars, int len)
|
|
Packit |
1c1d7e |
{
|
|
Packit |
1c1d7e |
QString result;
|
|
Packit |
1c1d7e |
for (int i=0; i
|
|
Packit |
1c1d7e |
uchar ch = chars[i];
|
|
Packit |
1c1d7e |
if (need) {
|
|
Packit |
1c1d7e |
if ( (ch&0xc0) == 0x80 ) {
|
|
Packit |
1c1d7e |
uc = (uc << 6) | (ch & 0x3f);
|
|
Packit |
1c1d7e |
need--;
|
|
Packit |
1c1d7e |
if ( !need ) {
|
|
Packit |
1c1d7e |
result += QChar(uc);
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
} else {
|
|
Packit |
1c1d7e |
// error
|
|
Packit |
1c1d7e |
result += QChar::replacement;
|
|
Packit |
1c1d7e |
need = 0;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
} else {
|
|
Packit |
1c1d7e |
if ( ch < 128 ) {
|
|
Packit |
1c1d7e |
result += QChar(ch);
|
|
Packit |
1c1d7e |
} else if ( (ch&0xe0) == 0xc0 ) {
|
|
Packit |
1c1d7e |
uc = ch &0x1f;
|
|
Packit |
1c1d7e |
need = 1;
|
|
Packit |
1c1d7e |
} else if ( (ch&0xf0) == 0xe0 ) {
|
|
Packit |
1c1d7e |
uc = ch &0x0f;
|
|
Packit |
1c1d7e |
need = 2;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
return result;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
};
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
QTextDecoder* QUtf8Codec::makeDecoder() const
|
|
Packit |
1c1d7e |
{
|
|
Packit |
1c1d7e |
return new QUtf8Decoder;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
int QUtf16Codec::mibEnum() const
|
|
Packit |
1c1d7e |
{
|
|
Packit |
1c1d7e |
return 1000;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
const char* QUtf16Codec::name() const
|
|
Packit |
1c1d7e |
{
|
|
Packit |
1c1d7e |
return "ISO-10646-UCS-2";
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
int QUtf16Codec::heuristicContentMatch(const char* chars, int len) const
|
|
Packit |
1c1d7e |
{
|
|
Packit |
1c1d7e |
uchar* uchars = (uchar*)chars;
|
|
Packit |
1c1d7e |
if ( len >= 2 && ((uchars[0] == 0xff && uchars[1] == 0xfe) ||
|
|
Packit |
1c1d7e |
(uchars[1] == 0xff && uchars[0] == 0xfe)) )
|
|
Packit |
1c1d7e |
return len;
|
|
Packit |
1c1d7e |
else
|
|
Packit |
1c1d7e |
return 0;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
class QUtf16Encoder : public QTextEncoder {
|
|
Packit |
1c1d7e |
bool headerdone;
|
|
Packit |
1c1d7e |
public:
|
|
Packit |
1c1d7e |
QUtf16Encoder() : headerdone(FALSE)
|
|
Packit |
1c1d7e |
{
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
QCString fromUnicode(const QString& uc, int& len_in_out)
|
|
Packit |
1c1d7e |
{
|
|
Packit |
1c1d7e |
if ( headerdone ) {
|
|
Packit |
1c1d7e |
len_in_out = uc.length()*(int)sizeof(QChar);
|
|
Packit |
1c1d7e |
QCString d(len_in_out);
|
|
Packit |
1c1d7e |
memcpy(d.rawData(),uc.unicode(),len_in_out);
|
|
Packit |
1c1d7e |
return d;
|
|
Packit |
1c1d7e |
} else {
|
|
Packit |
1c1d7e |
headerdone = TRUE;
|
|
Packit |
1c1d7e |
len_in_out = (1+uc.length())*(int)sizeof(QChar);
|
|
Packit |
1c1d7e |
QCString d(len_in_out);
|
|
Packit |
1c1d7e |
memcpy(d.rawData(),&QChar::byteOrderMark,sizeof(QChar));
|
|
Packit |
1c1d7e |
memcpy(d.rawData()+sizeof(QChar),uc.unicode(),uc.length()*sizeof(QChar));
|
|
Packit |
1c1d7e |
return d;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
};
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
class QUtf16Decoder : public QTextDecoder {
|
|
Packit |
1c1d7e |
uchar buf;
|
|
Packit |
1c1d7e |
bool half;
|
|
Packit |
1c1d7e |
bool swap;
|
|
Packit |
1c1d7e |
bool headerdone;
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
public:
|
|
Packit |
1c1d7e |
QUtf16Decoder() : half(FALSE), swap(FALSE), headerdone(FALSE)
|
|
Packit |
1c1d7e |
{
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
QString toUnicode(const char* chars, int len)
|
|
Packit |
1c1d7e |
{
|
|
Packit |
1c1d7e |
QString r;
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
while ( len-- ) {
|
|
Packit |
1c1d7e |
if ( half ) {
|
|
Packit |
1c1d7e |
QChar ch;
|
|
Packit |
1c1d7e |
if ( swap ) {
|
|
Packit |
1c1d7e |
ch.row() = *chars++;
|
|
Packit |
1c1d7e |
ch.cell() = buf;
|
|
Packit |
1c1d7e |
} else {
|
|
Packit |
1c1d7e |
ch.row() = buf;
|
|
Packit |
1c1d7e |
ch.cell() = *chars++;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
if ( !headerdone ) {
|
|
Packit |
1c1d7e |
if ( ch == QChar::byteOrderSwapped ) {
|
|
Packit |
1c1d7e |
swap = !swap;
|
|
Packit |
1c1d7e |
} else if ( ch == QChar::byteOrderMark ) {
|
|
Packit |
1c1d7e |
// Ignore ZWNBSP
|
|
Packit |
1c1d7e |
} else {
|
|
Packit |
1c1d7e |
r += ch;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
headerdone = TRUE;
|
|
Packit |
1c1d7e |
} else
|
|
Packit |
1c1d7e |
r += ch;
|
|
Packit |
1c1d7e |
half = FALSE;
|
|
Packit |
1c1d7e |
} else {
|
|
Packit |
1c1d7e |
buf = *chars++;
|
|
Packit |
1c1d7e |
half = TRUE;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
return r;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
};
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
QTextDecoder* QUtf16Codec::makeDecoder() const
|
|
Packit |
1c1d7e |
{
|
|
Packit |
1c1d7e |
return new QUtf16Decoder;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
QTextEncoder* QUtf16Codec::makeEncoder() const
|
|
Packit |
1c1d7e |
{
|
|
Packit |
1c1d7e |
return new QUtf16Encoder;
|
|
Packit |
1c1d7e |
}
|
|
Packit |
1c1d7e |
|
|
Packit |
1c1d7e |
#endif // QT_NO_TEXTCODEC
|