Blame qtools/qutfcodec.cpp

Packit 1c1d7e
/****************************************************************************
Packit 1c1d7e
** 
Packit 1c1d7e
**
Packit 1c1d7e
** Implementation of QEucCodec class
Packit 1c1d7e
**
Packit 1c1d7e
** Created : 981015
Packit 1c1d7e
**
Packit 1c1d7e
** Copyright (C)1998-2000 Trolltech AS.  All rights reserved.
Packit 1c1d7e
**
Packit 1c1d7e
** This file is part of the tools module of the Qt GUI Toolkit.
Packit 1c1d7e
**
Packit 1c1d7e
** This file may be distributed under the terms of the Q Public License
Packit 1c1d7e
** as defined by Trolltech AS of Norway and appearing in the file
Packit 1c1d7e
** LICENSE.QPL included in the packaging of this file.
Packit 1c1d7e
**
Packit 1c1d7e
** This file may be distributed and/or modified under the terms of the
Packit 1c1d7e
** GNU General Public License version 2 as published by the Free Software
Packit 1c1d7e
** Foundation and appearing in the file LICENSE.GPL included in the
Packit 1c1d7e
** packaging of this file.
Packit 1c1d7e
**
Packit 1c1d7e
** Licensees holding valid Qt Enterprise Edition or Qt Professional Edition
Packit 1c1d7e
** licenses may use this file in accordance with the Qt Commercial License
Packit 1c1d7e
** Agreement provided with the Software.
Packit 1c1d7e
**
Packit 1c1d7e
** This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
Packit 1c1d7e
** WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
Packit 1c1d7e
**
Packit 1c1d7e
** See http://www.trolltech.com/pricing.html or email sales@trolltech.com for
Packit 1c1d7e
**   information about Qt Commercial License Agreements.
Packit 1c1d7e
** See http://www.trolltech.com/qpl/ for QPL licensing information.
Packit 1c1d7e
** See http://www.trolltech.com/gpl/ for GPL licensing information.
Packit 1c1d7e
**
Packit 1c1d7e
** Contact info@trolltech.com if any conditions of this licensing are
Packit 1c1d7e
** not clear to you.
Packit 1c1d7e
**
Packit 1c1d7e
**********************************************************************/
Packit 1c1d7e
Packit 1c1d7e
#include "qutfcodec.h"
Packit 1c1d7e
Packit 1c1d7e
#ifndef QT_NO_TEXTCODEC
Packit 1c1d7e
Packit 1c1d7e
int QUtf8Codec::mibEnum() const
Packit 1c1d7e
{
Packit 1c1d7e
    return 106;
Packit 1c1d7e
}
Packit 1c1d7e
Packit 1c1d7e
QCString QUtf8Codec::fromUnicode(const QString& uc, int& len_in_out) const
Packit 1c1d7e
{
Packit 1c1d7e
    int l = QMIN((int)uc.length(),len_in_out);
Packit 1c1d7e
    int rlen = l*3+1;
Packit 1c1d7e
    QCString rstr(rlen);
Packit 1c1d7e
    uchar* cursor = (uchar*)rstr.data();
Packit 1c1d7e
    for (int i=0; i
Packit 1c1d7e
	QChar ch = uc[i];
Packit 1c1d7e
	if ( !ch.row() && ch.cell() < 0x80 ) {
Packit 1c1d7e
	    *cursor++ = ch.cell();
Packit 1c1d7e
	} else {
Packit 1c1d7e
	    uchar b = (ch.row() << 2) | (ch.cell() >> 6);
Packit 1c1d7e
	    if ( ch.row() < 0x08 ) {
Packit 1c1d7e
		*cursor++ = 0xc0 | b;
Packit 1c1d7e
	    } else {
Packit 1c1d7e
		*cursor++ = 0xe0 | (ch.row() >> 4);
Packit 1c1d7e
		*cursor++ = 0x80 | (b&0x3f);
Packit 1c1d7e
	    }
Packit 1c1d7e
	    *cursor++ = 0x80 | (ch.cell()&0x3f);
Packit 1c1d7e
	}
Packit 1c1d7e
    }
Packit 1c1d7e
    len_in_out = (int)(cursor - (uchar*)rstr.data());
Packit 1c1d7e
    rstr.truncate(len_in_out);
Packit 1c1d7e
    return rstr;
Packit 1c1d7e
}
Packit 1c1d7e
Packit 1c1d7e
const char* QUtf8Codec::name() const
Packit 1c1d7e
{
Packit 1c1d7e
    return "UTF-8";
Packit 1c1d7e
}
Packit 1c1d7e
Packit 1c1d7e
int QUtf8Codec::heuristicContentMatch(const char* chars, int len) const
Packit 1c1d7e
{
Packit 1c1d7e
    int score = 0;
Packit 1c1d7e
    for (int i=0; i
Packit 1c1d7e
	uchar ch = chars[i];
Packit 1c1d7e
	// No nulls allowed.
Packit 1c1d7e
	if ( !ch )
Packit 1c1d7e
	    return -1;
Packit 1c1d7e
	if ( ch < 128 ) {
Packit 1c1d7e
	    // Inconclusive
Packit 1c1d7e
	    score++;
Packit 1c1d7e
	} else if ( (ch&0xe0) == 0xc0 ) {
Packit 1c1d7e
	    if ( i < len-1 ) {
Packit 1c1d7e
		uchar c2 = chars[++i];
Packit 1c1d7e
		if ( (c2&0xc0) != 0x80 )
Packit 1c1d7e
		    return -1;
Packit 1c1d7e
		score+=3;
Packit 1c1d7e
	    }
Packit 1c1d7e
	} else if ( (ch&0xf0) == 0xe0 ) {
Packit 1c1d7e
	    if ( i < len-1 ) {
Packit 1c1d7e
		uchar c2 = chars[++i];
Packit 1c1d7e
		if ( (c2&0xc0) != 0x80 ) {
Packit 1c1d7e
		    return -1;
Packit 1c1d7e
#if 0
Packit 1c1d7e
		    if ( i < len-1 ) {
Packit 1c1d7e
			uchar c3 = chars[++i];
Packit 1c1d7e
			if ( (c3&0xc0) != 0x80 )
Packit 1c1d7e
			    return -1;
Packit 1c1d7e
			score+=3;
Packit 1c1d7e
		    }
Packit 1c1d7e
#endif
Packit 1c1d7e
		}
Packit 1c1d7e
		score+=2;
Packit 1c1d7e
	    }
Packit 1c1d7e
	}
Packit 1c1d7e
    }
Packit 1c1d7e
    return score;
Packit 1c1d7e
}
Packit 1c1d7e
Packit 1c1d7e
Packit 1c1d7e
Packit 1c1d7e
Packit 1c1d7e
class QUtf8Decoder : public QTextDecoder {
Packit 1c1d7e
    ushort uc;
Packit 1c1d7e
    int need;
Packit 1c1d7e
public:
Packit 1c1d7e
    QUtf8Decoder() : need(0)
Packit 1c1d7e
    {
Packit 1c1d7e
    }
Packit 1c1d7e
Packit 1c1d7e
    QString toUnicode(const char* chars, int len)
Packit 1c1d7e
    {
Packit 1c1d7e
	QString result;
Packit 1c1d7e
	for (int i=0; i
Packit 1c1d7e
	    uchar ch = chars[i];
Packit 1c1d7e
	    if (need) {
Packit 1c1d7e
		if ( (ch&0xc0) == 0x80 ) {
Packit 1c1d7e
		    uc = (uc << 6) | (ch & 0x3f);
Packit 1c1d7e
		    need--;
Packit 1c1d7e
		    if ( !need ) {
Packit 1c1d7e
			result += QChar(uc);
Packit 1c1d7e
		    }
Packit 1c1d7e
		} else {
Packit 1c1d7e
		    // error
Packit 1c1d7e
		    result += QChar::replacement;
Packit 1c1d7e
		    need = 0;
Packit 1c1d7e
		}
Packit 1c1d7e
	    } else {
Packit 1c1d7e
		if ( ch < 128 ) {
Packit 1c1d7e
		    result += QChar(ch);
Packit 1c1d7e
		} else if ( (ch&0xe0) == 0xc0 ) {
Packit 1c1d7e
		    uc = ch &0x1f;
Packit 1c1d7e
		    need = 1;
Packit 1c1d7e
		} else if ( (ch&0xf0) == 0xe0 ) {
Packit 1c1d7e
		    uc = ch &0x0f;
Packit 1c1d7e
		    need = 2;
Packit 1c1d7e
		}
Packit 1c1d7e
	    }
Packit 1c1d7e
	}
Packit 1c1d7e
	return result;
Packit 1c1d7e
    }
Packit 1c1d7e
};
Packit 1c1d7e
Packit 1c1d7e
QTextDecoder* QUtf8Codec::makeDecoder() const
Packit 1c1d7e
{
Packit 1c1d7e
    return new QUtf8Decoder;
Packit 1c1d7e
}
Packit 1c1d7e
Packit 1c1d7e
Packit 1c1d7e
Packit 1c1d7e
Packit 1c1d7e
Packit 1c1d7e
Packit 1c1d7e
int QUtf16Codec::mibEnum() const
Packit 1c1d7e
{
Packit 1c1d7e
    return 1000;
Packit 1c1d7e
}
Packit 1c1d7e
Packit 1c1d7e
const char* QUtf16Codec::name() const
Packit 1c1d7e
{
Packit 1c1d7e
    return "ISO-10646-UCS-2";
Packit 1c1d7e
}
Packit 1c1d7e
Packit 1c1d7e
int QUtf16Codec::heuristicContentMatch(const char* chars, int len) const
Packit 1c1d7e
{
Packit 1c1d7e
    uchar* uchars = (uchar*)chars;
Packit 1c1d7e
    if ( len >= 2 && ((uchars[0] == 0xff && uchars[1] == 0xfe) ||
Packit 1c1d7e
		      (uchars[1] == 0xff && uchars[0] == 0xfe)) )
Packit 1c1d7e
	return len;
Packit 1c1d7e
    else
Packit 1c1d7e
	return 0;
Packit 1c1d7e
}
Packit 1c1d7e
Packit 1c1d7e
Packit 1c1d7e
Packit 1c1d7e
Packit 1c1d7e
class QUtf16Encoder : public QTextEncoder {
Packit 1c1d7e
    bool headerdone;
Packit 1c1d7e
public:
Packit 1c1d7e
    QUtf16Encoder() : headerdone(FALSE)
Packit 1c1d7e
    {
Packit 1c1d7e
    }
Packit 1c1d7e
Packit 1c1d7e
    QCString fromUnicode(const QString& uc, int& len_in_out)
Packit 1c1d7e
    {
Packit 1c1d7e
	if ( headerdone ) {
Packit 1c1d7e
	    len_in_out = uc.length()*(int)sizeof(QChar);
Packit 1c1d7e
	    QCString d(len_in_out);
Packit 1c1d7e
	    memcpy(d.rawData(),uc.unicode(),len_in_out);
Packit 1c1d7e
	    return d;
Packit 1c1d7e
	} else {
Packit 1c1d7e
	    headerdone = TRUE;
Packit 1c1d7e
	    len_in_out = (1+uc.length())*(int)sizeof(QChar);
Packit 1c1d7e
	    QCString d(len_in_out);
Packit 1c1d7e
	    memcpy(d.rawData(),&QChar::byteOrderMark,sizeof(QChar));
Packit 1c1d7e
	    memcpy(d.rawData()+sizeof(QChar),uc.unicode(),uc.length()*sizeof(QChar));
Packit 1c1d7e
	    return d;
Packit 1c1d7e
	}
Packit 1c1d7e
    }
Packit 1c1d7e
};
Packit 1c1d7e
Packit 1c1d7e
class QUtf16Decoder : public QTextDecoder {
Packit 1c1d7e
    uchar buf;
Packit 1c1d7e
    bool half;
Packit 1c1d7e
    bool swap;
Packit 1c1d7e
    bool headerdone;
Packit 1c1d7e
Packit 1c1d7e
public:
Packit 1c1d7e
    QUtf16Decoder() : half(FALSE), swap(FALSE), headerdone(FALSE)
Packit 1c1d7e
    {
Packit 1c1d7e
    }
Packit 1c1d7e
Packit 1c1d7e
    QString toUnicode(const char* chars, int len)
Packit 1c1d7e
    {
Packit 1c1d7e
	QString r;
Packit 1c1d7e
Packit 1c1d7e
	while ( len-- ) {
Packit 1c1d7e
	    if ( half ) {
Packit 1c1d7e
		QChar ch;
Packit 1c1d7e
		if ( swap ) {
Packit 1c1d7e
		    ch.row() = *chars++;
Packit 1c1d7e
		    ch.cell() = buf;
Packit 1c1d7e
		} else {
Packit 1c1d7e
		    ch.row() = buf;
Packit 1c1d7e
		    ch.cell() = *chars++;
Packit 1c1d7e
		}
Packit 1c1d7e
		if ( !headerdone ) {
Packit 1c1d7e
		    if ( ch == QChar::byteOrderSwapped ) {
Packit 1c1d7e
			swap = !swap;
Packit 1c1d7e
		    } else if ( ch == QChar::byteOrderMark ) {
Packit 1c1d7e
			// Ignore ZWNBSP
Packit 1c1d7e
		    } else {
Packit 1c1d7e
			r += ch;
Packit 1c1d7e
		    }
Packit 1c1d7e
		    headerdone = TRUE;
Packit 1c1d7e
		} else
Packit 1c1d7e
		    r += ch;
Packit 1c1d7e
		half = FALSE;
Packit 1c1d7e
	    } else {
Packit 1c1d7e
		buf = *chars++;
Packit 1c1d7e
		half = TRUE;
Packit 1c1d7e
	    }
Packit 1c1d7e
	}
Packit 1c1d7e
Packit 1c1d7e
	return r;
Packit 1c1d7e
    }
Packit 1c1d7e
};
Packit 1c1d7e
Packit 1c1d7e
QTextDecoder* QUtf16Codec::makeDecoder() const
Packit 1c1d7e
{
Packit 1c1d7e
    return new QUtf16Decoder;
Packit 1c1d7e
}
Packit 1c1d7e
Packit 1c1d7e
QTextEncoder* QUtf16Codec::makeEncoder() const
Packit 1c1d7e
{
Packit 1c1d7e
    return new QUtf16Encoder;
Packit 1c1d7e
}
Packit 1c1d7e
Packit 1c1d7e
#endif // QT_NO_TEXTCODEC