diff options
Diffstat (limited to 'util/unicode/codecs/big5/main.cpp')
-rw-r--r-- | util/unicode/codecs/big5/main.cpp | 158 |
1 files changed, 158 insertions, 0 deletions
diff --git a/util/unicode/codecs/big5/main.cpp b/util/unicode/codecs/big5/main.cpp new file mode 100644 index 0000000..edd70e5 --- /dev/null +++ b/util/unicode/codecs/big5/main.cpp @@ -0,0 +1,158 @@ +/**************************************************************************** +** +** Copyright (C) 2009 Nokia Corporation and/or its subsidiary(-ies). +** Contact: Qt Software Information (qt-info@nokia.com) +** +** This file is part of the utils of the Qt Toolkit. +** +** $QT_BEGIN_LICENSE:LGPL$ +** No Commercial Usage +** This file contains pre-release code and may not be distributed. +** You may use this file in accordance with the terms and conditions +** contained in the either Technology Preview License Agreement or the +** Beta Release License Agreement. +** +** GNU Lesser General Public License Usage +** Alternatively, this file may be used under the terms of the GNU Lesser +** General Public License version 2.1 as published by the Free Software +** Foundation and appearing in the file LICENSE.LGPL included in the +** packaging of this file. Please review the following information to +** ensure the GNU Lesser General Public License version 2.1 requirements +** will be met: http://www.gnu.org/licenses/old-licenses/lgpl-2.1.html. +** +** In addition, as a special exception, Nokia gives you certain +** additional rights. These rights are described in the Nokia Qt LGPL +** Exception version 1.0, included in the file LGPL_EXCEPTION.txt in this +** package. +** +** GNU General Public License Usage +** Alternatively, this file may be used under the terms of the GNU +** General Public License version 3.0 as published by the Free Software +** Foundation and appearing in the file LICENSE.GPL included in the +** packaging of this file. Please review the following information to +** ensure the GNU General Public License version 3.0 requirements will be +** met: http://www.gnu.org/copyleft/gpl.html. +** +** If you are unsure which license is appropriate for your use, please +** contact the sales department at qt-sales@nokia.com. +** $QT_END_LICENSE$ +** +****************************************************************************/ +#include <qtextcodec.h> +#include <qbytearray.h> +#include <qstring.h> +#include <qdebug.h> +#include <qfile.h> +#include <qcoreapplication.h> +#include <qset.h> + +struct Map { Map(uint u, uint b) : uc(u), b5(b) {} uint uc; uint b5; }; + +int main(int argc, char **argv) +{ + QCoreApplication app(argc, argv); + QTextCodec *big5 = QTextCodec::codecForName("Big5-hkscs"); + +#if 0 + QFile f("/home/lars/dev/qt-4.0/util/unicode/data/big5-eten.txt"); + f.open(QFile::ReadOnly); + + while (!f.atEnd()) { + QByteArray line = f.readLine(); + if (line.startsWith("#")) + continue; + line.replace("0x", ""); + line.replace("U+", ""); + line.replace("\t", " "); + line = line.simplified(); + QList<QByteArray> split = line.split(' '); + bool ok; + int b5 = split.at(0).toInt(&ok, 16); + Q_ASSERT(ok); + int uc = split.at(1).toInt(&ok, 16); + Q_ASSERT(ok); + if (b5 < 0x100) + continue; +#else + QFile f(":/BIG5"); + f.open(QFile::ReadOnly); + + while (!f.atEnd()) { + QByteArray line = f.readLine(); + if (line.startsWith("CHARMAP")) + break; + } + QSet<uint> b5_ok; + QSet<uint> uc_ok; + QList<Map> b5_to_uc_map; + QList<Map> uc_to_b5_map; + while (!f.atEnd()) { + QByteArray line = f.readLine(); + if (line.startsWith("%")) + continue; + if (line.startsWith("END CHARMAP")) + break; + line.replace("/x", ""); + line.replace("<U", ""); + line.replace(">", ""); + line.replace("\t", " "); + line = line.simplified(); + QList<QByteArray> split = line.split(' '); + bool ok; + int b5 = split.at(1).toInt(&ok, 16); + Q_ASSERT(ok); + int uc = split.at(0).toInt(&ok, 16); + Q_ASSERT(ok); + if (b5 < 0x100 || uc > 0xffff) + continue; +#endif + +// qDebug() << hex << "testing: '" << b5 << "' - '" << uc << "'"; + QByteArray ba; + + ba += (char)(uchar)(b5 >> 8); + ba += (char)(uchar)(b5 & 0xff); + + QString s = big5->toUnicode(ba); + Q_ASSERT(s.length() == 1); + QString s2; + s2 = QChar(uc); + ba = big5->fromUnicode(s2); + Q_ASSERT(ba.length() <= 2); + int round; + if (ba.length() == 1) + round = (int)(uchar)ba[0]; + else + round = ((int)(uchar)ba[0] << 8) + (int)(uchar)ba[1]; + if (b5 != round) + uc_to_b5_map += Map(uc, b5); + else + b5_ok.insert(b5); + + if (s[0].unicode() != uc) + b5_to_uc_map += Map(uc, b5); + else + uc_ok.insert(uc); + }; + + QList<QByteArray> list; + foreach(Map m, b5_to_uc_map) { + if (!uc_ok.contains(m.b5)) + list += QByteArray(" { 0x" + QByteArray::number(m.b5, 16) + ", 0x" + QByteArray::number(m.uc, 16) + " }\n");; + } + QByteArray ba; + qSort(list); + foreach(QByteArray a, list) + ba += a; + qDebug() << "struct B5Map b5_to_uc_map = {\n" << ba + "\n};"; + + list = QList<QByteArray>(); + foreach(Map m, uc_to_b5_map) + if (!b5_ok.contains(m.uc)) + list += QByteArray(" { 0x" + QByteArray::number(m.uc, 16) + ", 0x" + QByteArray::number(m.b5, 16) + " }\n");; + ba = QByteArray(); + qSort(list); + foreach(QByteArray a, list) + ba += a; + qDebug() << "struct B5Map uc_to_b5_map = {\n" << ba + "\n};"; +} |