summaryrefslogtreecommitdiffstats
path: root/src/corelib/codecs/qtsciicodec.cpp
diff options
context:
space:
mode:
author: Karsten Heimrich <karsten.heimrich@qt.io> 2020-06-17 12:33:40 +0200
committer: Karsten Heimrich <karsten.heimrich@qt.io> 2020-06-20 02:04:38 +0200
commit: 18ec53156ee704fdb4977436fccfdc85333e614b (patch)
tree: df734ce7893d570f4a90f923fcfe9c80ddc3de05 /src/corelib/codecs/qtsciicodec.cpp
parent: 4455de24d453138411c57bae55af18f3fba58d4b (diff)
Move QTextCodec support out of QtCore
* Assume UTF-8 on all Unix-like systems
* Export some functions to be able to compile QTextCodec once moved to Qt5Compat.

Task-number: QTBUG-75665
Change-Id: I52ec47a848bc0ba72e9c7689668b1bcc5d736c29
Reviewed-by: Lars Knoll <lars.knoll@qt.io>
Diffstat (limited to 'src/corelib/codecs/qtsciicodec.cpp')
-rw-r--r--src/corelib/codecs/qtsciicodec.cpp493
1 files changed, 0 insertions, 493 deletions
diff --git a/src/corelib/codecs/qtsciicodec.cpp b/src/corelib/codecs/qtsciicodec.cpp
deleted file mode 100644
index 936fc4206d..0000000000
--- a/src/corelib/codecs/qtsciicodec.cpp
+++ /dev/null
@@ -1,493 +0,0 @@
-/****************************************************************************
-**
-** Copyright (C) 2016 The Qt Company Ltd.
-** Contact: https://www.qt.io/licensing/
-**
-** This file is part of the QtCore module of the Qt Toolkit.
-**
-** $QT_BEGIN_LICENSE:LGPL$
-** Commercial License Usage
-** Licensees holding valid commercial Qt licenses may use this file in
-** accordance with the commercial license agreement provided with the
-** Software or, alternatively, in accordance with the terms contained in
-** a written agreement between you and The Qt Company. For licensing terms
-** and conditions see https://www.qt.io/terms-conditions. For further
-** information use the contact form at https://www.qt.io/contact-us.
-**
-** GNU Lesser General Public License Usage
-** Alternatively, this file may be used under the terms of the GNU Lesser
-** General Public License version 3 as published by the Free Software
-** Foundation and appearing in the file LICENSE.LGPL3 included in the
-** packaging of this file. Please review the following information to
-** ensure the GNU Lesser General Public License version 3 requirements
-** will be met: https://www.gnu.org/licenses/lgpl-3.0.html.
-**
-** GNU General Public License Usage
-** Alternatively, this file may be used under the terms of the GNU
-** General Public License version 2.0 or (at your option) the GNU General
-** Public license version 3 or any later version approved by the KDE Free
-** Qt Foundation. The licenses are as published by the Free Software
-** Foundation and appearing in the file LICENSE.GPL2 and LICENSE.GPL3
-** included in the packaging of this file. Please review the following
-** information to ensure the GNU General Public License requirements will
-** be met: https://www.gnu.org/licenses/gpl-2.0.html and
-** https://www.gnu.org/licenses/gpl-3.0.html.
-**
-** $QT_END_LICENSE$
-**
-****************************************************************************/
-
-// Most of the code here was originally written by Hans Petter Bieker,
-// and is included in Qt with the author's permission, and the grateful
-// thanks of the Qt team.
-
-#include "qtsciicodec_p.h"
-#include "qlist.h"
-
-QT_BEGIN_NAMESPACE
-
-static unsigned char qt_UnicodeToTSCII(ushort u1, ushort u2, ushort u3);
-static unsigned int qt_TSCIIToUnicode(unsigned int code, uint *s);
-
-#define IsTSCIIChar(c) (((c) >= 0x80) && ((c) <= 0xfd))
-
-/*! \class QTsciiCodec
- \inmodule QtCore
- \reentrant
- \internal
-*/
-
-/*!
-    Destroys the text codec object. Nothing is released explicitly here;
-    the destructor performs only the implicit member and base cleanup.
-*/
-QTsciiCodec::~QTsciiCodec() = default;
-
-/*!
-    Converts the first \a len characters in \a uc from Unicode to this
-    encoding, and returns the result in a byte array. The \a state contains
-    some conversion flags, and is used by the codec to maintain state
-    information.
-
-    Characters below U+0080 are copied through unchanged. For any other
-    character the longest matching sequence wins: a three-character
-    sequence is tried first, then a two-character sequence, then the single
-    character. Every match produces exactly one output byte. A character
-    that has no mapping is written as '?' (or as a 0 byte when \a state has
-    ConvertInvalidToNull set) and is added to \c state->invalidChars.
-
-    The look-ahead never reads beyond the \a len characters supplied by the
-    caller.
-*/
-QByteArray QTsciiCodec::convertFromUnicode(const QChar *uc, int len, ConverterState *state) const
-{
-    char replacement = '?';
-    if (state && (state->flags & ConvertInvalidToNull))
-        replacement = 0;
-    int invalid = 0;
-
-    // Each iteration consumes at least one input character and emits exactly
-    // one byte, so len bytes are always enough; the array is trimmed below.
-    QByteArray rstr(len, Qt::Uninitialized);
-    uchar *cursor = (uchar *)rstr.data();
-    for (int i = 0; i < len; i++) {
-        const ushort u1 = uc[i].unicode();
-
-        // Look ahead only at characters that are inside the input. In the
-        // lookup key a zero in the second or third slot means "no character",
-        // so a literal NUL in the input must end the sequence instead of
-        // being consumed as part of it.
-        const ushort u2 = (i + 1 < len) ? uc[i + 1].unicode() : 0;
-        const ushort u3 = (u2 && i + 2 < len) ? uc[i + 2].unicode() : 0;
-
-        uchar j;
-        if (u1 < 0x80) {
-            // ASCII
-            j = uchar(u1);
-        } else if (u3 && (j = qt_UnicodeToTSCII(u1, u2, u3))) {
-            // We have to check the combined chars first!
-            i += 2;
-        } else if (u2 && (j = qt_UnicodeToTSCII(u1, u2, 0))) {
-            i++;
-        } else if ((j = qt_UnicodeToTSCII(u1, 0, 0))) {
-            // Single character mapping; nothing extra to consume.
-        } else {
-            // Error
-            j = replacement;
-            ++invalid;
-        }
-        *cursor++ = j;
-    }
-    // Multi-character sequences collapse to one byte, so the result may be
-    // shorter than len.
-    rstr.resize(cursor - (const uchar *)rstr.constData());
-
-    if (state)
-        state->invalidChars += invalid;
-    return rstr;
-}
-
-/*!
-    Converts the first \a len characters in \a chars from this encoding
-    to Unicode, and returns the result in a QString. The \a state contains
-    some conversion flags, and is used by the codec to maintain state
-    information.
-
-    Bytes below 0x80 are passed through as ASCII. Bytes in the range
-    0x80..0xFD are expanded to the one to three Unicode characters listed
-    for them in the decoding table. A byte outside that range, or a byte
-    inside it whose table entry is empty, yields one replacement character
-    (QChar::Null when \a state has ConvertInvalidToNull set) and is added to
-    \c state->invalidChars.
-*/
-QString QTsciiCodec::convertToUnicode(const char* chars, int len, ConverterState *state) const
-{
-    QChar replacement = QChar::ReplacementCharacter;
-    if (state && (state->flags & ConvertInvalidToNull))
-        replacement = QChar::Null;
-    int invalid = 0;
-
-    QString result;
-    for (int i = 0; i < len; i++) {
-        const uchar ch = chars[i];
-        if (ch < 0x80) {
-            // ASCII
-            result += QLatin1Char(ch);
-        } else if (IsTSCIIChar(ch)) {
-            // TSCII
-            uint s[3];
-            const uint count = qt_TSCIIToUnicode(ch, s);
-            if (count == 0) {
-                // The table has no mapping for this byte. Report it instead
-                // of silently dropping it from the output.
-                result += replacement;
-                ++invalid;
-            }
-            for (uint k = 0; k < count; ++k) {
-                if (s[k]) {
-                    result += QChar(s[k]);
-                } else {
-                    // A hole inside a sequence is treated as invalid, too.
-                    result += replacement;
-                    ++invalid;
-                }
-            }
-        } else {
-            // Invalid
-            result += replacement;
-            ++invalid;
-        }
-    }
-
-    if (state)
-        state->invalidChars += invalid;
-    return result;
-}
-
-/*!
-    Returns the name under which this codec identifies its encoding,
-    which is "TSCII".
-
-    \sa QTextCodec::name()
-*/
-QByteArray QTsciiCodec::name() const
-{
-    return QByteArray("TSCII");
-}
-
-/*!
-    Returns the MIB enum value this codec reports for its encoding,
-    which is 2107.
-
-    \sa QTextCodec::mibEnum()
-*/
-int QTsciiCodec::mibEnum() const
-{
-    const int mib = 2107;
-    return mib;
-}
-
-// Unicode -> TSCII encoding table.
-//
-// Each row is { first, second, third, TSCII byte }: a sequence of up to three
-// Unicode code units followed by the single TSCII byte that encodes it. An
-// unused second or third slot holds 0x0000.
-//
-// The rows MUST stay sorted in ascending order of (first, second, third)
-// because qt_UnicodeToTSCII() locates a row with a binary search.
-static const ushort UnToTs [][4] = {
-    //FIRST  SECOND  THIRD   TSCII
-    {0x00A0, 0x0000, 0x0000, 0xA0},
-    {0x00A9, 0x0000, 0x0000, 0xA9},
-    {0x0B83, 0x0000, 0x0000, 0xB7},
-    {0x0B85, 0x0000, 0x0000, 0xAB},
-    {0x0B86, 0x0000, 0x0000, 0xAC},
-    {0x0B87, 0x0000, 0x0000, 0xAD},
-    {0x0B88, 0x0000, 0x0000, 0xAE},
-    {0x0B89, 0x0000, 0x0000, 0xAF},
-    {0x0B8A, 0x0000, 0x0000, 0xB0},
-    {0x0B8E, 0x0000, 0x0000, 0xB1},
-    {0x0B8F, 0x0000, 0x0000, 0xB2},
-    {0x0B90, 0x0000, 0x0000, 0xB3},
-    {0x0B92, 0x0000, 0x0000, 0xB4},
-    {0x0B93, 0x0000, 0x0000, 0xB5},
-    {0x0B94, 0x0000, 0x0000, 0xB6},
-    {0x0B95, 0x0000, 0x0000, 0xB8},
-    {0x0B95, 0x0B82, 0x0000, 0xEC},
-    {0x0B95, 0x0BC1, 0x0000, 0xCC},
-    {0x0B95, 0x0BC2, 0x0000, 0xDC},
-    {0x0B99, 0x0000, 0x0000, 0xB9},
-    {0x0B99, 0x0B82, 0x0000, 0xED},
-    {0x0B99, 0x0BC1, 0x0000, 0x99},
-    {0x0B99, 0x0BC2, 0x0000, 0x9B},
-    {0x0B9A, 0x0000, 0x0000, 0xBA},
-    {0x0B9A, 0x0B82, 0x0000, 0xEE},
-    {0x0B9A, 0x0BC1, 0x0000, 0xCD},
-    {0x0B9A, 0x0BC2, 0x0000, 0xDD},
-    {0x0B9C, 0x0000, 0x0000, 0x83},
-    {0x0B9C, 0x0B82, 0x0000, 0x88},
-    {0x0B9E, 0x0000, 0x0000, 0xBB},
-    {0x0B9E, 0x0B82, 0x0000, 0xEF},
-    {0x0B9E, 0x0BC1, 0x0000, 0x9A},
-    {0x0B9E, 0x0BC2, 0x0000, 0x9C},
-    {0x0B9F, 0x0000, 0x0000, 0xBC},
-    {0x0B9F, 0x0B82, 0x0000, 0xF0},
-    {0x0B9F, 0x0BBF, 0x0000, 0xCA},
-    {0x0B9F, 0x0BC0, 0x0000, 0xCB},
-    {0x0B9F, 0x0BC1, 0x0000, 0xCE},
-    {0x0B9F, 0x0BC2, 0x0000, 0xDE},
-    {0x0BA3, 0x0000, 0x0000, 0xBD},
-    {0x0BA3, 0x0B82, 0x0000, 0xF1},
-    {0x0BA3, 0x0BC1, 0x0000, 0xCF},
-    {0x0BA3, 0x0BC2, 0x0000, 0xDF},
-    {0x0BA4, 0x0000, 0x0000, 0xBE},
-    {0x0BA4, 0x0B82, 0x0000, 0xF2}, // was keyed on the unassigned U+0BA1
-    {0x0BA4, 0x0BC1, 0x0000, 0xD0},
-    {0x0BA4, 0x0BC2, 0x0000, 0xE0},
-    {0x0BA8, 0x0000, 0x0000, 0xBF},
-    {0x0BA8, 0x0B82, 0x0000, 0xF3},
-    {0x0BA8, 0x0BC1, 0x0000, 0xD1},
-    {0x0BA8, 0x0BC2, 0x0000, 0xE1},
-    {0x0BA9, 0x0000, 0x0000, 0xC9},
-    {0x0BA9, 0x0B82, 0x0000, 0xFD},
-    {0x0BA9, 0x0BC1, 0x0000, 0xDB},
-    {0x0BA9, 0x0BC2, 0x0000, 0xEB},
-    {0x0BAA, 0x0000, 0x0000, 0xC0},
-    {0x0BAA, 0x0B82, 0x0000, 0xF4},
-    {0x0BAA, 0x0BC1, 0x0000, 0xD2},
-    {0x0BAA, 0x0BC2, 0x0000, 0xE2},
-    {0x0BAE, 0x0000, 0x0000, 0xC1},
-    {0x0BAE, 0x0B82, 0x0000, 0xF5},
-    {0x0BAE, 0x0BC1, 0x0000, 0xD3},
-    {0x0BAE, 0x0BC2, 0x0000, 0xE3},
-    {0x0BAF, 0x0000, 0x0000, 0xC2},
-    {0x0BAF, 0x0B82, 0x0000, 0xF6},
-    {0x0BAF, 0x0BC1, 0x0000, 0xD4},
-    {0x0BAF, 0x0BC2, 0x0000, 0xE4},
-    {0x0BB0, 0x0000, 0x0000, 0xC3},
-    {0x0BB0, 0x0B82, 0x0000, 0xF7},
-    {0x0BB0, 0x0BC1, 0x0000, 0xD5},
-    {0x0BB0, 0x0BC2, 0x0000, 0xE5},
-    {0x0BB1, 0x0000, 0x0000, 0xC8},
-    {0x0BB1, 0x0B82, 0x0000, 0xFC},
-    {0x0BB1, 0x0BC1, 0x0000, 0xDA},
-    {0x0BB1, 0x0BC2, 0x0000, 0xEA},
-    {0x0BB2, 0x0000, 0x0000, 0xC4},
-    {0x0BB2, 0x0B82, 0x0000, 0xF8},
-    {0x0BB2, 0x0BC1, 0x0000, 0xD6},
-    {0x0BB2, 0x0BC2, 0x0000, 0xE6},
-    {0x0BB3, 0x0000, 0x0000, 0xC7},
-    {0x0BB3, 0x0B82, 0x0000, 0xFB},
-    {0x0BB3, 0x0BC1, 0x0000, 0xD9},
-    {0x0BB3, 0x0BC2, 0x0000, 0xE9},
-    {0x0BB4, 0x0000, 0x0000, 0xC6},
-    {0x0BB4, 0x0B82, 0x0000, 0xFA},
-    {0x0BB4, 0x0BC1, 0x0000, 0xD8},
-    {0x0BB4, 0x0BC2, 0x0000, 0xE8},
-    {0x0BB5, 0x0000, 0x0000, 0xC5},
-    {0x0BB5, 0x0B82, 0x0000, 0xF9},
-    {0x0BB5, 0x0BC1, 0x0000, 0xD7},
-    {0x0BB5, 0x0BC2, 0x0000, 0xE7},
-    {0x0BB7, 0x0000, 0x0000, 0x84},
-    {0x0BB7, 0x0B82, 0x0000, 0x89},
-    {0x0BB8, 0x0000, 0x0000, 0x85},
-    {0x0BB8, 0x0B82, 0x0000, 0x8A},
-    {0x0BB9, 0x0000, 0x0000, 0x86},
-    {0x0BB9, 0x0B82, 0x0000, 0x8B},
-    {0x0BBE, 0x0000, 0x0000, 0xA1},
-    {0x0BBF, 0x0000, 0x0000, 0xA2},
-    {0x0BC0, 0x0000, 0x0000, 0xA3},
-    {0x0BC1, 0x0000, 0x0000, 0xA4},
-    {0x0BC2, 0x0000, 0x0000, 0xA5},
-    {0x0BC6, 0x0000, 0x0000, 0xA6},
-    {0x0BC7, 0x0000, 0x0000, 0xA7},
-    {0x0BC8, 0x0000, 0x0000, 0xA8},
-    {0x0BCC, 0x0000, 0x0000, 0xAA},
-    {0x0BE6, 0x0000, 0x0000, 0x80},
-    {0x0BE7, 0x0000, 0x0000, 0x81},
-    {0x0BE7, 0x0BB7, 0x0000, 0x87},
-    {0x0BE7, 0x0BB7, 0x0B82, 0x8C},
-    {0x0BE8, 0x0000, 0x0000, 0x8D},
-    {0x0BE9, 0x0000, 0x0000, 0x8E},
-    {0x0BEA, 0x0000, 0x0000, 0x8F},
-    {0x0BEB, 0x0000, 0x0000, 0x90},
-    {0x0BEC, 0x0000, 0x0000, 0x95},
-    {0x0BED, 0x0000, 0x0000, 0x96},
-    {0x0BEE, 0x0000, 0x0000, 0x97},
-    {0x0BEF, 0x0000, 0x0000, 0x98},
-    {0x0BF0, 0x0000, 0x0000, 0x9D},
-    {0x0BF1, 0x0000, 0x0000, 0x9E},
-    {0x0BF2, 0x0000, 0x0000, 0x9F},
-    {0x2018, 0x0000, 0x0000, 0x91},
-    {0x2019, 0x0000, 0x0000, 0x92},
-    {0x201C, 0x0000, 0x0000, 0x93},
-    {0x201D, 0x0000, 0x0000, 0x94}  // was a second U+201C row
-};
-
-// Index of the last row of UnToTs (the inclusive upper bound of the binary
-// search). Derived from the table so it cannot drift when rows change.
-static const int UnToTsLast = int(sizeof(UnToTs) / sizeof(UnToTs[0])) - 1;
-
-// TSCII -> Unicode decoding table.
-//
-// Row N describes TSCII byte 0x80 + N and holds the sequence of up to three
-// Unicode code units that the byte expands to. Unused trailing slots hold
-// 0x0000; a row of three zeros marks a byte without a known mapping.
-static const ushort TsToUn [][3] = {
-    // 0x80
-    {0x0BE6, 0x0000, 0x0000},
-    {0x0BE7, 0x0000, 0x0000},
-    {0x0000, 0x0000, 0x0000}, // unknown
-    {0x0B9C, 0x0000, 0x0000},
-    {0x0BB7, 0x0000, 0x0000},
-    {0x0BB8, 0x0000, 0x0000},
-    {0x0BB9, 0x0000, 0x0000},
-    {0x0BE7, 0x0BB7, 0x0000},
-    {0x0B9C, 0x0B82, 0x0000},
-    {0x0BB7, 0x0B82, 0x0000},
-    {0x0BB8, 0x0B82, 0x0000},
-    {0x0BB9, 0x0B82, 0x0000},
-    {0x0BE7, 0x0BB7, 0x0B82},
-    {0x0BE8, 0x0000, 0x0000},
-    {0x0BE9, 0x0000, 0x0000},
-    {0x0BEA, 0x0000, 0x0000},
-    // 0x90
-    {0x0BEB, 0x0000, 0x0000},
-    {0x2018, 0x0000, 0x0000},
-    {0x2019, 0x0000, 0x0000},
-    {0x201C, 0x0000, 0x0000},
-    {0x201D, 0x0000, 0x0000}, // 0x94; was a duplicate of the U+201C row
-    {0x0BEC, 0x0000, 0x0000},
-    {0x0BED, 0x0000, 0x0000},
-    {0x0BEE, 0x0000, 0x0000},
-    {0x0BEF, 0x0000, 0x0000},
-    {0x0B99, 0x0BC1, 0x0000},
-    {0x0B9E, 0x0BC1, 0x0000},
-    {0x0B99, 0x0BC2, 0x0000},
-    {0x0B9E, 0x0BC2, 0x0000},
-    {0x0BF0, 0x0000, 0x0000},
-    {0x0BF1, 0x0000, 0x0000},
-    {0x0BF2, 0x0000, 0x0000},
-    // 0xA0
-    {0x00A0, 0x0000, 0x0000},
-    {0x0BBE, 0x0000, 0x0000},
-    {0x0BBF, 0x0000, 0x0000},
-    {0x0BC0, 0x0000, 0x0000},
-    {0x0BC1, 0x0000, 0x0000},
-    {0x0BC2, 0x0000, 0x0000},
-    {0x0BC6, 0x0000, 0x0000},
-    {0x0BC7, 0x0000, 0x0000},
-    {0x0BC8, 0x0000, 0x0000},
-    {0x00A9, 0x0000, 0x0000},
-    {0x0BCC, 0x0000, 0x0000},
-    {0x0B85, 0x0000, 0x0000},
-    {0x0B86, 0x0000, 0x0000},
-    {0x0B87, 0x0000, 0x0000},
-    {0x0B88, 0x0000, 0x0000},
-    {0x0B89, 0x0000, 0x0000},
-    // 0xB0
-    {0x0B8A, 0x0000, 0x0000},
-    {0x0B8E, 0x0000, 0x0000},
-    {0x0B8F, 0x0000, 0x0000},
-    {0x0B90, 0x0000, 0x0000},
-    {0x0B92, 0x0000, 0x0000},
-    {0x0B93, 0x0000, 0x0000},
-    {0x0B94, 0x0000, 0x0000},
-    {0x0B83, 0x0000, 0x0000},
-    {0x0B95, 0x0000, 0x0000},
-    {0x0B99, 0x0000, 0x0000},
-    {0x0B9A, 0x0000, 0x0000},
-    {0x0B9E, 0x0000, 0x0000},
-    {0x0B9F, 0x0000, 0x0000},
-    {0x0BA3, 0x0000, 0x0000},
-    {0x0BA4, 0x0000, 0x0000},
-    {0x0BA8, 0x0000, 0x0000},
-    // 0xC0
-    {0x0BAA, 0x0000, 0x0000},
-    {0x0BAE, 0x0000, 0x0000},
-    {0x0BAF, 0x0000, 0x0000},
-    {0x0BB0, 0x0000, 0x0000},
-    {0x0BB2, 0x0000, 0x0000},
-    {0x0BB5, 0x0000, 0x0000},
-    {0x0BB4, 0x0000, 0x0000},
-    {0x0BB3, 0x0000, 0x0000},
-    {0x0BB1, 0x0000, 0x0000},
-    {0x0BA9, 0x0000, 0x0000},
-    {0x0B9F, 0x0BBF, 0x0000},
-    {0x0B9F, 0x0BC0, 0x0000},
-    {0x0B95, 0x0BC1, 0x0000},
-    {0x0B9A, 0x0BC1, 0x0000},
-    {0x0B9F, 0x0BC1, 0x0000},
-    {0x0BA3, 0x0BC1, 0x0000},
-    // 0xD0
-    {0x0BA4, 0x0BC1, 0x0000},
-    {0x0BA8, 0x0BC1, 0x0000},
-    {0x0BAA, 0x0BC1, 0x0000},
-    {0x0BAE, 0x0BC1, 0x0000},
-    {0x0BAF, 0x0BC1, 0x0000},
-    {0x0BB0, 0x0BC1, 0x0000},
-    {0x0BB2, 0x0BC1, 0x0000},
-    {0x0BB5, 0x0BC1, 0x0000},
-    {0x0BB4, 0x0BC1, 0x0000},
-    {0x0BB3, 0x0BC1, 0x0000},
-    {0x0BB1, 0x0BC1, 0x0000},
-    {0x0BA9, 0x0BC1, 0x0000},
-    {0x0B95, 0x0BC2, 0x0000},
-    {0x0B9A, 0x0BC2, 0x0000},
-    {0x0B9F, 0x0BC2, 0x0000},
-    {0x0BA3, 0x0BC2, 0x0000},
-    // 0xE0
-    {0x0BA4, 0x0BC2, 0x0000},
-    {0x0BA8, 0x0BC2, 0x0000},
-    {0x0BAA, 0x0BC2, 0x0000},
-    {0x0BAE, 0x0BC2, 0x0000},
-    {0x0BAF, 0x0BC2, 0x0000},
-    {0x0BB0, 0x0BC2, 0x0000},
-    {0x0BB2, 0x0BC2, 0x0000},
-    {0x0BB5, 0x0BC2, 0x0000},
-    {0x0BB4, 0x0BC2, 0x0000},
-    {0x0BB3, 0x0BC2, 0x0000},
-    {0x0BB1, 0x0BC2, 0x0000},
-    {0x0BA9, 0x0BC2, 0x0000},
-    {0x0B95, 0x0B82, 0x0000},
-    {0x0B99, 0x0B82, 0x0000},
-    {0x0B9A, 0x0B82, 0x0000},
-    {0x0B9E, 0x0B82, 0x0000},
-    // 0xF0
-    {0x0B9F, 0x0B82, 0x0000},
-    {0x0BA3, 0x0B82, 0x0000},
-    {0x0BA4, 0x0B82, 0x0000}, // 0xF2; was the unassigned U+0BA1
-    {0x0BA8, 0x0B82, 0x0000},
-    {0x0BAA, 0x0B82, 0x0000},
-    {0x0BAE, 0x0B82, 0x0000},
-    {0x0BAF, 0x0B82, 0x0000},
-    {0x0BB0, 0x0B82, 0x0000},
-    {0x0BB2, 0x0B82, 0x0000},
-    {0x0BB5, 0x0B82, 0x0000},
-    {0x0BB4, 0x0B82, 0x0000},
-    {0x0BB3, 0x0B82, 0x0000},
-    {0x0BB1, 0x0B82, 0x0000},
-    {0x0BA9, 0x0B82, 0x0000}  // 0xFD, the last mapped byte
-};
-
-// Compares the first len elements of s1 and s2 in order.
-// Returns 0 when all of them are equal; otherwise returns the difference
-// (s1 element minus s2 element) at the first position where they differ, so
-// the sign tells which sequence orders first.
-static int cmp(const ushort *s1, const ushort *s2, size_t len)
-{
-    for (size_t pos = 0; pos < len; ++pos) {
-        const int delta = s1[pos] - s2[pos];
-        if (delta != 0)
-            return delta;
-    }
-    return 0;
-}
-
-// Looks up the TSCII byte for the Unicode sequence (u1, u2, u3), where an
-// unused trailing position is passed as 0.
-// Returns the byte stored in the matching UnToTs row, or 0 when the table
-// contains no row for exactly this sequence.
-static unsigned char qt_UnicodeToTSCII(ushort u1, ushort u2, ushort u3)
-{
-    const ushort key[3] = { u1, u2, u3 };
-
-    // Binary search over the inclusive row range [low, high]; this relies on
-    // UnToTs being sorted by its first three columns.
-    int low = 0;
-    int high = UnToTsLast;
-    while (low <= high) {
-        const int mid = (low + high) / 2;
-        const int order = cmp(UnToTs[mid], key, 3);
-
-        if (order < 0) {
-            // The row sorts before the key: continue in the upper half.
-            low = mid + 1;
-        } else if (order > 0) {
-            // The row sorts after the key: continue in the lower half.
-            high = mid - 1;
-        } else {
-            // Exact match; the fourth column is the TSCII byte.
-            return UnToTs[mid][3];
-        }
-    }
-
-    return 0;
-}
-
-// Copies the three TsToUn slots for TSCII byte `code` into s[0..2] and
-// returns the length of the sequence, i.e. one more than the index of the
-// last non-zero slot (0 when all three slots are zero).
-// The row index is (code & 0x7f), so `code` is expected to be a byte for
-// which the table has a row; no range check is performed here.
-static unsigned int qt_TSCIIToUnicode(uint code, uint *s)
-{
-    const ushort *row = TsToUn[code & 0x7f];
-    s[0] = row[0];
-    s[1] = row[1];
-    s[2] = row[2];
-
-    // Find the last slot that is in use, scanning from the back.
-    if (s[2])
-        return 3;
-    if (s[1])
-        return 2;
-    return s[0] ? 1 : 0;
-}
-
-QT_END_NAMESPACE