Advance Wayland and KDE package bring-up

Ultraworked with [Sisyphus](https://github.com/code-yeongyu/oh-my-openagent) Co-authored-by: Sisyphus <clio-agent@sisyphuslabs.ai>
2026-04-14 10:51:06 +01:00
parent 51f3c21121
commit cf12defd28
15214 changed files with 20594243 additions and 269 deletions
@@ -0,0 +1,751 @@
+/*  -*- c++ -*-
+    SPDX-FileCopyrightText: 2002 Marc Mutz <mutz@kde.org>
+
+    SPDX-License-Identifier: LGPL-2.0-or-later
+*/
+/**
+  @file
+  This file is part of the API for handling @ref MIME data and
+  defines the @ref QuotedPrintable, @ref  RFC2047Q, and
+  @ref RFC2231 @ref Codec classes.
+
+  @brief
+  Defines the classes QuotedPrintableCodec, Rfc2047QEncodingCodec, and
+  Rfc2231EncodingCodec.
+
+  @authors Marc Mutz \<mutz@kde.org\>
+*/
+
+#include "kcodecsqp.h"
+#include "kcodecs_p.h"
+
+#include <QDebug>
+
+#include <cassert>
+
+using namespace KCodecs;
+
+namespace KCodecs
+{
+// none except a-zA-Z0-9!*+-/
+const uchar eTextMap[16] = {0x00, 0x00, 0x00, 0x00, 0x40, 0x35, 0xFF, 0xC0, 0x7F, 0xFF, 0xFF, 0xE0, 0x7F, 0xFF, 0xFF, 0xE0};
+
+// some helpful functions:
+
+/**
+  Converts a 4-bit @p value into its hexadecimal characater representation.
+  So input of value [0,15] returns ['0','1',... 'F'].  Input values
+  greater than 15 will produce undesired results.
+  @param value is an unsigned character containing the 4-bit input value.
+*/
+static inline char binToHex(uchar value)
+{
+    if (value > 9) {
+        return value + 'A' - 10;
+    } else {
+        return value + '0';
+    }
+}
+
+/**
+  Returns the high-order 4 bits of an 8-bit value in another 8-bit value.
+  @param ch is an unsigned character containing the 8-bit input value.
+*/
+static inline uchar highNibble(uchar ch)
+{
+    return ch >> 4;
+}
+
+/**
+  Returns the low-order 4 bits of an 8-bit value in another 8-bit value.
+  @param ch is an unsigned character containing the 8-bit input value.
+*/
+static inline uchar lowNibble(uchar ch)
+{
+    return ch & 0xF;
+}
+
+/**
+  Returns true if the specified value is a not Control character or
+  question mark; else true.
+  @param ch is an unsigned character containing the 8-bit input value.
+*/
+static inline bool keep(uchar ch)
+{
+    // no CTLs, except HT and not '?'
+    return !((ch < ' ' && ch != '\t') || ch == '?');
+}
+
+//
+// QuotedPrintableCodec
+//
+
+class QuotedPrintableEncoder : public Encoder
+{
+    char mInputBuffer[16];
+    uchar mCurrentLineLength; // 0..76
+    uchar mAccu;
+    uint mInputBufferReadCursor : 4; // 0..15
+    uint mInputBufferWriteCursor : 4; // 0..15
+    enum {
+        Never,
+        AtBOL,
+        Definitely,
+    } mAccuNeedsEncoding : 2;
+    bool mSawLineEnd : 1;
+    bool mSawCR : 1;
+    bool mFinishing : 1;
+    bool mFinished : 1;
+
+protected:
+    friend class QuotedPrintableCodec;
+    QuotedPrintableEncoder(Codec::NewlineType newline = Codec::NewlineLF)
+        : Encoder(newline)
+        , mCurrentLineLength(0)
+        , mAccu(0)
+        , mInputBufferReadCursor(0)
+        , mInputBufferWriteCursor(0)
+        , mAccuNeedsEncoding(Never)
+        , mSawLineEnd(false)
+        , mSawCR(false)
+        , mFinishing(false)
+        , mFinished(false)
+    {
+    }
+
+    bool needsEncoding(uchar ch)
+    {
+        return ch > '~' || (ch < ' ' && ch != '\t') || ch == '=';
+    }
+    bool needsEncodingAtEOL(uchar ch)
+    {
+        return ch == ' ' || ch == '\t';
+    }
+    bool needsEncodingAtBOL(uchar ch)
+    {
+        return ch == 'F' || ch == '.' || ch == '-';
+    }
+    bool fillInputBuffer(const char *&scursor, const char *const send);
+    bool processNextChar();
+    void createOutputBuffer(char *&dcursor, const char *const dend);
+
+public:
+    ~QuotedPrintableEncoder() override
+    {
+    }
+
+    bool encode(const char *&scursor, const char *const send, char *&dcursor, const char *const dend) override;
+
+    bool finish(char *&dcursor, const char *const dend) override;
+};
+
+class QuotedPrintableDecoder : public Decoder
+{
+    const char mEscapeChar;
+    char mBadChar;
+    /** @p accu holds the msb nibble of the hexchar or zero. */
+    uchar mAccu;
+    /** @p insideHexChar is true iff we're inside an hexchar (=XY).
+        Together with @ref mAccu, we can build this states:
+        @li @p insideHexChar == @p false:
+        normal text
+        @li @p insideHexChar == @p true, @p mAccu == 0:
+        saw the leading '='
+        @li @p insideHexChar == @p true, @p mAccu != 0:
+        saw the first nibble '=X'
+    */
+    const bool mQEncoding;
+    bool mInsideHexChar;
+    bool mFlushing;
+    bool mExpectLF;
+    bool mHaveAccu;
+    /** @p mLastChar holds the first char of an encoded char, so that
+        we are able to keep the first char if the second char is invalid. */
+    char mLastChar;
+
+protected:
+    friend class QuotedPrintableCodec;
+    friend class Rfc2047QEncodingCodec;
+    friend class Rfc2231EncodingCodec;
+    QuotedPrintableDecoder(Codec::NewlineType newline = Codec::NewlineLF, bool aQEncoding = false, char aEscapeChar = '=')
+        : Decoder(newline)
+        , mEscapeChar(aEscapeChar)
+        , mBadChar(0)
+        , mAccu(0)
+        , mQEncoding(aQEncoding)
+        , mInsideHexChar(false)
+        , mFlushing(false)
+        , mExpectLF(false)
+        , mHaveAccu(false)
+        , mLastChar(0)
+    {
+    }
+
+public:
+    ~QuotedPrintableDecoder() override
+    {
+    }
+
+    bool decode(const char *&scursor, const char *const send, char *&dcursor, const char *const dend) override;
+    bool finish(char *&dcursor, const char *const dend) override;
+};
+
+class Rfc2047QEncodingEncoder : public Encoder
+{
+    uchar mAccu;
+    uchar mStepNo;
+    const char mEscapeChar;
+    bool mInsideFinishing : 1;
+
+protected:
+    friend class Rfc2047QEncodingCodec;
+    friend class Rfc2231EncodingCodec;
+    Rfc2047QEncodingEncoder(Codec::NewlineType newline = Codec::NewlineLF, char aEscapeChar = '=')
+        : Encoder(newline)
+        , mAccu(0)
+        , mStepNo(0)
+        , mEscapeChar(aEscapeChar)
+        , mInsideFinishing(false)
+    {
+        // else an optimization in ::encode might break.
+        assert(aEscapeChar == '=' || aEscapeChar == '%');
+    }
+
+    bool isEText(uchar ch)
+    {
+        return (ch < 128) && (eTextMap[ch / 8] & 0x80 >> ch % 8);
+    }
+
+    // this code assumes that isEText( mEscapeChar ) == false!
+    bool needsEncoding(uchar ch)
+    {
+        if (ch > 'z') {
+            return true; // {|}~ DEL and 8bit chars need
+        }
+        if (!isEText(ch)) {
+            return true; // all but a-zA-Z0-9!/*+- need, too
+        }
+        if (mEscapeChar == '%' && (ch == '*' || ch == '/')) {
+            return true; // not allowed in rfc2231 encoding
+        }
+        return false;
+    }
+
+public:
+    ~Rfc2047QEncodingEncoder() override
+    {
+    }
+
+    bool encode(const char *&scursor, const char *const send, char *&dcursor, const char *const dend) override;
+    bool finish(char *&dcursor, const char *const dend) override;
+};
+
+// this doesn't access any member variables, so it can be defined static
+// but then we can't call it from virtual functions
+static qsizetype QuotedPrintableDecoder_maxDecodedSizeFor(qsizetype insize, Codec::NewlineType newline)
+{
+    // all chars unencoded:
+    qsizetype result = insize;
+    // but maybe all of them are \n and we need to make them \r\n :-o
+    if (newline == Codec::NewlineCRLF) {
+        result += insize;
+    }
+
+    // there might be an accu plus escape
+    result += 2;
+
+    return result;
+}
+
+Encoder *QuotedPrintableCodec::makeEncoder(Codec::NewlineType newline) const
+{
+    return new QuotedPrintableEncoder(newline);
+}
+
+Decoder *QuotedPrintableCodec::makeDecoder(Codec::NewlineType newline) const
+{
+    return new QuotedPrintableDecoder(newline);
+}
+
+qsizetype QuotedPrintableCodec::maxDecodedSizeFor(qsizetype insize, Codec::NewlineType newline) const
+{
+    return QuotedPrintableDecoder_maxDecodedSizeFor(insize, newline);
+}
+
+Encoder *Rfc2047QEncodingCodec::makeEncoder(Codec::NewlineType newline) const
+{
+    return new Rfc2047QEncodingEncoder(newline);
+}
+
+Decoder *Rfc2047QEncodingCodec::makeDecoder(Codec::NewlineType newline) const
+{
+    return new QuotedPrintableDecoder(newline, true);
+}
+
+qsizetype Rfc2047QEncodingCodec::maxDecodedSizeFor(qsizetype insize, Codec::NewlineType newline) const
+{
+    return QuotedPrintableDecoder_maxDecodedSizeFor(insize, newline);
+}
+
+Encoder *Rfc2231EncodingCodec::makeEncoder(Codec::NewlineType newline) const
+{
+    return new Rfc2047QEncodingEncoder(newline, '%');
+}
+
+Decoder *Rfc2231EncodingCodec::makeDecoder(Codec::NewlineType newline) const
+{
+    return new QuotedPrintableDecoder(newline, true, '%');
+}
+
+qsizetype Rfc2231EncodingCodec::maxDecodedSizeFor(qsizetype insize, Codec::NewlineType newline) const
+{
+    return QuotedPrintableDecoder_maxDecodedSizeFor(insize, newline);
+}
+
+/********************************************************/
+/********************************************************/
+/********************************************************/
+
+bool QuotedPrintableDecoder::decode(const char *&scursor, const char *const send, char *&dcursor, const char *const dend)
+{
+    if (d->newline == Codec::NewlineCRLF) {
+        qWarning() << "CRLF output for decoders isn't yet supported!";
+    }
+
+    while (scursor != send && dcursor != dend) {
+        if (mFlushing) {
+            // we have to flush chars in the aftermath of a decoding
+            // error. The way to request a flush is to
+            // - store the offending character in mBadChar and
+            // - set mFlushing to true.
+            // The supported cases are (H: hexchar, X: bad char):
+            // =X, =HX, CR
+            // mBadChar is only written out if it is not by itself illegal in
+            // quoted-printable (e.g. CTLs, 8Bits).
+            // A fast way to suppress mBadChar output is to set it to NUL.
+            if (mInsideHexChar) {
+                // output '='
+                *dcursor++ = mEscapeChar;
+                mInsideHexChar = false;
+            } else if (mHaveAccu) {
+                // output the high nibble of the accumulator:
+                *dcursor++ = mLastChar;
+                mHaveAccu = false;
+                mAccu = 0;
+            } else {
+                // output mBadChar
+                assert(mAccu == 0);
+                if (mBadChar) {
+                    if (mBadChar == '=') {
+                        mInsideHexChar = true;
+                    } else {
+                        *dcursor++ = mBadChar;
+                    }
+                    mBadChar = 0;
+                }
+                mFlushing = false;
+            }
+            continue;
+        }
+        assert(mBadChar == 0);
+
+        uchar ch = *scursor++;
+
+        if (mExpectLF && ch != '\n') {
+            // qWarning() << "QuotedPrintableDecoder:"
+            //              "illegally formed soft linebreak or lonely CR!";
+            mInsideHexChar = false;
+            mExpectLF = false;
+            if (mAccu != 0) {
+                return false;
+            }
+        }
+
+        if (mInsideHexChar) {
+            uchar value = 255;
+            // next char(s) represent nibble instead of itself:
+            if (ch <= '9') {
+                if (ch >= '0') {
+                    value = ch - '0';
+                } else {
+                    switch (ch) {
+                    case '\r':
+                        mExpectLF = true;
+                        break;
+                    case '\n':
+                        // soft line break, but only if mAccu is NUL.
+                        if (!mHaveAccu) {
+                            mExpectLF = false;
+                            mInsideHexChar = false;
+                            break;
+                        }
+                    // else fall through
+                    default:
+                        // qWarning() << "QuotedPrintableDecoder:"
+                        //              "illegally formed hex char! Outputting verbatim.";
+                        mBadChar = ch;
+                        mFlushing = true;
+                    }
+                    continue;
+                }
+            } else { // ch > '9'
+                if (ch <= 'F') {
+                    if (ch >= 'A') {
+                        value = 10 + ch - 'A';
+                    } else { // [:-@]
+                        mBadChar = ch;
+                        mFlushing = true;
+                        continue;
+                    }
+                } else { // ch > 'F'
+                    if (ch <= 'f' && ch >= 'a') {
+                        value = 10 + ch - 'a';
+                    } else {
+                        mBadChar = ch;
+                        mFlushing = true;
+                        continue;
+                    }
+                }
+            }
+
+            assert(value < 16);
+            assert(mBadChar == 0);
+            assert(!mExpectLF);
+
+            if (mHaveAccu) {
+                *dcursor++ = char(mAccu | value);
+                mAccu = 0;
+                mHaveAccu = false;
+                mInsideHexChar = false;
+            } else {
+                mHaveAccu = true;
+                mAccu = value << 4;
+                mLastChar = ch;
+            }
+        } else { // not mInsideHexChar
+            if ((ch <= '~' && ch >= ' ') || ch == '\t') {
+                if (ch == mEscapeChar) {
+                    mInsideHexChar = true;
+                } else if (mQEncoding && ch == '_') {
+                    *dcursor++ = char(0x20);
+                } else {
+                    *dcursor++ = char(ch);
+                }
+            } else if (ch == '\n') {
+                *dcursor++ = '\n';
+                mExpectLF = false;
+            } else if (ch == '\r') {
+                mExpectLF = true;
+            } else {
+                // qWarning() << "QuotedPrintableDecoder:" << ch <<
+                //  "illegal character in input stream!";
+                *dcursor++ = char(ch);
+            }
+        }
+    }
+
+    return scursor == send;
+}
+
+bool QuotedPrintableDecoder::finish(char *&dcursor, const char *const dend)
+{
+    while ((mInsideHexChar || mHaveAccu || mFlushing) && dcursor != dend) {
+        // we have to flush chars
+        if (mInsideHexChar) {
+            // output '='
+            *dcursor++ = mEscapeChar;
+            mInsideHexChar = false;
+        } else if (mHaveAccu) {
+            // output the high nibble of the accumulator:
+            *dcursor++ = mLastChar;
+            mHaveAccu = false;
+            mAccu = 0;
+        } else {
+            // output mBadChar
+            assert(mAccu == 0);
+            if (mBadChar) {
+                *dcursor++ = mBadChar;
+                mBadChar = 0;
+            }
+            mFlushing = false;
+        }
+    }
+
+    // return false if we are not finished yet; note that mInsideHexChar is always false
+    return !(mHaveAccu || mFlushing);
+}
+
+bool QuotedPrintableEncoder::fillInputBuffer(const char *&scursor, const char *const send)
+{
+    // Don't read more if there's still a tail of a line in the buffer:
+    if (mSawLineEnd) {
+        return true;
+    }
+
+    // Read until the buffer is full or we have found CRLF or LF (which
+    // don't end up in the input buffer):
+    for (; (mInputBufferWriteCursor + 1) % 16 != mInputBufferReadCursor && scursor != send; mInputBufferWriteCursor++) {
+        char ch = *scursor++;
+        if (ch == '\r') {
+            mSawCR = true;
+        } else if (ch == '\n') {
+            // remove the CR from the input buffer (if any) and return that
+            // we found a line ending:
+            if (mSawCR) {
+                mSawCR = false;
+                assert(mInputBufferWriteCursor != mInputBufferReadCursor);
+                mInputBufferWriteCursor--;
+            }
+            mSawLineEnd = true;
+            return true; // saw CRLF or LF
+        } else {
+            mSawCR = false;
+        }
+        mInputBuffer[mInputBufferWriteCursor] = ch;
+    }
+    mSawLineEnd = false;
+    return false; // didn't see a line ending...
+}
+
+bool QuotedPrintableEncoder::processNextChar()
+{
+    // If we process a buffer which doesn't end in a line break, we
+    // can't process all of it, since the next chars that will be read
+    // could be a line break. So we empty the buffer only until a fixed
+    // number of chars is left (except when mFinishing, which means that
+    // the data doesn't end in newline):
+    const int minBufferFillWithoutLineEnd = 4;
+
+    assert(d->outputBufferCursor == 0);
+
+    int bufferFill = int(mInputBufferWriteCursor) - int(mInputBufferReadCursor);
+    if (bufferFill < 0) {
+        bufferFill += 16;
+    }
+
+    assert(bufferFill >= 0 && bufferFill <= 15);
+
+    if (!mFinishing //
+        && !mSawLineEnd //
+        && bufferFill < minBufferFillWithoutLineEnd) {
+        return false;
+    }
+
+    // buffer is empty, return false:
+    if (mInputBufferReadCursor == mInputBufferWriteCursor) {
+        return false;
+    }
+
+    // Real processing goes here:
+    mAccu = mInputBuffer[mInputBufferReadCursor++];
+    if (needsEncoding(mAccu)) { // always needs encoding or
+        mAccuNeedsEncoding = Definitely;
+    } else if ((mSawLineEnd || mFinishing) // needs encoding at end of line
+               && bufferFill == 1 // or end of buffer
+               && needsEncodingAtEOL(mAccu)) {
+        mAccuNeedsEncoding = Definitely;
+    } else if (needsEncodingAtBOL(mAccu)) {
+        mAccuNeedsEncoding = AtBOL;
+    } else {
+        // never needs encoding
+        mAccuNeedsEncoding = Never;
+    }
+
+    return true;
+}
+
+// Outputs processed (verbatim or hex-encoded) chars and inserts soft
+// line breaks as necessary. Depends on processNextChar's directions
+// on whether to encode the current char, and whether
+// the current char is the last one in it's input line:
+void QuotedPrintableEncoder::createOutputBuffer(char *&dcursor, const char *const dend)
+{
+    const int maxLineLength = 76; // rfc 2045
+
+    assert(d->outputBufferCursor == 0);
+
+    /* clang-format off */
+    bool lastOneOnThisLine = mSawLineEnd
+                             && mInputBufferReadCursor == mInputBufferWriteCursor;
+    /* clang-format on */
+
+    int neededSpace = 1;
+    if (mAccuNeedsEncoding == Definitely) {
+        neededSpace = 3;
+    }
+
+    // reserve space for the soft hyphen (=)
+    if (!lastOneOnThisLine) {
+        neededSpace++;
+    }
+
+    if (mCurrentLineLength > maxLineLength - neededSpace) {
+        // current line too short, insert soft line break:
+        write('=', dcursor, dend);
+        writeCRLF(dcursor, dend);
+        mCurrentLineLength = 0;
+    }
+
+    if (Never == mAccuNeedsEncoding //
+        || (AtBOL == mAccuNeedsEncoding && mCurrentLineLength != 0)) {
+        write(mAccu, dcursor, dend);
+        mCurrentLineLength++;
+    } else {
+        write('=', dcursor, dend);
+        write(binToHex(highNibble(mAccu)), dcursor, dend);
+        write(binToHex(lowNibble(mAccu)), dcursor, dend);
+        mCurrentLineLength += 3;
+    }
+}
+
+bool QuotedPrintableEncoder::encode(const char *&scursor, const char *const send, char *&dcursor, const char *const dend)
+{
+    // support probing by the caller:
+    if (mFinishing) {
+        return true;
+    }
+
+    while (scursor != send && dcursor != dend) {
+        if (d->outputBufferCursor && !flushOutputBuffer(dcursor, dend)) {
+            return scursor == send;
+        }
+
+        assert(d->outputBufferCursor == 0);
+
+        // fill input buffer until eol has been reached or until the
+        // buffer is full, whatever comes first:
+        fillInputBuffer(scursor, send);
+
+        if (processNextChar()) {
+            // there was one...
+            createOutputBuffer(dcursor, dend);
+        } else if (mSawLineEnd && mInputBufferWriteCursor == mInputBufferReadCursor) {
+            // load a hard line break into output buffer:
+            writeCRLF(dcursor, dend);
+            // signal fillInputBuffer() we are ready for the next line:
+            mSawLineEnd = false;
+            mCurrentLineLength = 0;
+        } else {
+            // we are supposedly finished with this input block:
+            break;
+        }
+    }
+
+    // make sure we write as much as possible and don't stop _writing_
+    // just because we have no more _input_:
+    if (d->outputBufferCursor) {
+        flushOutputBuffer(dcursor, dend);
+    }
+
+    return scursor == send;
+
+} // encode
+
+bool QuotedPrintableEncoder::finish(char *&dcursor, const char *const dend)
+{
+    mFinishing = true;
+
+    if (mFinished) {
+        return flushOutputBuffer(dcursor, dend);
+    }
+
+    while (dcursor != dend) {
+        if (d->outputBufferCursor && !flushOutputBuffer(dcursor, dend)) {
+            return false;
+        }
+
+        assert(d->outputBufferCursor == 0);
+
+        if (processNextChar()) {
+            // there was one...
+            createOutputBuffer(dcursor, dend);
+        } else if (mSawLineEnd && mInputBufferWriteCursor == mInputBufferReadCursor) {
+            // load a hard line break into output buffer:
+            writeCRLF(dcursor, dend);
+            mSawLineEnd = false;
+            mCurrentLineLength = 0;
+        } else {
+            mFinished = true;
+            return flushOutputBuffer(dcursor, dend);
+        }
+    }
+
+    return mFinished && !d->outputBufferCursor;
+
+} // finish
+
+bool Rfc2047QEncodingEncoder::encode(const char *&scursor, const char *const send, char *&dcursor, const char *const dend)
+{
+    if (mInsideFinishing) {
+        return true;
+    }
+
+    while (scursor != send && dcursor != dend) {
+        uchar value = 0;
+        switch (mStepNo) {
+        case 0:
+            // read the next char and decide if and how do encode:
+            mAccu = *scursor++;
+            if (!needsEncoding(mAccu)) {
+                *dcursor++ = char(mAccu);
+            } else if (mEscapeChar == '=' && mAccu == 0x20) {
+                // shortcut encoding for 0x20 (latin-1/us-ascii SPACE)
+                // (not for rfc2231 encoding)
+                *dcursor++ = '_';
+            } else {
+                // needs =XY encoding - write escape char:
+                *dcursor++ = mEscapeChar;
+                mStepNo = 1;
+            }
+            continue;
+        case 1:
+            // extract hi-nibble:
+            value = highNibble(mAccu);
+            mStepNo = 2;
+            break;
+        case 2:
+            // extract lo-nibble:
+            value = lowNibble(mAccu);
+            mStepNo = 0;
+            break;
+        default:
+            assert(0);
+        }
+
+        // and write:
+        *dcursor++ = binToHex(value);
+    }
+
+    return scursor == send;
+} // encode
+
+bool Rfc2047QEncodingEncoder::finish(char *&dcursor, const char *const dend)
+{
+    mInsideFinishing = true;
+
+    // write the last bits of mAccu, if any:
+    while (mStepNo != 0 && dcursor != dend) {
+        uchar value = 0;
+        switch (mStepNo) {
+        case 1:
+            // extract hi-nibble:
+            value = highNibble(mAccu);
+            mStepNo = 2;
+            break;
+        case 2:
+            // extract lo-nibble:
+            value = lowNibble(mAccu);
+            mStepNo = 0;
+            break;
+        default:
+            assert(0);
+        }
+
+        // and write:
+        *dcursor++ = binToHex(value);
+    }
+
+    return mStepNo == 0;
+}
+
+} // namespace KCodecs