ktextaddons/html/ollamareply_8cpp_source.html

// SPDX-FileCopyrightText: 2023 Loren Burkholder <computersemiexpert@outlook.com>

// SPDX-FileCopyrightText: 2023 Klarälvdalens Datakonsult AB, a KDAB Group company <info@kdab.com>

// SPDX-FileCopyrightText: 2025 Laurent Montel <montel@kde.org>

// Based on Alpaka code

// SPDX-License-Identifier: GPL-2.0-or-later


#include "ollamareply.h"

#include "autogeneratetext_ollama_debug.h"

#include <QJsonArray>

#include <QNetworkReply>


using namespace Qt::StringLiterals;


/**
 * Wraps @p netReply and incrementally parses the line-delimited JSON it delivers.
 *
 * Three signals of the network reply are observed:
 *  - downloadProgress: the newly received bytes are appended to an internal
 *    buffer; every complete ('\n'-terminated) line is parsed into a JSON
 *    document and stored, then contentAdded() is emitted.
 *  - errorOccurred: the error code is written to the debug log.
 *  - finished: the context and the statistics are taken from the last stored
 *    token (if any), the reply is marked as finished and finished() is emitted.
 *
 * @param netReply the network reply to read from.
 * @param parent the QObject parent.
 */
OllamaReply::OllamaReply(QNetworkReply *netReply, QObject *parent)
    : QObject{parent}
    , mReply{netReply}
{
    // The slots capture `this`, so `this` is used as the connection context:
    // the connections are then dropped when either this object or the network
    // reply is destroyed, and no slot can run on a destroyed OllamaReply.
    connect(mReply, &QNetworkReply::finished, this, [this] {
        // Normally, we could assume that the tokens will never be empty once the request finishes, but it could be possible
        // that the request failed and we have no tokens to parse.
        if (!mTokens.empty()) {
            const auto &finalResponse = mTokens.constLast();
            mContext.setContextData(finalResponse["context"_L1].toArray());
            mInfo.totalDuration = std::chrono::nanoseconds{finalResponse["total_duration"_L1].toVariant().toULongLong()};
            mInfo.loadDuration = std::chrono::nanoseconds{finalResponse["load_duration"_L1].toVariant().toULongLong()};
            mInfo.promptEvalTokenCount = finalResponse["prompt_eval_count"_L1].toVariant().toULongLong();
            mInfo.promptEvalDuration = std::chrono::nanoseconds{finalResponse["prompt_eval_duration"_L1].toVariant().toULongLong()};
            mInfo.tokenCount = finalResponse["eval_count"_L1].toVariant().toULongLong();
            mInfo.duration = std::chrono::nanoseconds{finalResponse["eval_duration"_L1].toVariant().toULongLong()};
        }

        qCDebug(AUTOGENERATETEXT_OLLAMA_LOG) << "Ollama response finished";
        mFinished = true;
        Q_EMIT finished();
    });
    connect(mReply, &QNetworkReply::errorOccurred, this, [](QNetworkReply::NetworkError e) {
        qCDebug(AUTOGENERATETEXT_OLLAMA_LOG) << "Ollama HTTP error:" << e;
    });
    connect(mReply, &QNetworkReply::downloadProgress, this, [this](qint64 received, qint64 /*total*/) {
        // Only the bytes that arrived since the previous notification are read.
        mIncompleteTokens += mReply->read(received - mReceivedSize);
        mReceivedSize = received;

        auto completeTokens = mIncompleteTokens.split('\n');
        if (completeTokens.size() <= 1) {
            // No line terminator yet: keep buffering.
            return;
        }
        // The piece after the last '\n' is an unfinished line (possibly empty);
        // it stays in the buffer until the rest of it arrives.
        mIncompleteTokens = completeTokens.last();
        completeTokens.removeLast();

        // append() takes care of growing the list across batches.
        for (const auto &tok : std::as_const(completeTokens)) {
            mTokens.append(QJsonDocument::fromJson(tok));
        }

        Q_EMIT contentAdded();
    });
}


/**
 * Get the current response content.
 *
 * Concatenates the "response" string of every token stored so far, in the
 * order the tokens were stored.
 *
 * @return the concatenated text; empty when no token has been stored yet.
 */
QString OllamaReply::readResponse() const
{
    QString text;
    for (auto it = mTokens.cbegin(), last = mTokens.cend(); it != last; ++it) {
        text.append((*it)["response"_L1].toString());
    }
    return text;
}


/**
 * Get the context token for this response.
 *
 * @return a reference to the context stored in this reply object.
 */
const TextAutogenerateText::TextAutogenerateTextContext &OllamaReply::context() const
{
    return this->mContext;
}


/**
 * Get extra information about the reply.
 *
 * @return a reference to the information record stored in this reply object.
 */
const OllamaReplyInfo &OllamaReply::info() const
{
    return this->mInfo;
}


bool OllamaReply::isFinished() const

{

    return mFinished;

}


#include "moc_ollamareply.cpp"

OllamaReply::context
const TextAutogenerateText::TextAutogenerateTextContext & context() const
Get the context token for this response.
Definition ollamareply.cpp:68

OllamaReply::readResponse
QString readResponse() const
Get the current response content.
Definition ollamareply.cpp:59

OllamaReply::isFinished
bool isFinished() const
Check whether the reply has finished.
Definition ollamareply.cpp:78

OllamaReply::info
const OllamaReplyInfo & info() const
Get extra information about the reply.
Definition ollamareply.cpp:73

TextAutogenerateText::TextAutogenerateTextContext
The TextAutogenerateTextContext class.
Definition textautogeneratetextcontext.h:17

QJsonDocument::fromJson
QJsonDocument fromJson(const QByteArray &json, QJsonParseError *error)

QNetworkReply

QNetworkReply::NetworkError
NetworkError

QNetworkReply::downloadProgress
void downloadProgress(qint64 bytesReceived, qint64 bytesTotal)

QNetworkReply::errorOccurred
void errorOccurred(QNetworkReply::NetworkError code)

QNetworkReply::finished
void finished()

QObject

QString

QtFuture::connect
QFuture< ArgsType< Signal > > connect(Sender *sender, Signal signal)

OllamaReplyInfo
The OllamaReplyInfo class represents information about a reply from an LLM.
Definition ollamareply.h:20