src/ChatWrapper.ts

import {
    ChatHistoryItem, ChatModelFunctionCall, ChatModelFunctions, ChatModelResponse, ChatModelSegmentType,
    ChatWrapperCheckModelCompatibilityParams, ChatWrapperGenerateContextStateOptions, ChatWrapperGeneratedContextState,
    ChatWrapperGenerateInitialHistoryOptions, ChatWrapperSettings, isChatModelResponseSegment
} from "./types.js";
import {LlamaText, SpecialTokensText} from "./utils/LlamaText.js";
import {ChatModelFunctionsDocumentationGenerator} from "./chatWrappers/utils/ChatModelFunctionsDocumentationGenerator.js";
import {jsonDumps} from "./chatWrappers/utils/jsonDumps.js";
import {defaultChatSystemPrompt} from "./config.js";
import {getChatWrapperSegmentDefinition} from "./utils/getChatWrapperSegmentDefinition.js";
import type {JinjaTemplateChatWrapperOptions} from "./chatWrappers/generic/JinjaTemplateChatWrapper.js";

export abstract class ChatWrapper {
    public static defaultSettings: ChatWrapperSettings = {
        supportsSystemMessages: true,
        functions: {
            call: {
                optionalPrefixSpace: true,
                prefix: "||call: ",
                paramsPrefix: LlamaText(new SpecialTokensText("(")),
                suffix: LlamaText(new SpecialTokensText(")")),
                emptyCallParamsPlaceholder: ""
            },
            result: {
                prefix: LlamaText(new SpecialTokensText("\n"), "||result: "),
                suffix: LlamaText(new SpecialTokensText("\n"))
            }
        },
        segments: {}
    };

    public abstract readonly wrapperName: string;
    public readonly settings: ChatWrapperSettings = ChatWrapper.defaultSettings;

    public generateContextState({
        chatHistory, availableFunctions, documentFunctionParams
    }: ChatWrapperGenerateContextStateOptions): ChatWrapperGeneratedContextState {
        const historyWithFunctions = this.addAvailableFunctionsSystemMessageToHistory(chatHistory, availableFunctions, {
            documentParams: documentFunctionParams
        });

        const texts = historyWithFunctions
            .map((item) => {
                if (item.type === "system")
                    return LlamaText(["system: ", LlamaText.fromJSON(item.text)]);
                else if (item.type === "user")
                    return LlamaText(["user: ", item.text]);
                else if (item.type === "model")
                    return LlamaText(["model: ", this.generateModelResponseText(item.response)]);

                return item satisfies never;
            });

        return {
            contextText: LlamaText.joinValues("\n", texts),
            stopGenerationTriggers: []
        };
    }

    public generateFunctionCallsAndResults(functionCalls: ChatModelFunctionCall[], useRawCall: boolean = true) {
        const calls: LlamaText[] = [];
        const results: LlamaText[] = [];
        const res: LlamaText[] = [];

        if (functionCalls.length === 0)
            return LlamaText([]);

        for (const functionCall of functionCalls) {
            if (useRawCall && functionCall.rawCall != null)
                calls.push(LlamaText.fromJSON(functionCall.rawCall));
            else
                calls.push(this.generateFunctionCall(functionCall.name, functionCall.params));

            results.push(this.generateFunctionCallResult(functionCall.name, functionCall.params, functionCall.result));
        }

        if (this.settings.functions.parallelism == null) {
            for (let i = 0; i < calls.length; i++) {
                res.push(calls[i]!);
                res.push(results[i]!);
            }

            return LlamaText(res);
        }

        res.push(LlamaText(this.settings.functions.parallelism.call.sectionPrefix ?? ""));
        for (let i = 0; i < calls.length; i++) {
            if (i > 0)
                res.push(LlamaText(this.settings.functions.parallelism.call.betweenCalls ?? ""));

            res.push(calls[i]!);
        }
        res.push(LlamaText(this.settings.functions.parallelism.call.sectionSuffix ?? ""));

        res.push(LlamaText(this.settings.functions.parallelism.result?.sectionPrefix ?? ""));
        for (let i = 0; i < results.length; i++) {
            if (i > 0)
                res.push(LlamaText(this.settings.functions.parallelism.result?.betweenResults ?? ""));

            res.push(results[i]!);
        }
        res.push(LlamaText(this.settings.functions.parallelism.result?.sectionSuffix ?? ""));

        return LlamaText(res);
    }

    public generateFunctionCall(name: string, params: any): LlamaText {
        const emptyCallParamsPlaceholder = this.settings.functions.call.emptyCallParamsPlaceholder;
        return LlamaText([
            this.settings.functions.call.prefix,
            name,
            this.settings.functions.call.paramsPrefix,
            (
                params === undefined
                    ? (emptyCallParamsPlaceholder === undefined || emptyCallParamsPlaceholder === "")
                        ? ""
                        : jsonDumps(emptyCallParamsPlaceholder)
                    : jsonDumps(params)
            ),
            this.settings.functions.call.suffix
        ]);
    }

    public generateFunctionCallResult(functionName: string, functionParams: any, result: any): LlamaText {
        function resolveParameters(text: string | LlamaText) {
            return LlamaText(text)
                .mapValues((value) => {
                    if (typeof value !== "string")
                        return value;

                    return value
                        .replaceAll("{{functionName}}", functionName)
                        .replaceAll("{{functionParams}}", functionParams === undefined ? "" : jsonDumps(functionParams));
                });
        }

        return LlamaText([
            resolveParameters(this.settings.functions.result.prefix),
            (
                result === undefined
                    ? "void"
                    : jsonDumps(result)
            ),
            resolveParameters(this.settings.functions.result.suffix)
        ]);
    }

    public generateModelResponseText(modelResponse: ChatModelResponse["response"], useRawValues: boolean = true): LlamaText {
        const res: LlamaText[] = [];
        const pendingFunctionCalls: ChatModelFunctionCall[] = [];
        const segmentStack: ChatModelSegmentType[] = [];
        let lastSegmentEndedWithoutSuffix: boolean = false;
        let needsToAddSegmentReminder = false;

        const addFunctionCalls = () => {
            if (pendingFunctionCalls.length === 0)
                return;

            res.push(this.generateFunctionCallsAndResults(pendingFunctionCalls, useRawValues));
            pendingFunctionCalls.length = 0;
            needsToAddSegmentReminder = true;
        };

        const addSegmentReminderIfNeeded = () => {
            if (lastSegmentEndedWithoutSuffix && segmentStack.length === 0 && this.settings.segments?.closeAllSegments != null) {
                lastSegmentEndedWithoutSuffix = false;
                res.push(LlamaText(this.settings.segments.closeAllSegments));
            } else if (needsToAddSegmentReminder && segmentStack.length > 0 && this.settings.segments?.reiterateStackAfterFunctionCalls) {
                for (const segmentType of segmentStack) {
                    const segmentDefinition = getChatWrapperSegmentDefinition(this.settings, segmentType);
                    if (segmentDefinition == null)
                        continue;

                    res.push(LlamaText(segmentDefinition.prefix));
                }
            }
        };

        for (const response of modelResponse) {
            if (typeof response === "string") {
                addFunctionCalls();
                addSegmentReminderIfNeeded();

                res.push(LlamaText(response));
                continue;
            } else if (isChatModelResponseSegment(response)) {
                addFunctionCalls();

                const segmentDefinition = getChatWrapperSegmentDefinition(this.settings, response.segmentType);
                if (response.raw != null && useRawValues)
                    res.push(LlamaText.fromJSON(response.raw));
                else
                    res.push(
                        LlamaText([
                            (segmentStack.length > 0 && segmentStack.at(-1) === response.segmentType)
                                ? ""
                                : segmentDefinition?.prefix ?? "",
                            response.text,
                            response.ended
                                ? (segmentDefinition?.suffix ?? "")
                                : ""
                        ])
                    );

                lastSegmentEndedWithoutSuffix = response.ended && segmentDefinition?.suffix == null;

                if (!response.ended && segmentStack.at(-1) !== response.segmentType)
                    segmentStack.push(response.segmentType);
                else if (response.ended && segmentStack.at(-1) === response.segmentType) {
                    segmentStack.pop();

                    if (segmentStack.length === 0 && segmentDefinition?.suffix == null && this.settings.segments?.closeAllSegments != null)
                        res.push(LlamaText(this.settings.segments.closeAllSegments));
                }

                continue;
            }

            if (response.startsNewChunk)
                addFunctionCalls();

            pendingFunctionCalls.push(response);
        }

        addFunctionCalls();
        addSegmentReminderIfNeeded();

        return LlamaText(res);
    }

    public generateAvailableFunctionsSystemText(availableFunctions: ChatModelFunctions, {documentParams = true}: {
        documentParams?: boolean
    }): LlamaText {
        const functionsDocumentationGenerator = new ChatModelFunctionsDocumentationGenerator(availableFunctions);

        if (!functionsDocumentationGenerator.hasAnyFunctions)
            return LlamaText([]);

        return LlamaText.joinValues("\n", [
            "The assistant calls the provided functions as needed to retrieve information instead of relying on existing knowledge.",
            "To fulfill a request, the assistant calls relevant functions in advance when needed before responding to the request, and does not tell the user prior to calling a function.",
            "Provided functions:",
            "```typescript",
            functionsDocumentationGenerator.getTypeScriptFunctionSignatures({documentParams}),
            "```",
            "",
            "Calling any of the provided functions can be done like this:",
            this.generateFunctionCall("getSomeInfo", {someKey: "someValue"}),
            "",
            "Note that the || prefix is mandatory.",
            "The assistant does not inform the user about using functions and does not explain anything before calling a function.",
            "After calling a function, the raw result appears afterwards and is not part of the conversation.",
            "To make information be part of the conversation, the assistant paraphrases and repeats the information without the function syntax."
        ]);
    }

    public addAvailableFunctionsSystemMessageToHistory(history: readonly ChatHistoryItem[], availableFunctions?: ChatModelFunctions, {
        documentParams = true
    }: {
        documentParams?: boolean
    } = {}) {
        const availableFunctionNames = Object.keys(availableFunctions ?? {});

        if (availableFunctions == null || availableFunctionNames.length === 0)
            return history;

        const res = history.slice();

        const firstNonSystemMessageIndex = res.findIndex((item) => item.type !== "system");
        res.splice(Math.max(0, firstNonSystemMessageIndex), 0, {
            type: "system",
            text: this.generateAvailableFunctionsSystemText(availableFunctions, {documentParams}).toJSON()
        });

        return res;
    }

    public generateInitialChatHistory({
        systemPrompt = defaultChatSystemPrompt
    }: ChatWrapperGenerateInitialHistoryOptions = {}): ChatHistoryItem[] {
        return [{
            type: "system",
            text: LlamaText(systemPrompt ?? defaultChatSystemPrompt).toJSON()
        }];
    }

    /** @internal */
    public static _getOptionConfigurationsToTestIfCanSupersedeJinjaTemplate(): ChatWrapperJinjaMatchConfiguration<typeof this> {
        return [{}] satisfies ChatWrapperJinjaMatchConfiguration<typeof this>;
    }

    /** @internal */
    public static _checkModelCompatibility(options: ChatWrapperCheckModelCompatibilityParams): boolean {
        return true;
    }
}

type FirstItemOfTupleOrFallback<T extends any[], Fallback> = T extends [infer U, ...any[]] ? U : Fallback;

export type ChatWrapperJinjaMatchConfiguration<T extends typeof ChatWrapper> = Array<
    FirstItemOfTupleOrFallback<ConstructorParameters<T>, object> |
    [
        testConfig: FirstItemOfTupleOrFallback<ConstructorParameters<T>, object>,
        applyConfig: FirstItemOfTupleOrFallback<ConstructorParameters<T>, object>,
        testJinjaChatWrapperOptions?: JinjaTemplateChatWrapperOptions
    ]
>;