8 changed files with 88 additions and 463 deletions
--- a/bun.lockb
+++ b/bun.lockb
--- a/package.json
+++ b/package.json
@ -8,8 +8,6 @@
    "bake": "bun build/build.ts"
  },
  "dependencies": {
-    "@huggingface/gguf": "0.1.12",
-    "@huggingface/hub": "0.19.0",
    "@huggingface/jinja": "0.3.1",
    "@inquirer/select": "2.3.10",
    "ace-builds": "1.36.3",
--- a/src/games/ai/components/ace.tsx
+++ b/src/games/ai/components/ace.tsx
@ -26,8 +26,6 @@ export const Ace = ({ value, onInput }: IAceProps) => {
                displayIndentGuides: false,
                fontSize: 16,
                maxLines: Infinity,
-                tabSize: 2,
-                useSoftTabs: true,
                wrap: "free",
            });
            return e;
--- a/src/games/ai/components/header/header.module.css
+++ b/src/games/ai/components/header/header.module.css
@ -17,11 +17,10 @@
    .inputs {
        display: flex;
        flex-direction: row;
-    }

-    .info {
-        margin: 0 8px;
-        line-height: 36px;
+        select {
+            text-transform: capitalize;
+        }
    }

    .buttons {
--- a/src/games/ai/components/header/header.tsx
+++ b/src/games/ai/components/header/header.tsx
@ -11,25 +11,38 @@ import styles from './header.module.css';
 import { Ace } from "../ace";

 export const Header = () => {
-    const { modelName, modelTemplate, contextLength, promptTokens, blockConnection } = useContext(LLMContext);
+    const { getContextLength } = useContext(LLMContext);
    const {
        messages, connectionUrl, systemPrompt, lore, userPrompt, bannedWords, instruct,
        setConnectionUrl, setSystemPrompt, setLore, setUserPrompt, addSwipe, setBannedWords, setInstruct
    } = useContext(StateContext);
+    const [urlValid, setUrlValid] = useState(false);
+    const [urlEditing, setUrlEditing] = useState(false);

    const loreOpen = useBool();
    const promptsOpen = useBool();
    const assistantOpen = useBool();

    const bannedWordsInput = useMemo(() => bannedWords.join('\n'), [bannedWords]);
-    const urlValid = useMemo(() => contextLength > 0, [contextLength]);
+
+    const handleFocusUrl = useCallback(() => setUrlEditing(true), []); // focusing the field enters edit mode (validity styling and checks pause)

    const handleBlurUrl = useCallback(() => {
        const regex = /^(?:http(s?):\/\/)?(.*?)\/?$/i
        const normalizedConnectionUrl = connectionUrl.replace(regex, 'http$1://$2');
+        // Store the normalized URL, then leave edit mode with validity reset until it is checked again.
        setConnectionUrl(normalizedConnectionUrl);
-        blockConnection.setFalse();
-    }, [connectionUrl, setConnectionUrl, blockConnection]);
+        setUrlEditing(false);
+        setUrlValid(false);
+    }, [connectionUrl, setConnectionUrl]);
+
+    // Once editing ends, re-validate: the URL counts as valid when the backend reports a positive context length.
+    useEffect(() => {
+        if (urlEditing) return undefined;
+        let stale = false; // flipped by the cleanup so a reply for an outdated URL or edit state is dropped
+        getContextLength().then(length => { if (!stale) setUrlValid(length > 0); });
+        return () => { stale = true; };
+    }, [connectionUrl, urlEditing]);

    const handleAssistantAddSwipe = useCallback((answer: string) => {
        const index = messages.findLastIndex(m => m.role === 'assistant');
@ -56,28 +69,17 @@ export const Header = () => {
            <div class={styles.inputs}>
                <input value={connectionUrl}
                    onInput={setConnectionUrl}
-                    onFocus={blockConnection.setTrue}
+                    onFocus={handleFocusUrl}
                    onBlur={handleBlurUrl}
-                    class={blockConnection.value ? '' : urlValid ? styles.valid : styles.invalid}
+                    class={urlEditing ? '' : urlValid ? styles.valid : styles.invalid}
                />
-                <select value={instruct} onChange={setInstruct} title='Instruct template'>
-                    {modelName && modelTemplate && <optgroup label='Native model template'>
-                        <option value={modelTemplate} title='Native for model'>{modelName}</option>
-                    </optgroup>}
-                    <optgroup label='Manual templates'>
-                        {Object.entries(Instruct).map(([label, value]) => (
-                            <option value={value} key={value}>
-                                {label.toLowerCase()}
-                            </option>
-                        ))}
-                    </optgroup>
-                    <optgroup label='Custom'>
-                        <option value={instruct}>Custom</option>
-                    </optgroup>
+                <select value={instruct} onChange={setInstruct}>
+                    {Object.entries(Instruct).map(([label, value]) => (
+                        <option value={value} key={value}>
+                            {label.toLowerCase()}
+                        </option>
+                    ))}
                </select>
-                <div class={styles.info}>
-                    {promptTokens} / {contextLength}
-                </div>
            </div>
            <div class={styles.buttons}>
                <button class='icon color' title='Edit lore' onClick={loreOpen.setTrue}>
@ -109,9 +111,6 @@ export const Header = () => {
                    <h4 class={styles.modalTitle}>User prompt template</h4>
                    <Ace value={userPrompt} onInput={setUserPrompt} />
                    <hr />
-                    <h4 class={styles.modalTitle}>Instruct template</h4>
-                    <Ace value={instruct} onInput={setInstruct} />
-                    <hr />
                    <h4 class={styles.modalTitle}>Banned phrases</h4>
                    <AutoTextarea
                        placeholder="Each phrase on separate line"
--- a/src/games/ai/contexts/llm.tsx
+++ b/src/games/ai/contexts/llm.tsx
@ -1,12 +1,17 @@
 import Lock from "@common/lock";
 import SSE from "@common/sse";
 import { createContext } from "preact";
-import { useCallback, useContext, useEffect, useMemo, useState } from "preact/hooks";
+import { useContext, useEffect, useMemo } from "preact/hooks";
 import { MessageTools, type IMessage } from "../messages";
-import { Instruct, StateContext } from "./state";
+import { StateContext } from "./state";
 import { useBool } from "@common/hooks/useBool";
 import { Template } from "@huggingface/jinja";
-import { Huggingface } from "../huggingface";
+
+/** One chat turn as handed to the chat template: an element of the `messages` array it renders. */
+interface ITemplateMessage {
+    role: 'user' | 'assistant' | 'system';
+    content: string;
+}

 interface ICompileArgs {
    keepUsers?: number;
@ -20,12 +25,6 @@ interface ICompiledPrompt {

 interface IContext {
    generating: boolean;
-    blockConnection: ReturnType<typeof useBool>;
-    modelName: string;
-    modelTemplate: string;
-    hasToolCalls: boolean;
-    promptTokens: number;
-    contextLength: number;
 }

 const DEFAULT_GENERATION_SETTINGS = {
@ -45,53 +44,23 @@ const DEFAULT_GENERATION_SETTINGS = {
 type IGenerationSettings = Partial<typeof DEFAULT_GENERATION_SETTINGS>;

 interface IActions {
+    applyChatTemplate: (messages: ITemplateMessage[], templateString: string, eosToken?: string) => string; // NOTE(review): the implementation in this file takes only the first two arguments — confirm eosToken is still needed
    compilePrompt: (messages: IMessage[], args?: ICompileArgs) => Promise<ICompiledPrompt>;
    generate: (prompt: string, extraSettings?: IGenerationSettings) => AsyncGenerator<string>;
-    countTokens: (prompt: string) => Promise<number>;
+    countTokens(prompt: string): Promise<number>;
+    getContextLength(): Promise<number>; // resolves to 0 when no context length could be obtained
+
 }
 export type ILLMContext = IContext & IActions;

-export const normalizeModel = (model: string) => {
-    let currentModel = model.split(/[\\\/]/).at(-1);
-    currentModel = currentModel.split('::').at(0);
-    let normalizedModel: string;
-
-    do {
-        normalizedModel = currentModel;
-
-        currentModel = currentModel
-            .replace(/[ ._-]\d+(k$|-context)/i, '') // remove context length, i.e. -32k
-            .replace(/[ ._-](gptq|awq|exl2?|imat|i\d)/i, '') // remove quant name
-            .replace(/([ ._-]?gg(uf|ml)[ ._-]?(v[ ._-]?\d)?)/i, '') // remove gguf-v3/ggml/etc
-            .replace(/[ ._-]i?q([ ._-]?\d[ ._-]?(k?[ ._-]?x*[ ._-]?[lms]?)?)+/i, '') // remove quant size
-            .replace(/[ ._-]\d+(\.\d+)?bpw/i, '') // remove bpw
-            .replace(/[ ._-]f(p|loat)?(8|16|32)/i, '')
-            .replace(/^(debug-?)+/i, '')
-            .trim();
-    } while (normalizedModel !== currentModel);
-
-    return normalizedModel
-        .replace(/[ _-]+/ig, '-')
-        .replace(/\.{2,}/, '-')
-        .replace(/[ ._-]+$/ig, '')
-        .trim();
-}
-
 export const LLMContext = createContext<ILLMContext>({} as ILLMContext);

 export const LLMContextProvider = ({ children }: { children?: any }) => {
    const {
        connectionUrl, messages, triggerNext, lore, userPrompt, systemPrompt, bannedWords, instruct,
-        setTriggerNext, addMessage, editMessage, setInstruct,
+        setTriggerNext, addMessage, editMessage,
    } = useContext(StateContext);
-
    const generating = useBool(false);
-    const blockConnection = useBool(false);
-    const [promptTokens, setPromptTokens] = useState(0);
-    const [contextLength, setContextLength] = useState(0);
-    const [modelName, setModelName] = useState('');
-    const [modelTemplate, setModelTemplate] = useState('');
-    const [hasToolCalls, setHasToolCalls] = useState(false);

    const userPromptTemplate = useMemo(() => {
        try {
@ -103,41 +72,17 @@ export const LLMContextProvider = ({ children }: { children?: any }) => {
        }
    }, [userPrompt]);

-    const getContextLength = useCallback(async () => {
-        if (!connectionUrl || blockConnection.value) {
-            return 0;
-        }
-        try {
-            const response = await fetch(`${connectionUrl}/api/extra/true_max_context_length`);
-            if (response.ok) {
-                const { value } = await response.json();
-                return value;
-            }
-        } catch (e) {
-            console.log('Error getting max tokens', e);
-        }
-
-        return 0;
-    }, [connectionUrl, blockConnection.value]);
-
-    const getModelName = useCallback(async () => {
-        if (!connectionUrl || blockConnection.value) {
-            return '';
-        }
-        try {
-            const response = await fetch(`${connectionUrl}/api/v1/model`);
-            if (response.ok) {
-                const { result } = await response.json();
-                return result;
-            }
-        } catch (e) {
-            console.log('Error getting max tokens', e);
-        }
-
-        return '';
-    }, [connectionUrl, blockConnection.value]);
-
    const actions: IActions = useMemo(() => ({
+        applyChatTemplate: (messages: ITemplateMessage[], templateString: string) => {
+            // Compile the Jinja chat template, then render the conversation through it.
+            // `add_generation_prompt` is always true, so templates that check it finish
+            // the prompt with the opening of the next assistant turn.
+            const compiled = new Template(templateString);
+            const variables = { messages, add_generation_prompt: true };
+
+            const rendered = compiled.render(variables);
+            return rendered;
+        },
        compilePrompt: async (messages, { keepUsers } = {}) => {
            const promptMessages = messages.slice();
            const lastMessage = promptMessages.at(-1);
@ -145,17 +90,17 @@ export const LLMContextProvider = ({ children }: { children?: any }) => {
            const isRegen = isAssistantLast && !MessageTools.getSwipe(lastMessage)?.content;
            const isContinue = isAssistantLast && !isRegen;

-            if (isContinue) {
-                promptMessages.push(MessageTools.create(userPromptTemplate.render({})));
-            }
-
            const userMessages = promptMessages.filter(m => m.role === 'user');
            const lastUserMessage = userMessages.at(-1);
            const firstUserMessage = userMessages.at(0);

+            if (isContinue) {
+                promptMessages.push(MessageTools.create(userPromptTemplate.render({})));
+            }
+
            const system = `${systemPrompt}\n\n${lore}`.trim();

-            const templateMessages: Huggingface.ITemplateMessage[] = [
+            const templateMessages: ITemplateMessage[] = [
                { role: 'system', content: system },
            ];

@ -183,6 +128,15 @@ export const LLMContextProvider = ({ children }: { children?: any }) => {
                        templateMessages.push({ role, content });
                    }
                }
+
+                if (templateMessages[1]?.role !== 'user') {
+                    const prompt = MessageTools.getSwipe(firstUserMessage)?.content;
+
+                    templateMessages.splice(1, 0, {
+                        role: 'user',
+                        content: userPromptTemplate.render({ prompt, isStart: true }),
+                    });
+                }
            } else {
                const story = promptMessages.filter(m => m.role === 'assistant')
                    .map(m => MessageTools.getSwipe(m)?.content.trim()).join('\n\n');
@ -203,16 +157,7 @@ export const LLMContextProvider = ({ children }: { children?: any }) => {
                }
            }

-            if (templateMessages[1]?.role !== 'user') {
-                const prompt = MessageTools.getSwipe(firstUserMessage)?.content;
-
-                templateMessages.splice(1, 0, {
-                    role: 'user',
-                    content: userPromptTemplate.render({ prompt, isStart: true }),
-                });
-            }
-
-            const prompt = Huggingface.applyChatTemplate(instruct, templateMessages);
+            const prompt = actions.applyChatTemplate(templateMessages, instruct);
            return {
                prompt,
                isContinue,
@ -303,6 +248,22 @@ export const LLMContextProvider = ({ children }: { children?: any }) => {
                console.log('Error counting tokens', e);
            }

+            return 0;
+        },
+        getContextLength: async () => {
+            // Resolves to the backend's max context length, or 0 without a URL, on failure, or on a non-numeric reply.
+            if (!connectionUrl) return 0;
+            try {
+                const response = await fetch(`${connectionUrl}/api/extra/true_max_context_length`);
+                if (response.ok) {
+                    const { value } = await response.json();
+                    // The body is untyped JSON: pass through finite numbers only to honor Promise<number>.
+                    if (Number.isFinite(value)) return value;
+                }
+            } catch (e) {
+                console.log('Error getting max tokens', e);
+            }
+
            return 0;
        },
    }), [connectionUrl, lore, userPromptTemplate, systemPrompt, bannedWords, instruct]);
@ -315,8 +276,6 @@ export const LLMContextProvider = ({ children }: { children?: any }) => {
            let text: string = '';

            const { prompt, isRegen } = await actions.compilePrompt(messages);
-            const tokens = await actions.countTokens(prompt);
-            setPromptTokens(tokens);

            if (!isRegen) {
                addMessage('', 'assistant');
@ -325,76 +284,18 @@ export const LLMContextProvider = ({ children }: { children?: any }) => {

            for await (const chunk of actions.generate(prompt)) {
                text += chunk;
-                setPromptTokens(tokens + Math.round(text.length * 0.25));
                editMessage(messageId, text);
            }

            text = MessageTools.trimSentence(text);
            editMessage(messageId, text);

-            setPromptTokens(0); // trigger calculation
-
            MessageTools.playReady();
        }
-    })(), [actions, triggerNext, messages, generating.value]);
-
-    useEffect(() => {
-        if (!blockConnection.value) {
-            setPromptTokens(0);
-            setContextLength(0);
-
-            getContextLength().then(setContextLength);
-        }
-    }, [connectionUrl, instruct, blockConnection.value]);
-
-    useEffect(() => {
-        if (!blockConnection.value) {
-            setModelName('');
-            getModelName().then(normalizeModel).then(setModelName);
-        }
-    }, [connectionUrl, blockConnection.value]);
-
-    useEffect(() => {
-        setModelTemplate('');
-        if (modelName) {
-            Huggingface.findModelTemplate(modelName)
-                .then((template) => {
-                    if (template) {
-                        setModelTemplate(template);
-                        setInstruct(template);
-                    } else {
-                        setInstruct(Instruct.CHATML);
-                    }
-                });
-        }
-    }, [modelName]);
-
-    useEffect(() => {
-        if (promptTokens === 0 && !blockConnection.value) {
-            actions.compilePrompt(messages)
-                .then(({ prompt }) => actions.countTokens(prompt))
-                .then(setPromptTokens)
-                .catch(e => console.error(`Could not count tokens`, e));
-        }
-    }, [actions, promptTokens, messages, blockConnection.value]);
-
-    useEffect(() => {
-        try {
-            const hasTools = Huggingface.testToolCalls(instruct);
-            setHasToolCalls(hasTools);
-        } catch {
-            setHasToolCalls(false);
-        }
-    }, [instruct]);
+    })(), [triggerNext, messages, generating.value]);

    const rawContext: IContext = {
        generating: generating.value,
-        blockConnection,
-        modelName,
-        modelTemplate,
-        hasToolCalls,
-        promptTokens,
-        contextLength,
    };

    const context = useMemo(() => rawContext, Object.values(rawContext));
--- a/src/games/ai/contexts/state.tsx
+++ b/src/games/ai/contexts/state.tsx
@ -38,13 +38,13 @@ interface IActions {
 const SAVE_KEY = 'ai_game_save_state';

 export enum Instruct {
-    CHATML = `{% for message in messages %}{{'<|im_start|>' + message['role'] + '\\n\\n' + message['content'] + '<|im_end|>' + '\\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\\n\\n' }}{% endif %}`,
+    LLAMA = `{% for message in messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n' + message['content'] | trim + '<|eot_id|>' %}{{ content }}{% endfor %}{% if add_generation_prompt %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}{% endif %}`,

-    LLAMA = `{% for message in messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\\n\\n' + message['content'] | trim + '<|eot_id|>' %}{{ content }}{% endfor %}{% if add_generation_prompt %}{{ '<|start_header_id|>assistant<|end_header_id|>\\n\\n' }}{% endif %}`,
+    MISTRAL = `{%- if messages[0]['role'] == 'system' %}{%- set system_message = messages[0]['content'] %}{%- set loop_messages = messages[1:] %}{%- else %}{%- set loop_messages = messages %}{%- endif %}{%- for message in loop_messages %}{%- if message['role'] == 'user' %}{%- if loop.first and system_message is defined %}{{- ' [INST] ' + system_message + '\n\n' + message['content'] + ' [/INST]' }}{%- else %}{{- ' [INST] ' + message['content'] + ' [/INST]' }}{%- endif %}{%- elif message['role'] == 'assistant' %}{{- ' ' + message['content'] + '</s>'}}{%- endif %}{%- endfor %}`,

-    MISTRAL = `{%- if messages[0]['role'] == 'system' %}{%- set system_message = messages[0]['content'] %}{%- set loop_messages = messages[1:] %}{%- else %}{%- set loop_messages = messages %}{%- endif %}{%- for message in loop_messages %}{%- if message['role'] == 'user' %}{%- if loop.first and system_message is defined %}{{- ' [INST] ' + system_message + '\\n\\n' + message['content'] + ' [/INST]' }}{%- else %}{{- ' [INST] ' + message['content'] + ' [/INST]' }}{%- endif %}{%- elif message['role'] == 'assistant' %}{{- ' ' + message['content'] + '</s>'}}{%- endif %}{%- endfor %}`,
+    CHATML = `{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n\n' }}{% endif %}`,

-    ALPACA = `{% for message in messages %}{% if message['role'] == 'system' and message['content'] %}{{ message['content'] + '\\n\\n'}}{% elif message['role'] == 'user' %}{{'### Instruction:\\n\\n' + message['content'] + '\\n\\n'}}{% elif message['role'] == 'assistant' %}{{'### Response:\\n\\n' + message['content'] + '\\n\\n'}}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '### Response:\\n\\n' }}{% endif %}`,
+    ALPACA = `{% for message in messages %}{% if message['role'] == 'system' and message['content'] %}{{ message['content'] + '\n\n'}}{% elif message['role'] == 'user' %}{{'### Instruction:\n\n' + message['content'] + '\n\n'}}{% elif message['role'] == 'assistant' %}{{'### Response:\n\n' + message['content'] + '\n\n'}}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '### Response:\n\n' }}{% endif %}`,
 };

 export const saveContext = (context: IContext) => {
@ -58,7 +58,7 @@ export const loadContext = (): IContext => {
    const defaultContext: IContext = {
        connectionUrl: 'http://localhost:5001',
        input: '',
-        instruct: Instruct.CHATML,
+        instruct: Instruct.LLAMA,
        systemPrompt: 'You are creative writer. Write a story based on the world description below.',
        lore: '',
        userPrompt: `{% if prompt %}{% if isStart %}Start{% else %}Continue{% endif %} this story, taking information into account: {{ prompt | trim }}
--- a/src/games/ai/huggingface.ts
+++ b/src/games/ai/huggingface.ts
@ -1,270 +0,0 @@
-import { gguf } from '@huggingface/gguf';
-import * as hub from '@huggingface/hub';
-import { Template } from '@huggingface/jinja';
-
-export namespace Huggingface {
-    export interface ITemplateMessage {
-        role: 'user' | 'assistant' | 'system';
-        content: string;
-    }
-
-    interface INumberParameter {
-        type: 'number';
-        enum?: number[];
-        description?: string;
-    }
-
-    interface IStringParameter {
-        type: 'string';
-        enum?: string[];
-        description?: string;
-    }
-
-    interface IArrayParameter {
-        type: 'array';
-        description?: string;
-        items: IParameter;
-    }
-
-    interface IObjectParameter {
-        type: 'object';
-        description?: string;
-        properties: Record<string, IParameter>;
-        required?: string[];
-    }
-
-    type IParameter = INumberParameter | IStringParameter | IArrayParameter | IObjectParameter;
-
-    interface ITool {
-        type: 'function',
-        function: {
-            name: string;
-            description?: string;
-            parameters?: IObjectParameter;
-        }
-    }
-
-    export interface IFunction {
-        name: string;
-        description?: string;
-        parameters?: Record<string, IParameter>;
-    }
-
-    interface TokenizerConfig {
-        chat_template: string;
-        bos_token?: string;
-        eos_token?: string;
-    }
-
-    const TEMPLATE_CACHE_KEY = 'ai_game_template_cache';
-
-    const loadCache = (): Record<string, string> => {
-        const json = localStorage.getItem(TEMPLATE_CACHE_KEY);
-
-        try {
-            if (json) {
-                const cache = JSON.parse(json);
-                if (cache && typeof cache === 'object') {
-                    return cache
-                }
-            }
-        } catch { }
-
-        return {};
-    };
-
-    const saveCache = (cache: Record<string, string>) => {
-        const json = JSON.stringify(cache);
-        localStorage.setItem(TEMPLATE_CACHE_KEY, json);
-    };
-
-    const templateCache: Record<string, string> = loadCache();
-
-    const hasField = <T extends string>(obj: unknown, field: T): obj is Record<T, unknown> => (
-        obj != null && typeof obj === 'object' && (field in obj)
-    );
-    const isTokenizerConfig = (obj: unknown): obj is TokenizerConfig => (
-        hasField(obj, 'chat_template') && (typeof obj.chat_template === 'string')
-        && (!hasField(obj, 'eos_token') || !obj.eos_token || typeof obj.eos_token === 'string')
-        && (!hasField(obj, 'bos_token') || !obj.bos_token || typeof obj.bos_token === 'string')
-    );
-
-    const loadHuggingfaceTokenizerConfig = async (modelName: string): Promise<TokenizerConfig | null> => {
-        console.log(`[huggingface] searching config for '${modelName}'`);
-
-        const hubModels = await Array.fromAsync(hub.listModels({ search: { query: modelName }, additionalFields: ['config'] }));
-        const models = hubModels.filter(m => {
-            if (m.gated) return false;
-            if (!m.name.toLowerCase().includes(modelName.toLowerCase())) return false;
-
-            return true;
-        }).sort((a, b) => b.downloads - a.downloads);
-
-        let tokenizerConfig: TokenizerConfig | null = null;
-
-        for (const model of models) {
-            const { config, name } = model;
-
-            if (name.toLowerCase().endsWith('-gguf')) continue;
-
-            if (hasField(config, 'tokenizer_config') && isTokenizerConfig(config.tokenizer_config)) {
-                tokenizerConfig = config.tokenizer_config;
-                break;
-            }
-
-            try {
-                console.log(`[huggingface] searching config in '${model.name}/tokenizer_config.json'`);
-                const fileResponse = await hub.downloadFile({ repo: model.name, path: 'tokenizer_config.json' });
-                if (fileResponse?.ok) {
-                    const maybeConfig = await fileResponse.json();
-                    if (isTokenizerConfig(maybeConfig)) {
-                        tokenizerConfig = maybeConfig;
-                        break;
-                    }
-                }
-            } catch { }
-        }
-
-        if (!tokenizerConfig) {
-            for (const model of models) {
-                try {
-                    for await (const file of hub.listFiles({ repo: model.name, recursive: true })) {
-                        if (file.type !== 'file' || !file.path.endsWith('.gguf')) continue;
-                        try {
-                            console.log(`[huggingface] searching config in '${model.name}/${file.path}'`);
-                            const fileInfo = await hub.fileDownloadInfo({ repo: model.name, path: file.path });
-                            if (fileInfo?.downloadLink) {
-                                const { metadata } = await gguf(fileInfo.downloadLink);
-                                if ('tokenizer.chat_template' in metadata) {
-                                    const chat_template = metadata['tokenizer.chat_template'];
-                                    const tokens = metadata['tokenizer.ggml.tokens'];
-                                    const bos_token = tokens[metadata['tokenizer.ggml.bos_token_id']];
-                                    const eos_token = tokens[metadata['tokenizer.ggml.eos_token_id']];
-
-                                    const maybeConfig = {
-                                        chat_template,
-                                        bos_token,
-                                        eos_token,
-                                    }
-
-                                    if (isTokenizerConfig(maybeConfig)) {
-                                        tokenizerConfig = maybeConfig;
-                                        break;
-                                    }
-                                } else if ('tokenizer.ggml.model' in metadata) {
-                                    break; // no reason to touch different quants
-                                }
-                            }
-                        } catch { }
-                    }
-
-                } catch { }
-
-                if (tokenizerConfig) {
-                    break;
-                }
-            }
-        }
-
-        if (tokenizerConfig) {
-            console.log(`[huggingface] found config for '${modelName}'`);
-            return {
-                chat_template: tokenizerConfig.chat_template,
-                eos_token: tokenizerConfig.eos_token,
-                bos_token: tokenizerConfig.bos_token,
-            };
-        }
-
-        console.log(`[huggingface] not found config for '${modelName}'`);
-        return null;
-    };
-
-    function updateRequired<T extends IParameter>(param: T): T {
-        if ('items' in param) {
-            updateRequired(param.items);
-        } else if ('properties' in param) {
-            for (const prop of Object.values(param.properties)) {
-                updateRequired(prop);
-            }
-            param.required = Object.keys(param.properties);
-        }
-
-        return param;
-    }
-
-    const convertFunctionToTool = (fn: IFunction): ITool => ({
-        type: 'function',
-        function: {
-            name: fn.name,
-            description: fn.description,
-            parameters: updateRequired({
-                type: 'object',
-                properties: fn.parameters ?? {},
-            })
-        }
-    })
-
-    export const testToolCalls = (template: string): boolean => {
-        const history: ITemplateMessage[] = [
-            { role: 'system', content: 'You are calculator.' },
-            { role: 'user', content: 'Calculate 2 + 2.' },
-        ];
-
-        const needle = '___AWOORWA_NEEDLE__';
-
-        const tools: IFunction[] = [{
-            name: 'add',
-            description: 'Test function',
-            parameters: {
-                a: { type: 'number' },
-                b: { type: 'number' },
-                c: { type: 'array', items: { type: 'number' } },
-                d: { type: 'object', properties: { inside: { type: 'number', description: needle } } },
-            }
-        }];
-
-        const text = applyChatTemplate(template, history, tools);
-
-        return text.includes(needle);
-    }
-
-    export const findModelTemplate = async (modelName: string): Promise<string | null> => {
-        const modelKey = modelName.toLowerCase();
-        let template = templateCache[modelKey] ?? null;
-
-        if (template) {
-            console.log(`[huggingface] found cached template for '${modelName}'`);
-        } else {
-            const config = await loadHuggingfaceTokenizerConfig(modelName);
-
-            if (config?.chat_template?.trim()) {
-                template = config.chat_template.trim()
-                    .replaceAll('eos_token', `'${config.eos_token ?? ''}'`)
-                    .replaceAll('bos_token', `''`);
-
-                if (config.bos_token) {
-                    template = template
-                        .replaceAll(config.bos_token, '')
-                        .replace(/\{\{ ?(''|"") ?\}\}/g, '');
-                }
-            }
-        }
-
-        templateCache[modelKey] = template;
-        saveCache(templateCache);
-
-        return template;
-    }
-
-    export const applyChatTemplate = (templateString: string, messages: ITemplateMessage[], functions?: IFunction[]) => {
-        const template = new Template(templateString);
-
-        const prompt = template.render({
-            messages,
-            add_generation_prompt: true,
-            tools: functions?.map(convertFunctionToTool),
-        });
-
-        return prompt;
-    };
-}