LLM for Unity v2.5.2
Create characters in Unity with LLMs!
LLMCharacter.cs
using System;
using System.Collections.Generic;
using System.IO;
using System.Threading;
using System.Threading.Tasks;
using UnityEditor;
using UnityEngine;

namespace LLMUnity
{
    [DefaultExecutionOrder(-2)]
    public class LLMCharacter : LLMCaller
    {
        [Tooltip("file to save the chat history. The file will be saved within the persistentDataPath directory.")]
        [LLM] public string save = "";
        [Tooltip("save the LLM cache. Speeds up the prompt calculation when reloading from history but also requires ~100MB of space per character.")]
        [LLM] public bool saveCache = false;
        [Tooltip("log the constructed prompt in the Unity Editor.")]
        [LLM] public bool debugPrompt = false;
        [Tooltip("maximum number of tokens that the LLM will predict (-1 = infinity).")]
        [Model] public int numPredict = -1;
        [Tooltip("slot of the server to use for computation (affects caching)")]
        [ModelAdvanced] public int slot = -1;
        [Tooltip("grammar file used for the LLMCharacter (.gbnf format)")]
        [ModelAdvanced] public string grammar = null;
        [Tooltip("grammar file used for the LLMCharacter (.json format)")]
        [ModelAdvanced] public string grammarJSON = null;
        [Tooltip("cache the processed prompt to avoid reprocessing the entire prompt every time (default: true, recommended!)")]
        [ModelAdvanced] public bool cachePrompt = true;
        [Tooltip("seed for reproducibility (-1 = no reproducibility).")]
        [ModelAdvanced] public int seed = 0;
        [Tooltip("LLM temperature, lower values give more deterministic answers.")]
        [ModelAdvanced, Float(0f, 2f)] public float temperature = 0.2f;
        [Tooltip("Top-k sampling selects the next token only from the top k most likely predicted tokens (0 = disabled). Higher values lead to more diverse text, while lower values will generate more focused and conservative text.")]
        [ModelAdvanced, Int(-1, 100)] public int topK = 40;
        [Tooltip("Top-p sampling selects the next token from a subset of tokens that together have a cumulative probability of at least p (1.0 = disabled). Higher values lead to more diverse text, while lower values will generate more focused and conservative text.")]
        [ModelAdvanced, Float(0f, 1f)] public float topP = 0.9f;
        [Tooltip("minimum probability for a token to be used.")]
        [ModelAdvanced, Float(0f, 1f)] public float minP = 0.05f;
        [Tooltip("Penalty based on repeated tokens to control the repetition of token sequences in the generated text.")]
        [ModelAdvanced, Float(0f, 2f)] public float repeatPenalty = 1.1f;
        [Tooltip("Penalty based on token presence in previous responses to control the repetition of token sequences in the generated text (0.0 = disabled).")]
        [ModelAdvanced, Float(0f, 1f)] public float presencePenalty = 0f;
        [Tooltip("Penalty based on token frequency in previous responses to control the repetition of token sequences in the generated text (0.0 = disabled).")]
        [ModelAdvanced, Float(0f, 1f)] public float frequencyPenalty = 0f;
        [Tooltip("enable locally typical sampling (1.0 = disabled). Higher values will promote more contextually coherent tokens, while lower values will promote more diverse tokens.")]
        [ModelAdvanced, Float(0f, 1f)] public float typicalP = 1f;
        [Tooltip("last n tokens to consider for penalizing repetition (0 = disabled, -1 = ctx-size).")]
        [ModelAdvanced, Int(0, 2048)] public int repeatLastN = 64;
        [Tooltip("penalize newline tokens when applying the repeat penalty.")]
        [ModelAdvanced] public bool penalizeNl = true;
        [Tooltip("prompt for the purpose of the penalty evaluation. Can be either null, a string or an array of numbers representing tokens (null/'' = use original prompt)")]
        [ModelAdvanced] public string penaltyPrompt;
        [Tooltip("enable Mirostat sampling, controlling perplexity during text generation (0 = disabled, 1 = Mirostat, 2 = Mirostat 2.0).")]
        [ModelAdvanced, Int(0, 2)] public int mirostat = 0;
        [Tooltip("The Mirostat target entropy (tau) controls the balance between coherence and diversity in the generated text.")]
        [ModelAdvanced, Float(0f, 10f)] public float mirostatTau = 5f;
        [Tooltip("The Mirostat learning rate (eta) controls how quickly the algorithm responds to feedback from the generated text.")]
        [ModelAdvanced, Float(0f, 1f)] public float mirostatEta = 0.1f;
        [Tooltip("if greater than 0, the response also contains the probabilities of top N tokens for each generated token.")]
        [ModelAdvanced, Int(0, 10)] public int nProbs = 0;
        [Tooltip("ignore end of stream token and continue generating.")]
        [ModelAdvanced] public bool ignoreEos = false;
        [Tooltip("number of tokens to retain from the prompt when the model runs out of context (-1 = LLMCharacter prompt tokens if setNKeepToPrompt is set to true).")]
        public int nKeep = -1;
        [Tooltip("stopwords to stop the LLM in addition to the default stopwords from the chat template.")]
        public List<string> stop = new List<string>();
        [Tooltip("the logit bias option allows to manually adjust the likelihood of specific tokens appearing in the generated text. By providing a token ID and a positive or negative bias value, you can increase or decrease the probability of that token being generated.")]
        public Dictionary<int, string> logitBias = null;
        [Tooltip("Receive the reply from the model as it is produced (recommended!). If not selected, the full reply from the model is received in one go")]
        [Chat] public bool stream = true;
        [Tooltip("the name of the player")]
        [Chat] public string playerName = "user";
        [Tooltip("the name of the AI")]
        [Chat] public string AIName = "assistant";
        [Tooltip("a description of the AI role (system prompt)")]
        [TextArea(5, 10), Chat] public string prompt = "A chat between a curious human and an artificial intelligence assistant. The assistant gives helpful, detailed, and polite answers to the human's questions.";
        [Tooltip("set the number of tokens to always retain from the prompt (nKeep) based on the LLMCharacter system prompt")]
        public bool setNKeepToPrompt = true;
        [Tooltip("the chat history as list of chat messages")]
        public List<ChatMessage> chat = new List<ChatMessage>();
        [Tooltip("the GBNF grammar to use")]
        public string grammarString;
        [Tooltip("the JSON schema grammar to use")]
        public string grammarJSONString;

        protected SemaphoreSlim chatLock = new SemaphoreSlim(1, 1);
        protected string chatTemplate;
        protected ChatTemplate template = null;

        public override void Awake()
        {
            if (!enabled) return;
            base.Awake();
            if (!remote)
            {
                int slotFromServer = llm.Register(this);
                if (slot == -1) slot = slotFromServer;
            }
            InitGrammar();
            InitHistory();
        }

        protected override void OnValidate()
        {
            base.OnValidate();
            if (llm != null && llm.parallelPrompts > -1 && (slot < -1 || slot >= llm.parallelPrompts)) LLMUnitySetup.LogError($"The slot needs to be between 0 and {llm.parallelPrompts-1}, or -1 to be automatically set");
        }

        protected override string NotValidLLMError()
        {
            return base.NotValidLLMError() + $", it is an embedding only model";
        }

        public override bool IsValidLLM(LLM llmSet)
        {
            return !llmSet.embeddingsOnly;
        }

        protected virtual void InitHistory()
        {
            ClearChat();
            _ = LoadHistory();
        }

        protected virtual async Task LoadHistory()
        {
            if (save == "" || !File.Exists(GetJsonSavePath(save))) return;
            await chatLock.WaitAsync(); // acquire the lock
            try
            {
                await Load(save);
            }
            finally
            {
                chatLock.Release(); // release the lock
            }
        }

        protected virtual string GetSavePath(string filename)
        {
            return Path.Combine(Application.persistentDataPath, filename).Replace('\\', '/');
        }

        public virtual string GetJsonSavePath(string filename)
        {
            return GetSavePath(filename + ".json");
        }

        public virtual string GetCacheSavePath(string filename)
        {
            return GetSavePath(filename + ".cache");
        }

        public virtual void ClearChat()
        {
            chat.Clear();
            ChatMessage promptMessage = new ChatMessage { role = "system", content = prompt };
            chat.Add(promptMessage);
        }

        public virtual void SetPrompt(string newPrompt, bool clearChat = true)
        {
            prompt = newPrompt;
            nKeep = -1;
            if (clearChat) ClearChat();
            else chat[0] = new ChatMessage { role = "system", content = prompt };
        }

        protected virtual bool CheckTemplate()
        {
            if (template == null)
            {
                LLMUnitySetup.LogError("Template not set!");
                return false;
            }
            return true;
        }

        protected virtual async Task<bool> InitNKeep()
        {
            if (setNKeepToPrompt && nKeep == -1)
            {
                if (!CheckTemplate()) return false;
                string systemPrompt = template.ComputePrompt(new List<ChatMessage>(){chat[0]}, playerName, "", false);
                List<int> tokens = await Tokenize(systemPrompt);
                if (tokens == null) return false;
                SetNKeep(tokens);
            }
            return true;
        }

        protected virtual void InitGrammar()
        {
            grammarString = "";
            grammarJSONString = "";
            if (!String.IsNullOrEmpty(grammar))
            {
                grammarString = File.ReadAllText(LLMUnitySetup.GetAssetPath(grammar));
                if (!String.IsNullOrEmpty(grammarJSON))
                    LLMUnitySetup.LogWarning("Both GBNF and JSON grammars are set, only the GBNF will be used");
            }
            else if (!String.IsNullOrEmpty(grammarJSON))
            {
                grammarJSONString = File.ReadAllText(LLMUnitySetup.GetAssetPath(grammarJSON));
            }
        }

        protected virtual void SetNKeep(List<int> tokens)
        {
            // set the tokens to keep
            nKeep = tokens.Count;
        }

        public virtual async Task LoadTemplate()
        {
            string llmTemplate;
            if (remote)
            {
                llmTemplate = await AskTemplate();
            }
            else
            {
                llmTemplate = llm.GetTemplate();
            }
            if (llmTemplate != chatTemplate)
            {
                chatTemplate = llmTemplate;
                template = chatTemplate == null ? null : ChatTemplate.GetTemplate(chatTemplate);
                nKeep = -1;
            }
        }

        public virtual async Task SetGrammarFile(string path, bool gnbf)
        {
#if UNITY_EDITOR
            if (!EditorApplication.isPlaying) path = LLMUnitySetup.AddAsset(path);
#endif
            await LLMUnitySetup.AndroidExtractAsset(path, true);
            if (gnbf) grammar = path;
            else grammarJSON = path;
            InitGrammar();
        }

        public virtual async Task SetGrammar(string path)
        {
            await SetGrammarFile(path, true);
        }

        public virtual async Task SetJSONGrammar(string path)
        {
            await SetGrammarFile(path, false);
        }

        protected virtual List<string> GetStopwords()
        {
            if (!CheckTemplate()) return null;
            List<string> stopAll = new List<string>(template.GetStop(playerName, AIName));
            if (stop != null) stopAll.AddRange(stop);
            return stopAll;
        }

        protected virtual ChatRequest GenerateRequest(string prompt)
        {
            // setup the request struct
            ChatRequest chatRequest = new ChatRequest();
            if (debugPrompt) LLMUnitySetup.Log(prompt);
            // the prompt and the generation parameters (temperature, topK, topP, penalties, etc.)
            // are copied from the corresponding fields into chatRequest;
            // the individual field assignments are not shown in this listing
            chatRequest.stop = GetStopwords();
            return chatRequest;
        }

        public virtual void AddMessage(string role, string content)
        {
            // add the question / answer to the chat list, update prompt
            chat.Add(new ChatMessage { role = role, content = content });
        }

        public virtual void AddPlayerMessage(string content)
        {
            AddMessage(playerName, content);
        }

        public virtual void AddAIMessage(string content)
        {
            AddMessage(AIName, content);
        }

        protected virtual string ChatContent(ChatResult result)
        {
            // get the content from a chat result received from the endpoint
            return result.content.Trim();
        }

        protected virtual string MultiChatContent(MultiChatResult result)
        {
            // concatenate the content of a streaming chat result received from the endpoint
            string response = "";
            foreach (ChatResult resultPart in result.data)
            {
                response += resultPart.content;
            }
            return response.Trim();
        }

        protected virtual string SlotContent(SlotResult result)
        {
            // get the filename from a slot result received from the endpoint
            return result.filename;
        }

        protected virtual string TemplateContent(TemplateResult result)
        {
            // get the chat template from a template result received from the endpoint
            return result.template;
        }

        protected virtual string ChatRequestToJson(ChatRequest request)
        {
            string json = JsonUtility.ToJson(request);
            int grammarIndex = json.LastIndexOf('}');
            if (!String.IsNullOrEmpty(request.grammar))
            {
                // the grammar string is serialised separately (as grammarToJSON) so that it is
                // properly escaped; the construction of grammarToJSON is not shown in this listing
                int start = grammarToJSON.IndexOf(":\"") + 2;
                int end = grammarToJSON.LastIndexOf("\"");
                string grammarSerialised = grammarToJSON.Substring(start, end - start);
                json = json.Insert(grammarIndex, $",\"grammar\": \"{grammarSerialised}\"");
            }
            else if (!String.IsNullOrEmpty(request.json_schema))
            {
                json = json.Insert(grammarIndex, $",\"json_schema\":{request.json_schema}");
            }
            return json;
        }

        protected virtual async Task<string> CompletionRequest(ChatRequest request, Callback<string> callback = null)
        {
            string json = ChatRequestToJson(request);
            string result = "";
            if (stream)
            {
                result = await PostRequest<MultiChatResult, string>(json, "completion", MultiChatContent, callback);
            }
            else
            {
                result = await PostRequest<ChatResult, string>(json, "completion", ChatContent, callback);
            }
            return result;
        }

        protected async Task<ChatRequest> PromptWithQuery(string query)
        {
            ChatRequest result = default;
            await chatLock.WaitAsync();
            try
            {
                AddPlayerMessage(query);
                string prompt = template.ComputePrompt(chat, playerName, AIName);
                result = GenerateRequest(prompt);
                chat.RemoveAt(chat.Count - 1);
            }
            finally
            {
                chatLock.Release();
            }
            return result;
        }

        public virtual async Task<string> Chat(string query, Callback<string> callback = null, EmptyCallback completionCallback = null, bool addToHistory = true)
        {
            // handle a chat message by the user
            // call the callback function while the answer is received
            // call the completionCallback function when the answer is fully received
            await LoadTemplate();
            if (!CheckTemplate()) return null;
            if (!await InitNKeep()) return null;

            ChatRequest request = await PromptWithQuery(query);
            string result = await CompletionRequest(request, callback);

            if (addToHistory && result != null)
            {
                await chatLock.WaitAsync();
                try
                {
                    AddPlayerMessage(query);
                    AddAIMessage(result);
                }
                finally
                {
                    chatLock.Release();
                }
                if (save != "") _ = Save(save);
            }

            completionCallback?.Invoke();
            return result;
        }

        public virtual async Task<string> Complete(string prompt, Callback<string> callback = null, EmptyCallback completionCallback = null)
        {
            // handle a completion request by the user
            // call the callback function while the answer is received
            // call the completionCallback function when the answer is fully received

            ChatRequest request = GenerateRequest(prompt);
            string result = await CompletionRequest(request, callback);
            completionCallback?.Invoke();
            return result;
        }

        public virtual async Task Warmup(EmptyCallback completionCallback = null)
        {
            await Warmup(null, completionCallback);
        }

        public virtual async Task Warmup(string query, EmptyCallback completionCallback = null)
        {
            await LoadTemplate();
            if (!CheckTemplate()) return;
            if (!await InitNKeep()) return;

            ChatRequest request;
            if (String.IsNullOrEmpty(query))
            {
                string prompt = template.ComputePrompt(chat, playerName, AIName, false);
                request = GenerateRequest(prompt);
            }
            else
            {
                request = await PromptWithQuery(query);
            }

            await CompletionRequest(request);
            completionCallback?.Invoke();
        }

        public virtual async Task<string> AskTemplate()
        {
            return await PostRequest<TemplateResult, string>("{}", "template", TemplateContent);
        }

        protected override void CancelRequestsLocal()
        {
            if (slot >= 0) llm.CancelRequest(slot);
        }

        protected virtual async Task<string> Slot(string filepath, string action)
        {
            // build the request for the slots endpoint from the slot id, the file path and
            // the action ("save" or "restore"); the construction of slotRequest is not shown in this listing
            string json = JsonUtility.ToJson(slotRequest);
            return await PostRequest<SlotResult, string>(json, "slots", SlotContent);
        }

        public virtual async Task<string> Save(string filename)
        {
            string filepath = GetJsonSavePath(filename);
            string dirname = Path.GetDirectoryName(filepath);
            if (!Directory.Exists(dirname)) Directory.CreateDirectory(dirname);
            string json = JsonUtility.ToJson(new ChatListWrapper { chat = chat.GetRange(1, chat.Count - 1) });
            File.WriteAllText(filepath, json);

            string cachepath = GetCacheSavePath(filename);
            if (remote || !saveCache) return null;
            string result = await Slot(cachepath, "save");
            return result;
        }

        public virtual async Task<string> Load(string filename)
        {
            string filepath = GetJsonSavePath(filename);
            if (!File.Exists(filepath))
            {
                LLMUnitySetup.LogError($"File {filepath} does not exist.");
                return null;
            }
            string json = File.ReadAllText(filepath);
            List<ChatMessage> chatHistory = JsonUtility.FromJson<ChatListWrapper>(json).chat;
            ClearChat();
            chat.AddRange(chatHistory);
            LLMUnitySetup.Log($"Loaded {filepath}");

            string cachepath = GetCacheSavePath(filename);
            if (remote || !saveCache || !File.Exists(GetSavePath(cachepath))) return null;
            string result = await Slot(cachepath, "restore");
            return result;
        }

        protected override async Task<Ret> PostRequestLocal<Res, Ret>(string json, string endpoint, ContentCallback<Res, Ret> getContent, Callback<Ret> callback = null)
        {
            if (endpoint != "completion") return await base.PostRequestLocal(json, endpoint, getContent, callback);

            while (!llm.failed && !llm.started) await Task.Yield();

            string callResult = null;
            bool callbackCalled = false;
            if (llm.embeddingsOnly) LLMUnitySetup.LogError("The LLM can't be used for completion, only for embeddings");
            else
            {
                Callback<string> callbackString = null;
                if (stream && callback != null)
                {
                    if (typeof(Ret) == typeof(string))
                    {
                        callbackString = (strArg) =>
                        {
                            // convert the partial completion string and forward it to the callback
                            // (the conversion call is not shown in this listing)
                        };
                    }
                    else
                    {
                        LLMUnitySetup.LogError($"wrong callback type, should be string");
                    }
                    callbackCalled = true;
                }
                callResult = await llm.Completion(json, callbackString);
            }

            // convert callResult to the requested return type (conversion not shown in this listing)
            if (!callbackCalled) callback?.Invoke(result);
            return result;
        }
    }

    [Serializable]
    public class ChatListWrapper
    {
        public List<ChatMessage> chat;
    }
}
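
For orientation, a minimal usage sketch of the class above. The MonoBehaviour, the field name llmCharacter and the messages are illustrative and assume the component has already been configured in the Inspector with an LLM and a system prompt.

    using UnityEngine;
    using LLMUnity;

    // Illustrative sketch: query an LLMCharacter and stream the reply to the console.
    public class ChatExample : MonoBehaviour
    {
        public LLMCharacter llmCharacter; // assumed to be assigned in the Inspector

        async void Start()
        {
            string reply = await llmCharacter.Chat(
                "Hello, who are you?",
                partial => Debug.Log(partial),      // called while the reply is being produced (stream = true)
                () => Debug.Log("reply complete")); // called once the full reply has been received
            Debug.Log(reply);
        }
    }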
Class implementing the skeleton of a chat template.
static ChatTemplate GetTemplate(string template)
Creates the chat template based on the provided chat template name.
Class implementing the LLM characters.
bool cachePrompt
cache the processed prompt to avoid reprocessing the entire prompt every time (default: true,...
int slot
slot of the server to use for computation (affects caching)
virtual async Task SetJSONGrammar(string path)
Sets the grammar file of the LLMCharacter (JSON schema)
virtual async Task< string > Chat(string query, Callback< string > callback=null, EmptyCallback completionCallback=null, bool addToHistory=true)
Chat functionality of the LLM. It calls the LLM completion based on the provided query including the ...
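A hedged example of calling Chat from an async method; llmCharacter and uiText are illustrative names, and the query is added to the chat history because addToHistory defaults to true.

    // stream the reply into a UI element while it is generated
    string reply = await llmCharacter.Chat(
        "What can you do?",
        partial => uiText.text = partial,     // invoked repeatedly while streaming
        () => Debug.Log("answer complete"));  // invoked once at the end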
string grammarJSONString
the JSON schema grammar to use
List< string > stop
stopwords to stop the LLM in addition to the default stopwords from the chat template.
float topP
Top-p sampling selects the next token from a subset of tokens that together have a cumulative probabi...
virtual async Task LoadTemplate()
Loads the chat template of the LLMCharacter.
string AIName
the name of the AI
int nProbs
if greater than 0, the response also contains the probabilities of top N tokens for each generated to...
bool ignoreEos
ignore end of stream token and continue generating.
float mirostatTau
The Mirostat target entropy (tau) controls the balance between coherence and diversity in the generat...
int numPredict
maximum number of tokens that the LLM will predict (-1 = infinity).
string prompt
a description of the AI role (system prompt)
float temperature
LLM temperature, lower values give more deterministic answers.
override void Awake()
The Unity Awake function that initializes the state before the application starts....
float presencePenalty
Penalty based on token presence in previous responses to control the repetition of token sequences in...
virtual async Task< string > AskTemplate()
Asks the LLM for the chat template to use.
string playerName
the name of the player
virtual string GetCacheSavePath(string filename)
Allows to get the save path of the LLM cache based on the provided filename or relative path.
float mirostatEta
The Mirostat learning rate (eta) controls how quickly the algorithm responds to feedback from the gen...
float minP
minimum probability for a token to be used.
float typicalP
enable locally typical sampling (1.0 = disabled). Higher values will promote more contextually cohere...
virtual async Task< string > Load(string filename)
Load the chat history and cache from the provided filename / relative path.
int nKeep
number of tokens to retain from the prompt when the model runs out of context (-1 = LLMCharacter prom...
bool penalizeNl
penalize newline tokens when applying the repeat penalty.
bool debugPrompt
log the constructed prompt in the Unity Editor.
string grammarJSON
grammar file used for the LLMCharacter (.json format)
bool saveCache
save the LLM cache. Speeds up the prompt calculation when reloading from history but also requires ~1...
int topK
Top-k sampling selects the next token only from the top k most likely predicted tokens (0 = disabled)...
virtual async Task SetGrammar(string path)
Sets the grammar file of the LLMCharacter (GBNF)
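A sketch of constrained generation; the grammar file names are illustrative and must exist as project assets.

    // constrain the output with a GBNF grammar before chatting
    await llmCharacter.SetGrammar("json.gbnf");
    // alternatively, use a JSON schema grammar:
    // await llmCharacter.SetJSONGrammar("reply_schema.json");
    string reply = await llmCharacter.Chat("List three colors as JSON.");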
string grammar
grammar file used for the LLMCharacter (.gbnf format)
virtual async Task< string > Save(string filename)
Saves the chat history and cache to the provided filename / relative path.
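A sketch of persisting and restoring a conversation; "player1" is an illustrative filename that is resolved under Application.persistentDataPath (see GetJsonSavePath / GetCacheSavePath).

    // save the chat history (and the LLM cache if saveCache is enabled) ...
    await llmCharacter.Save("player1");
    // ... and restore it later, e.g. after the scene is reloaded
    await llmCharacter.Load("player1");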
virtual void AddAIMessage(string content)
Allows to add an AI message in the chat history.
string penaltyPrompt
prompt for the purpose of the penalty evaluation. Can be either null, a string or an array of numbers...
override bool IsValidLLM(LLM llmSet)
Checks if an LLM is valid for the LLMCaller.
virtual void AddPlayerMessage(string content)
Allows to add a player message in the chat history.
float repeatPenalty
Penalty based on repeated tokens to control the repetition of token sequences in the generated text.
virtual string GetJsonSavePath(string filename)
Allows to get the save path of the chat history based on the provided filename or relative path.
bool stream
Receive the reply from the model as it is produced (recommended!). If not selected,...
virtual async Task SetGrammarFile(string path, bool gnbf)
Sets the grammar file of the LLMCharacter.
float frequencyPenalty
Penalty based on token frequency in previous responses to control the repetition of token sequences i...
virtual async Task Warmup(EmptyCallback completionCallback=null)
Allow to warm-up a model by processing the system prompt. The prompt processing will be cached (if ca...
int mirostat
enable Mirostat sampling, controlling perplexity during text generation (0 = disabled,...
bool setNKeepToPrompt
set the number of tokens to always retain from the prompt (nKeep) based on the LLMCharacter system pr...
int repeatLastN
last n tokens to consider for penalizing repetition (0 = disabled, -1 = ctx-size).
int seed
seed for reproducibility (-1 = no reproducibility).
string grammarString
the GBNF grammar to use
Dictionary< int, string > logitBias
the logit bias option allows to manually adjust the likelihood of specific tokens appearing in the ge...
virtual async Task< string > Complete(string prompt, Callback< string > callback=null, EmptyCallback completionCallback=null)
Pure completion functionality of the LLM. It calls the LLM completion based solely on the provided pr...
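A hedged example of the pure completion path, which sends the prompt as-is without the chat template or history; llmCharacter is an illustrative name.

    // plain text completion: nothing is added to the chat history
    string completion = await llmCharacter.Complete(
        "The capital of France is",
        partial => Debug.Log(partial));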
virtual void AddMessage(string role, string content)
Allows to add a message in the chat history.
virtual async Task Warmup(string query, EmptyCallback completionCallback=null)
Allow to warm-up a model by processing the provided prompt without adding it to history....
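Warmup can be used to hide the initial prompt-processing latency, e.g. behind a loading screen; a rough sketch assuming an already configured llmCharacter.

    // process the system prompt ahead of time so the first Chat call responds faster
    await llmCharacter.Warmup(() => Debug.Log("character ready"));
    // or warm up on an expected query without adding it to the history:
    // await llmCharacter.Warmup("Hello!", () => Debug.Log("character ready"));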
virtual void ClearChat()
Clear the chat of the LLMCharacter.
List< ChatMessage > chat
the chat history as list of chat messages
string save
file to save the chat history. The file will be saved within the persistentDataPath directory.
virtual void SetPrompt(string newPrompt, bool clearChat=true)
Set the system prompt for the LLMCharacter.
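For example, a character's role can be switched at runtime; clearing the chat makes the new system prompt take effect from a clean history.

    // replace the system prompt and start a fresh conversation
    llmCharacter.SetPrompt("You are a gruff blacksmith in a medieval village.", clearChat: true);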
Class implementing helper functions for setup and process management.
Class implementing the LLM server.
Definition LLM.cs:19