4using System.Collections.Generic;
6using System.Threading.Tasks;
20 public string filename;
23 public string chatTemplate;
25 public bool embeddingOnly;
26 public int embeddingLength;
27 public bool includeInBuild;
28 public int contextLength;
30 static List<string> embeddingOnlyArchs =
new List<string> {
"bert",
"nomic-bert",
"jina-bert-v2",
"t5",
"t5encoder"};
41 if (File.Exists(assetPath) &&
LLMUnitySetup.IsSubPath(assetPath, basePath))
45 return Path.GetFileName(path);
55 public ModelEntry(
string path,
bool lora =
false,
string label =
null,
string url =
null)
58 this.label = label ==
null ? Path.GetFileName(filename) : label;
62 includeInBuild =
true;
65 embeddingOnly =
false;
73 contextLength = reader.
GetIntField($
"{arch}.context_length");
74 embeddingLength = reader.
GetIntField($
"{arch}.embedding_length");
76 embeddingOnly = embeddingOnlyArchs.Contains(arch);
89 entry.path = entry.filename;
96 public class LLMManagerStore
98 public bool downloadOnStart;
99 public List<ModelEntry> modelEntries;
100 public int debugMode;
101 public bool fullLlamaLib;
105 [DefaultExecutionOrder(-2)]
112 public static bool downloadOnStart =
false;
113 public static List<ModelEntry> modelEntries =
new List<ModelEntry>();
114 static List<LLM> llms =
new List<LLM>();
116 public static float downloadProgress = 1;
117 public static List<Callback<float>> downloadProgressCallbacks =
new List<Callback<float>>();
118 static Task<bool> SetupTask;
119 static readonly
object lockObject =
new object();
120 static long totalSize;
121 static long currFileSize;
122 static long completedSize;
130 downloadProgress = (completedSize + progress * currFileSize) / totalSize;
131 foreach (Callback<float> downloadProgressCallback
in downloadProgressCallbacks) downloadProgressCallback?.Invoke(downloadProgress);
142 if (SetupTask ==
null) SetupTask =
SetupOnce();
156 List<StringPair> downloads =
new List<StringPair>();
157 foreach (
ModelEntry modelEntry
in modelEntries)
159 string target =
LLMUnitySetup.GetAssetPath(modelEntry.filename);
160 if (File.Exists(target))
continue;
162 if (!downloadOnStart ||
string.IsNullOrEmpty(modelEntry.url))
165 if (!File.Exists(target))
LLMUnitySetup.LogError($
"Model {modelEntry.filename} could not be found!");
169 target =
LLMUnitySetup.GetDownloadAssetPath(modelEntry.filename);
170 downloads.Add(
new StringPair {source = modelEntry.url, target = target});
173 if (downloads.Count == 0)
return true;
177 downloadProgress = 0;
182 Dictionary<string, long> fileSizes =
new Dictionary<string, long>();
183 foreach (StringPair pair
in downloads)
185 long size = client.GetURLFileSize(pair.source);
186 fileSizes[pair.source] = size;
190 foreach (StringPair pair
in downloads)
192 currFileSize = fileSizes[pair.source];
194 await
LLMUnitySetup.AndroidExtractFile(Path.GetFileName(pair.target));
195 completedSize += currFileSize;
198 completedSize = totalSize;
203 LLMUnitySetup.LogError($
"Error downloading the models: {ex.Message}");
214 public static void SetTemplate(
string filename,
string chatTemplate)
226 if (entry ==
null)
return;
227 entry.chatTemplate = chatTemplate;
228 foreach (
LLM llm
in llms)
230 if (llm !=
null && llm.
model == entry.filename) llm.
SetTemplate(chatTemplate);
244 string filename = Path.GetFileName(path);
248 if (entry.filename == filename || entry.path == fullPath)
return entry;
261 if (entry ==
null)
return "";
274 public static int Num(
bool lora)
279 if (entry.lora == lora) num++;
327 downloadOnStart = store.downloadOnStart;
328 modelEntries = store.modelEntries;
329 LLMUnitySetup.DebugMode = (
LLMUnitySetup.DebugModeType)store.debugMode;
330 LLMUnitySetup.FullLlamaLib = store.fullLlamaLib;
334 static string LLMManagerPref =
"LLMManager";
336 [HideInInspector]
public static float modelProgress = 1;
337 [HideInInspector]
public static float loraProgress = 1;
339 [InitializeOnLoadMethod]
340 static void InitializeOnLoad()
352 int indexToInsert = modelEntries.Count;
355 if (modelEntries.Count > 0 && modelEntries[0].lora) indexToInsert = 0;
358 for (
int i = modelEntries.Count - 1; i >= 0; i--)
360 if (!modelEntries[i].lora)
362 indexToInsert = i + 1;
368 modelEntries.Insert(indexToInsert, entry);
370 return entry.filename;
381 public static string AddEntry(
string path,
bool lora =
false,
string label =
null,
string url =
null)
394 public static async Task<string>
Download(
string url,
bool lora =
false,
bool log =
false,
string label =
null)
398 if (entry.url == url)
400 if (log)
LLMUnitySetup.Log($
"Found existing entry for {url}");
401 return entry.filename;
405 string modelName = Path.GetFileName(url).Split(
"?")[0];
407 if (entryPath !=
null)
409 if (log)
LLMUnitySetup.Log($
"Found existing entry for {modelName}");
410 return entryPath.filename;
414 float preModelProgress = modelProgress;
415 float preLoraProgress = loraProgress;
431 modelProgress = preModelProgress;
432 loraProgress = preLoraProgress;
433 LLMUnitySetup.LogError($
"Error downloading the model from URL '{url}': " + ex.Message);
436 return AddEntry(modelPath, lora, label, url);
447 public static string Load(
string path,
bool lora =
false,
bool log =
false,
string label =
null)
452 if (log)
LLMUnitySetup.Log($
"Found existing entry for {entry.filename}");
453 return entry.filename;
465 public static async Task<string>
DownloadModel(
string url,
bool log =
false,
string label =
null)
467 return await
Download(url,
false, log, label);
477 public static async Task<string>
DownloadLora(
string url,
bool log =
false,
string label =
null)
479 return await
Download(url,
true, log, label);
489 public static string LoadModel(
string path,
bool log =
false,
string label =
null)
491 return Load(path,
false, log, label);
501 public static string LoadLora(
string path,
bool log =
false,
string label =
null)
503 return Load(path,
true, log, label);
511 public static void SetURL(
string filename,
string url)
523 if (entry ==
null)
return;
545 if (entry ==
null)
return;
546 entry.includeInBuild = includeInBuild;
556 downloadOnStart = value;
562 if (entry.url ==
null || entry.url ==
"") warn =
true;
564 if (warn)
LLMUnitySetup.LogWarning(
"Some models do not have a URL and will be copied in the build. To resolve this fill in the URL field in the expanded view of the LLM Model list.");
573 public static void Remove(
string filename)
584 if (entry ==
null)
return;
585 modelEntries.Remove(entry);
587 foreach (
LLM llm
in llms)
589 if (!entry.lora && llm.
model == entry.filename) llm.model =
"";
590 else if (entry.lora) llm.
RemoveLora(entry.filename);
600 modelProgress = progress;
609 loraProgress = progress;
617 string json = JsonUtility.ToJson(
new LLMManagerStore
619 modelEntries = modelEntries,
620 downloadOnStart = downloadOnStart,
622 PlayerPrefs.SetString(LLMManagerPref, json);
631 string pref = PlayerPrefs.GetString(LLMManagerPref);
632 if (pref ==
null || pref ==
"")
return;
633 LLMManagerStore store = JsonUtility.FromJson<LLMManagerStore>(pref);
634 downloadOnStart = store.downloadOnStart;
635 modelEntries = store.modelEntries;
643 List<ModelEntry> modelEntriesBuild =
new List<ModelEntry>();
644 foreach (
ModelEntry modelEntry
in modelEntries)
646 if (!modelEntry.includeInBuild)
continue;
649 string json = JsonUtility.ToJson(
new LLMManagerStore
651 modelEntries = modelEntriesBuild,
652 downloadOnStart = downloadOnStart,
663 public static void Build(ActionCallback copyCallback)
667 foreach (
ModelEntry modelEntry
in modelEntries)
669 string target =
LLMUnitySetup.GetAssetPath(modelEntry.filename);
670 if (!modelEntry.includeInBuild || File.Exists(target))
continue;
671 if (!downloadOnStart ||
string.IsNullOrEmpty(modelEntry.url)) copyCallback(modelEntry.path, target);
Class implementing the skeleton of a chat template.
static string FromGGUF(string path)
Determines the chat template name from a GGUF file. It reads the GGUF file and then determines the ch...
Class implementing the GGUF reader.
int GetIntField(string key)
Retrieves an integer GGUF field.
string GetStringField(string key)
Retrieves a string GGUF field.
Class implementing the LLM model manager.
static void SetTemplate(ModelEntry entry, string chatTemplate)
Sets the chat template for a model and distributes it to all LLMs using it.
static void SaveToDisk()
Saves the model manager to disk for the build.
static void SetIncludeInBuild(ModelEntry entry, bool includeInBuild)
Sets whether to include a model in the build.
static void SetLoraProgress(float progress)
Sets the LORA download progress.
static void Unregister(LLM llm)
Removes a LLM from the model manager.
static async Task< string > Download(string url, bool lora=false, bool log=false, string label=null)
Downloads a model and adds a model entry to the model manager.
static string GetAssetPath(string filename)
Gets the asset path based on whether the application runs locally in the editor or in a build.
static int NumModels()
Returns the number of LLM models.
static ModelEntry Get(string path)
Gets the model entry for a model path.
static Task< bool > Setup()
Setup of the models.
static int Num(bool lora)
Returns the number of LLM/LORA models.
static void Register(LLM llm)
Registers a LLM to the model manager.
static void SetURL(string filename, string url)
Sets the URL for a model.
static void SetModelProgress(float progress)
Sets the LLM download progress.
static void Build(ActionCallback copyCallback)
Saves the model manager to disk along with models that are not (or can't) be downloaded for the build...
static void Save()
Serialises and saves the model manager.
static string AddEntry(string path, bool lora=false, string label=null, string url=null)
Creates and adds a model entry to the model manager.
static void Load()
Deserialises and loads the model manager.
static void SetDownloadOnStart(bool value)
Sets whether to download files on start.
static void SetIncludeInBuild(string filename, bool includeInBuild)
Sets whether to include a model in the build.
static int NumLoras()
Returns the number of LORA models.
static async Task< string > DownloadModel(string url, bool log=false, string label=null)
Downloads an LLM model from a URL and adds a model entry to the model manager.
static string LoadModel(string path, bool log=false, string label=null)
Loads a LLM model from disk and adds a model entry to the model manager.
static void SetTemplate(string filename, string chatTemplate)
Sets the chat template for a model and distributes it to all LLMs using it.
static void Remove(string filename)
Removes a model from the model manager.
static void LoadFromDisk()
Loads the model manager from a file.
static void SetDownloadProgress(float progress)
Sets the model download progress in all registered callbacks.
static string Load(string path, bool lora=false, bool log=false, string label=null)
Loads a model from disk and adds a model entry to the model manager.
static string AddEntry(ModelEntry entry)
Adds a model entry to the model manager.
static async Task< bool > SetupOnce()
Task performing the setup of the models.
static async Task< string > DownloadLora(string url, bool log=false, string label=null)
Downloads a LORA model from a URL and adds a model entry to the model manager.
static void Remove(ModelEntry entry)
Removes a model from the model manager.
static string LoadLora(string path, bool log=false, string label=null)
Loads a LORA model from disk and adds a model entry to the model manager.
static void SetURL(ModelEntry entry, string url)
Sets the URL for a model.
Class implementing helper functions for setup and process management.
static string LLMManagerPath
Path of file with build information for runtime.
static string modelDownloadPath
Model download path.
Class implementing the LLM server.
void RemoveLora(string path)
Removes a LORA model from the LLM. Supported models are in .gguf format.
string model
LLM model to use (.gguf format)
void SetTemplate(string templateName, bool setDirty=true)
Set the chat template for the LLM.
Class implementing a LLM model entry.
ModelEntry(string path, bool lora=false, string label=null, string url=null)
Constructs a LLM model entry.
static string GetFilenameOrRelativeAssetPath(string path)
Returns the relative asset path if it is in the AssetPath folder (StreamingAssets or persistentPath),...
ModelEntry OnlyRequiredFields()
Returns only the required fields for bundling the model in the build.
Class implementing a resumable Web client.