From 83c74e12f8c5da6d6fb206ba882aad3a2eb3a359 Mon Sep 17 00:00:00 2001 From: Concedo <39025047+LostRuins@users.noreply.github.com> Date: Fri, 15 Sep 2023 17:00:40 +0800 Subject: [PATCH 01/18] Updated Kobold Lite to v63. You may want to wait a day or two to confirm its stable before merging --- static/klite.html | 940 +++++++++++++++++++++++++++++++++------------- 1 file changed, 675 insertions(+), 265 deletions(-) diff --git a/static/klite.html b/static/klite.html index cf30ee07..cf97eca7 100644 --- a/static/klite.html +++ b/static/klite.html @@ -3,7 +3,7 @@ +
[The remaining hunks of this static/klite.html diff lost their HTML markup during text extraction; only orphaned "+"/"-" markers and on-screen strings survive, so the actual markup changes are not reconstructible here. Surviving settings-panel labels include: Quick Presets, Temperature, Auto-Adjust Limits, Repetition Penalty (with its "going over 1.2 breaks 6B models" tooltip), the Format selector (Story / Adventure / Chat / Instruct), Idle Responses, Autoscroll, Trim Sentences, "Unban Tokens (KAI)" → "Unban EOS Tokens", "Persist Session" → "Persist Autosave Session", "Export Settings" → "JSON Exports Settings", Show Rename Save File, Autoscroll Text, Inverted Colors, Min Height (px), Horizontally-centered text, and Margin (px).]
@@ -9776,7 +10186,7 @@ if ('serviceWorker' in navigator) { //for local mode, we do not load any PWA service worker. //this will prevent PWA functionality locally but will avoid the scary 404 errors - if(localmode) + if(localflag) { console.log("Try to register service worker..."); try { From fd87ebdb66751adf87df0b9e593f72e11c776930 Mon Sep 17 00:00:00 2001 From: Henk Date: Sat, 16 Sep 2023 06:25:12 +0200 Subject: [PATCH 02/18] Horde length passtrough --- koboldai_settings.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/koboldai_settings.py b/koboldai_settings.py index b7408b93..9d2f5f4d 100644 --- a/koboldai_settings.py +++ b/koboldai_settings.py @@ -1378,6 +1378,8 @@ class system_settings(settings): bridge_data.horde_url = self._koboldai_var.horde_url bridge_data.api_key = self._koboldai_var.horde_api_key bridge_data.scribe_name = self._koboldai_var.horde_worker_name + bridge_data.max_length = self._koboldai_var.genamt + bridge_data.max_context_length = self._koboldai_var.max_length bridge_data.disable_terminal_ui = self._koboldai_var.host if bridge_data.worker_name == "My Awesome Instance": bridge_data.worker_name = f"KoboldAI UI Instance #{random.randint(-100000000, 100000000)}" From d36049f56fabb3c981755cf753affe64a488b8b7 Mon Sep 17 00:00:00 2001 From: Henk Date: Sat, 16 Sep 2023 06:30:35 +0200 Subject: [PATCH 03/18] Newer Horde Worker --- AI-Horde-Worker | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/AI-Horde-Worker b/AI-Horde-Worker index 755696b9..594bed95 160000 --- a/AI-Horde-Worker +++ b/AI-Horde-Worker @@ -1 +1 @@ -Subproject commit 755696b9d4464e4167bfea5fd426686420015038 +Subproject commit 594bed958a2e3fadcabf999a023dfe36fb0ad7dd From 613b02e6f818dc4252884f8125c7197c28e3689b Mon Sep 17 00:00:00 2001 From: Henk Date: Sat, 16 Sep 2023 15:56:44 +0200 Subject: [PATCH 04/18] Worker main branch --- AI-Horde-Worker | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/AI-Horde-Worker b/AI-Horde-Worker index 594bed95..3e357f4d 160000 --- a/AI-Horde-Worker +++ b/AI-Horde-Worker @@ -1 +1 @@ -Subproject commit 594bed958a2e3fadcabf999a023dfe36fb0ad7dd +Subproject commit 3e357f4d8b284a637564024802c22fc3b19a5ffc From 806fc4b8ad561bca0691ce6b7235dd9e83cc12d2 Mon Sep 17 00:00:00 2001 From: Disty0 Date: Tue, 19 Sep 2023 17:09:51 +0300 Subject: [PATCH 05/18] GPTQ support for IPEX --- environments/ipex.yml | 19 +++++++++++--- modeling/ipex/attention.py | 54 +++++++++++++++++++++++++++----------- 2 files changed, 54 insertions(+), 19 deletions(-) diff --git a/environments/ipex.yml b/environments/ipex.yml index de2e3de8..73b6025d 100644 --- a/environments/ipex.yml +++ b/environments/ipex.yml @@ -24,18 +24,22 @@ dependencies: - psutil - pip: - -f https://developer.intel.com/ipex-whl-stable-xpu - - torch==2.0.1a0 - - intel_extension_for_pytorch==2.0.110+xpu + - torch==2.0.1a0; sys_platform == 'linux' + - torch==2.0.0a0; sys_platform == 'win32' + - intel_extension_for_pytorch==2.0.110+xpu; sys_platform == 'linux' + - intel_extension_for_pytorch==2.0.110+gitba7f6c1; sys_platform == 'win32' + - intel-extension-for-transformers - flask-cloudflared==0.0.10 - flask-ngrok - flask-cors - lupa==1.10 - transformers[sentencepiece]==4.33.1 - huggingface_hub==0.16.4 - - optimum[onnxruntime]==1.12.0 + - optimum[openvino,nncf,neural-compressor]==1.12.0 - safetensors==0.3.3 - - accelerate==0.20.3 + - accelerate==0.21.0 - git+https://github.com/VE-FORBRYDERNE/mkultra + - flask-session - ansi2html - flask_compress - ijson @@ -43,7 +47,14 @@ dependencies: - pydub - diffusers - 
git+https://github.com/0cc4m/hf_bleeding_edge/ + - https://github.com/0cc4m/GPTQ-for-LLaMa/releases/download/0.0.6/gptq_koboldai-0.0.6-cp38-cp38-linux_x86_64.whl; sys_platform == 'linux' + - https://github.com/0cc4m/GPTQ-for-LLaMa/releases/download/0.0.6/gptq_koboldai-0.0.6-cp38-cp38-win_amd64.whl; sys_platform == 'win32' + - https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.1/auto_gptq-0.4.1+cu118-cp38-cp38-linux_x86_64.whl; sys_platform == 'linux' + - https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.1/auto_gptq-0.4.1+cu118-cp38-cp38-win_amd64.whl; sys_platform == 'win32' - einops - peft==0.3.0 + - scipy + - https://github.com/0cc4m/exllama/releases/download/0.0.7/exllama-0.0.7-cp38-cp38-linux_x86_64.whl; sys_platform == 'linux' + - https://github.com/0cc4m/exllama/releases/download/0.0.7/exllama-0.0.7-cp38-cp38-win_amd64.whl; sys_platform == 'win32' - windows-curses; sys_platform == 'win32' - pynvml \ No newline at end of file diff --git a/modeling/ipex/attention.py b/modeling/ipex/attention.py index d7335bfa..e38689f2 100644 --- a/modeling/ipex/attention.py +++ b/modeling/ipex/attention.py @@ -64,8 +64,14 @@ def torch_bmm(input, mat2, *, out=None): original_scaled_dot_product_attention = torch.nn.functional.scaled_dot_product_attention def scaled_dot_product_attention(query, key, value, attn_mask=None, dropout_p=0.0, is_causal=False): #ARC GPUs can't allocate more than 4GB to a single block, Slice it: - shape_one, batch_size_attention, query_tokens, shape_four = query.shape - block_multiply = 2.4 if query.dtype == torch.float32 else 1.2 + if len(query.shape) == 3: + batch_size_attention, query_tokens, shape_four = query.shape + shape_one = 1 + no_shape_one = True + else: + shape_one, batch_size_attention, query_tokens, shape_four = query.shape + no_shape_one = False + block_multiply = 3.6 if query.dtype == torch.float32 else 1.8 block_size = (shape_one * batch_size_attention * query_tokens * shape_four) / 1024 * block_multiply #MB split_slice_size = batch_size_attention if block_size >= 4000: @@ -101,21 +107,39 @@ def scaled_dot_product_attention(query, key, value, attn_mask=None, dropout_p=0. 
for i2 in range(query_tokens // split_2_slice_size): # pylint: disable=invalid-name start_idx_2 = i2 * split_2_slice_size end_idx_2 = (i2 + 1) * split_2_slice_size - hidden_states[:, start_idx:end_idx, start_idx_2:end_idx_2] = original_scaled_dot_product_attention( - query[:, start_idx:end_idx, start_idx_2:end_idx_2], - key[:, start_idx:end_idx, start_idx_2:end_idx_2], - value[:, start_idx:end_idx, start_idx_2:end_idx_2], - attn_mask=attn_mask[:, start_idx:end_idx, start_idx_2:end_idx_2] if attn_mask is not None else attn_mask, + if no_shape_one: + hidden_states[start_idx:end_idx, start_idx_2:end_idx_2] = original_scaled_dot_product_attention( + query[start_idx:end_idx, start_idx_2:end_idx_2], + key[start_idx:end_idx, start_idx_2:end_idx_2], + value[start_idx:end_idx, start_idx_2:end_idx_2], + attn_mask=attn_mask[start_idx:end_idx, start_idx_2:end_idx_2] if attn_mask is not None else attn_mask, + dropout_p=dropout_p, is_causal=is_causal + ) + else: + hidden_states[:, start_idx:end_idx, start_idx_2:end_idx_2] = original_scaled_dot_product_attention( + query[:, start_idx:end_idx, start_idx_2:end_idx_2], + key[:, start_idx:end_idx, start_idx_2:end_idx_2], + value[:, start_idx:end_idx, start_idx_2:end_idx_2], + attn_mask=attn_mask[:, start_idx:end_idx, start_idx_2:end_idx_2] if attn_mask is not None else attn_mask, + dropout_p=dropout_p, is_causal=is_causal + ) + else: + if no_shape_one: + hidden_states[start_idx:end_idx] = original_scaled_dot_product_attention( + query[start_idx:end_idx], + key[start_idx:end_idx], + value[start_idx:end_idx], + attn_mask=attn_mask[start_idx:end_idx] if attn_mask is not None else attn_mask, + dropout_p=dropout_p, is_causal=is_causal + ) + else: + hidden_states[:, start_idx:end_idx] = original_scaled_dot_product_attention( + query[:, start_idx:end_idx], + key[:, start_idx:end_idx], + value[:, start_idx:end_idx], + attn_mask=attn_mask[:, start_idx:end_idx] if attn_mask is not None else attn_mask, dropout_p=dropout_p, is_causal=is_causal ) - else: - hidden_states[:, start_idx:end_idx] = original_scaled_dot_product_attention( - query[:, start_idx:end_idx], - key[:, start_idx:end_idx], - value[:, start_idx:end_idx], - attn_mask=attn_mask[:, start_idx:end_idx] if attn_mask is not None else attn_mask, - dropout_p=dropout_p, is_causal=is_causal - ) else: return original_scaled_dot_product_attention( query, key, value, attn_mask=attn_mask, dropout_p=dropout_p, is_causal=is_causal From 55251c6b8ee69d4d5d18276543df591f92d3e8a9 Mon Sep 17 00:00:00 2001 From: Concedo <39025047+LostRuins@users.noreply.github.com> Date: Wed, 20 Sep 2023 20:30:30 +0800 Subject: [PATCH 06/18] updated kobold lite to v66 --- static/klite.html | 354 +++++++++++++++++++++++++++++++++++----------- 1 file changed, 272 insertions(+), 82 deletions(-) diff --git a/static/klite.html b/static/klite.html index cf97eca7..b30aeac4 100644 --- a/static/klite.html +++ b/static/klite.html @@ -3,7 +3,7 @@ +
From d8877b642de81284bcd7725e06547c66591f7ff4 Mon Sep 17 00:00:00 2001 From: Nick Perez Date: Sat, 23 Sep 2023 00:53:48 -0400 Subject: [PATCH 07/18] [gptq_hf_torch] Fix typo in model type check `model_tseype` -> `model_type` --- modeling/inference_models/gptq_hf_torch/class.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/modeling/inference_models/gptq_hf_torch/class.py b/modeling/inference_models/gptq_hf_torch/class.py index 3094dc33..62e89072 100644 --- a/modeling/inference_models/gptq_hf_torch/class.py +++ b/modeling/inference_models/gptq_hf_torch/class.py @@ -362,7 +362,7 @@ class model_backend(HFTorchInferenceModel): model = load_quant_offload_device_map(llama_load_quant, location, gptq_file, gptq_bits, gptq_groupsize, device_map, force_bias=v2_bias) elif model_type == "opt": model = load_quant_offload_device_map(opt_load_quant, location, gptq_file, gptq_bits, gptq_groupsize, device_map, force_bias=v2_bias) - elif model_tseype == "mpt": + elif model_type == "mpt": model = load_quant_offload_device_map(mpt_load_quant, location, gptq_file, gptq_bits, gptq_groupsize, device_map, force_bias=v2_bias) elif model_type == "gpt_bigcode": model = load_quant_offload_device_map(bigcode_load_quant, location, gptq_file, gptq_bits, gptq_groupsize, device_map, force_bias=v2_bias).half() From 90959c3dcf43cd1bd0b98b62e3ae9fa62bcd28f6 Mon Sep 17 00:00:00 2001 From: Concedo <39025047+LostRuins@users.noreply.github.com> Date: Sun, 24 Sep 2023 23:01:35 +0800 Subject: [PATCH 08/18] updated lite to v70 --- static/klite.html | 432 ++++++++++++++++++++++++++++++---------------- 1 file changed, 285 insertions(+), 147 deletions(-) diff --git a/static/klite.html b/static/klite.html index b30aeac4..9a4bca92 100644 --- a/static/klite.html +++ b/static/klite.html @@ -3,7 +3,7 @@
[The remaining static/klite.html hunks of this patch are likewise stripped of their markup by extraction; only UI strings survive. They cover the chat-display settings: You/AI bubble colors, a Rounded Bubbles toggle, Min Height (px), Portrait Style, replacement of the single "Portrait Size" (W/H) fields with separate User Portrait and AI Portrait Size and A/R fields, Show Names (Chat Mode), a "Markdown" option relabeled "Style Text", per-role color pickers for text / "speech" / *action* (default, You, AI, and System), and Code blocks background/foreground colors.]

From 9e51a50bcd6c4e287d4cd27a9c3a8303f8416cf4 Mon Sep 17 00:00:00 2001 From: Henk Date: Thu, 28 Sep 2023 01:08:53 +0200 Subject: [PATCH 09/18] Llama fixes for Mistral --- modeling/inference_models/hf.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/modeling/inference_models/hf.py b/modeling/inference_models/hf.py index 7e291b93..8cb52d69 100644 --- a/modeling/inference_models/hf.py +++ b/modeling/inference_models/hf.py @@ -232,7 +232,7 @@ class HFInferenceModel(InferenceModel): self.model_type = str(self.model_config.model_type) # These are model specific tokenizer overrides if a model has bad defaults - if self.model_type == "llama": + if self.model_type == "llama" or self.model_type == "mistral": # Note: self.tokenizer is a GenericTokenizer, and self.tokenizer.tokenizer is the actual LlamaTokenizer self.tokenizer.add_bos_token = False self.tokenizer.legacy = False From 6fdf83aad5f93559f8c332c7c2521e6058f09883 Mon Sep 17 00:00:00 2001 From: Henk Date: Thu, 28 Sep 2023 01:48:38 +0200 Subject: [PATCH 10/18] Basic Exllama2 --- modeling/inference_models/exllamav2/class.py | 417 +++++++++++++++++++ 1 file changed, 417 insertions(+) create mode 100644 modeling/inference_models/exllamav2/class.py diff --git a/modeling/inference_models/exllamav2/class.py b/modeling/inference_models/exllamav2/class.py new file mode 100644 index 00000000..95795506 --- /dev/null +++ b/modeling/inference_models/exllamav2/class.py @@ -0,0 +1,417 @@ +from __future__ import annotations +try: + import time, json + import torch + import requests + import numpy as np + from typing import List, Optional, Union + import os + import glob + from pathlib import Path + import re + import warnings + import gc + + import utils + from logger import logger + + from modeling import warpers + from modeling.warpers import Warper + from modeling.stoppers import Stoppers + from modeling.post_token_hooks import PostTokenHooks + from modeling.inference_model import ( + GenerationResult, + GenerationSettings, + InferenceModel, + ModelCapabilities, + ) + + from modeling.tokenizer import GenericTokenizer + + + from exllamav2.model import ExLlamaV2, ExLlamaV2Cache, ExLlamaV2Config + from transformers import LlamaTokenizer + from exllamav2.generator import ExLlamaV2StreamingGenerator + load_failed = False +except: + load_failed = True + +model_backend_type = "Exl2" +model_backend_name = "ExLlama V2" + +# When set to true, messages will appear in the console if samplers are not +# changing the scores. Keep in mind some samplers don't always change the +# scores for each token. 
+LOG_SAMPLER_NO_EFFECT = False + +class model_backend(InferenceModel): + def __init__(self) -> None: + super().__init__() + self.model_config = None + + self.model = None + self.tokenizer = None + self.cache = None + self.generator = None + + self.model_name = "" + self.path = None + + self.post_token_hooks = [ + PostTokenHooks.stream_tokens, + ] + + self.stopper_hooks = [ + Stoppers.core_stopper, + Stoppers.dynamic_wi_scanner, + Stoppers.singleline_stopper, + Stoppers.chat_mode_stopper, + Stoppers.stop_sequence_stopper, + ] + + self.capabilties = ModelCapabilities( + embedding_manipulation=False, + post_token_hooks=True, + stopper_hooks=True, + post_token_probs=False, + ) + self.disable = load_failed + + def is_valid(self, model_name, model_path, menu_path): + try: + self.model_config = self._load_config(model_name, model_path) + #TODO check if model is valid + return True + except: + return False + + def get_local_model_path(self): + return self.path or os.path.join("models", self.model_name.replace("/", "_")) + + def _load_config(self, model_name, model_path): + config = ExLlamaV2Config() + if model_path is not None and os.path.exists(model_path): + config.model_dir = model_path + elif os.path.exists("models/{}".format(model_name.replace('/', '_'))): + config.model_dir = "models/{}".format(model_name.replace('/', '_')) + config.prepare() + + return config + + def _load(self, save_model: bool, initial_load: bool) -> None: + self.model = self._get_model(self.get_local_model_path(), {}) + #TODO support GPU split + self.model.load(None) + self.tokenizer = self._get_tokenizer(self.get_local_model_path()) + + self.cache = ExLlamaV2Cache(self.model) + + self.generator = ExLlamaV2StreamingGenerator(self.model, self.cache, self.tokenizer.tokenizer) + + def _post_load(self) -> None: + # Note: self.tokenizer is a GenericTokenizer, and self.tokenizer.tokenizer is the actual LlamaTokenizer + self.tokenizer.add_bos_token = False + + # HF transformers no longer supports decode_with_prefix_space + # We work around this by wrapping decode, encode, and __call__ + # with versions that work around the 'prefix space' misfeature + # of sentencepiece. + vocab = self.tokenizer.convert_ids_to_tokens(range(self.tokenizer.vocab_size)) + has_prefix_space = {i for i, tok in enumerate(vocab) if tok.startswith("▁")} + + # Wrap 'decode' with a method that always returns text starting with a space + # when the head token starts with a space. This is what 'decode_with_prefix_space' + # used to do, and we implement it using the same technique (building a cache of + # tokens that should have a prefix space, and then prepending a space if the first + # token is in this set.) We also work around a bizarre behavior in which decoding + # a single token 13 behaves differently than decoding a squence containing only [13]. + original_decode = type(self.tokenizer.tokenizer).decode + def decode_wrapper(self, token_ids, *args, **kwargs): + first = None + # Note, the code below that wraps single-value token_ids in a list + # is to work around this wonky behavior: + # >>> t.decode(13) + # '<0x0A>' + # >>> t.decode([13]) + # '\n' + # Not doing this causes token streaming to receive <0x0A> characters + # instead of newlines. + if isinstance(token_ids, int): + first = token_ids + token_ids = [first] + elif hasattr(token_ids, 'dim'): # Check for e.g. torch.Tensor + # Tensors don't support the Python standard of 'empty is False' + # and the special case of dimension 0 tensors also needs to be + # handled separately. 
+ if token_ids.dim() == 0: + first = int(token_ids.item()) + token_ids = [first] + elif len(token_ids) > 0: + first = int(token_ids[0]) + elif token_ids is not None and len(token_ids) > 0: + first = token_ids[0] + result = original_decode(self, token_ids, *args, **kwargs) + if first is not None and first in has_prefix_space: + result = " " + result + return result + # GenericTokenizer overrides __setattr__ so we need to use object.__setattr__ to bypass it + object.__setattr__(self.tokenizer, 'decode', decode_wrapper.__get__(self.tokenizer)) + + # Wrap encode and __call__ to work around the 'prefix space' misfeature also. + # The problem is that "Bob" at the start of text is encoded as if it is + # " Bob". This creates a problem because it means you can't split text, encode + # the pieces, concatenate the tokens, decode them, and get the original text back. + # The workaround is to prepend a known token that (1) starts with a space; and + # (2) is not the prefix of any other token. After searching through the vocab + # " ," (space comma) is the only token containing only printable ascii characters + # that fits this bill. By prepending ',' to the text, the original encode + # method always returns [1919, ...], where the tail of the sequence is the + # actual encoded result we want without the prefix space behavior. + original_encode = type(self.tokenizer.tokenizer).encode + def encode_wrapper(self, text, *args, **kwargs): + if type(text) is str: + text = ',' + text + result = original_encode(self, text, *args, **kwargs) + result = result[1:] + else: + result = original_encode(self, text, *args, **kwargs) + return result + object.__setattr__(self.tokenizer, 'encode', encode_wrapper.__get__(self.tokenizer)) + + # Since 'encode' is documented as being deprecated, also override __call__. + # This doesn't appear to currently be used by KoboldAI, but doing so + # in case someone uses it in the future. 
+ original_call = type(self.tokenizer.tokenizer).__call__ + def call_wrapper(self, text, *args, **kwargs): + if type(text) is str: + text = ',' + text + result = original_call(self, text, *args, **kwargs) + result = result[1:] + else: + result = original_call(self, text, *args, **kwargs) + return result + object.__setattr__(self.tokenizer, '__call__', call_wrapper.__get__(self.tokenizer)) + + # Cache the newline token (for single line mode) + # Since there is only one Llama token containing newline, just encode \n + self.newline_tokens = self.tokenizer.encode("\n") + self.bracket_tokens = [i for i, tok in enumerate(vocab) if '[' in tok or ']' in tok] + self.tokenizer._koboldai_header = self.tokenizer.encode("") + + def unload(self): + #self.model_config = None # This breaks more than it fixes - Henk + + self.model = None + self.tokenizer = None + self.cache = None + self.generator = None + + self.model_name = "" + self.path = None + + with torch.no_grad(): + with warnings.catch_warnings(): + warnings.filterwarnings("ignore", message="torch.distributed.reduce_op is deprecated") + for tensor in gc.get_objects(): + try: + if torch.is_tensor(tensor): + tensor.set_(torch.tensor((), device=tensor.device, dtype=tensor.dtype)) + except: + pass + gc.collect() + try: + with torch.no_grad(): + torch.cuda.empty_cache() + except: + pass + + def _apply_warpers( + self, scores: torch.Tensor, input_ids: torch.Tensor + ) -> torch.Tensor: + warpers.update_settings() + + if LOG_SAMPLER_NO_EFFECT: + pre = torch.Tensor(scores) + + for sid in utils.koboldai_vars.sampler_order: + warper = Warper.from_id(sid) + + if not warper.value_is_valid(): + continue + + if warper == warpers.RepetitionPenalty: + # Rep pen needs more data than other samplers + scores = warper.torch(scores, input_ids=input_ids.cuda()) + else: + scores = warper.torch(scores) + + assert scores is not None, f"Scores are None; warper '{warper}' is to blame" + + if LOG_SAMPLER_NO_EFFECT: + if torch.equal(pre, scores): + logger.info(warper, "had no effect on the scores.") + pre = torch.Tensor(scores) + return scores + + def _raw_generate( + self, + prompt_tokens: Union[List[int], torch.Tensor], + max_new: int, + gen_settings: GenerationSettings, + single_line: bool = False, + batch_count: int = 1, + seed: Optional[int] = None, + **kwargs, + ) -> GenerationResult: + if seed: + torch.manual_seed(seed) + + bad_words_ids = [self.tokenizer.bos_token_id] + if utils.koboldai_vars.use_default_badwordsids: + bad_words_ids.append(self.tokenizer.eos_token_id) + bad_words_ids.extend(self.bracket_tokens) + if single_line: + bad_words_ids.extend(self.newline_tokens) + + if not isinstance(prompt_tokens, torch.Tensor): + gen_in = torch.tensor(prompt_tokens, dtype=torch.long)[None] + else: + gen_in = prompt_tokens + + self.generator._gen_begin_reuse(gen_in, None) + + for i in range(max_new): + logits = self.model.forward(self.generator.sequence_ids[:, -1:], self.generator.cache) + for bad_word_id in bad_words_ids: + logits[:, :, bad_word_id] = -10000.0 + + logits = torch.unsqueeze(logits[0, -1, :], 0) + + scores = self._apply_warpers(logits, gen_in) + + scores = torch.softmax(scores, dim=-1) + + # Work around a bug in torch.multinomial (https://github.com/pytorch/pytorch/issues/48841) + # With low probability, multinomial can return an element with zero weight. Since this + # happens infrequently, just sample repeatedly until all tokens have non-zero probability. 
+ for _ in range(100): + token = torch.multinomial(scores, 1) + # Verify that all selected tokens correspond to positive probabilities. + if (scores.gather(1, token) > 0).all(): + break + + if (token == self.tokenizer.eos_token_id).any(): + break + + if self.generator.sequence_ids is None: + self.generator.sequence_ids = token + else: + self.generator.sequence_ids = torch.cat([self.generator.sequence_ids, token.cpu()], dim=1) + + self._post_token_gen(self.generator.sequence_ids) + + utils.koboldai_vars.generated_tkns += 1 + + # Apply stoppers + do_stop = False + for stopper in self.stopper_hooks: + do_stop = stopper(self, self.generator.sequence_ids) + if do_stop: + break + if do_stop: + break + + seq = self.generator.sequence_ids[:, gen_in.size(1):] + + return GenerationResult( + model=self, + out_batches=np.array(seq,), + prompt=prompt_tokens, + is_whole_generation=True, + single_line=single_line, + ) + + def _get_model(self, location: str, tf_kwargs: Dict): + if not self.model_config: + self.model_config = ExLlamaV2Config() + self.model_config.model_dir = location + self.model_config.prepare() + + # self.model_config.gpu_peer_fix = True + return ExLlamaV2(self.model_config) + + def _get_tokenizer(self, location: str): + tokenizer = GenericTokenizer(LlamaTokenizer.from_pretrained(location)) + return tokenizer + + def get_requested_parameters(self, model_name, model_path, menu_path, parameters = {}): + requested_parameters = [] + gpu_count = torch.cuda.device_count() + layer_count = self.model_config["n_layer"] if isinstance(self.model_config, dict) else self.model_config.num_layers if hasattr(self.model_config, "num_layers") else self.model_config.n_layer if hasattr(self.model_config, "n_layer") else self.model_config.num_hidden_layers if hasattr(self.model_config, 'num_hidden_layers') else None + + requested_parameters.append({ + "uitype": "slider", + "unit": "int", + "label": "Maximum Context", + "id": "max_ctx", + "min": 2048, + "max": 16384, + "step": 512, + "default": 2048, + "tooltip": "The maximum context size the model supports", + "menu_path": "Configuration", + "extra_classes": "", + "refresh_model_inputs": False + }) + + requested_parameters.append({ + "uitype": "slider", + "unit": "float", + "label": "Embedding Compression", + "id": "compress_emb", + "min": 1, + "max": 8, + "step": 0.25, + "default": 1, + "tooltip": "If the model requires compressed embeddings, set them here", + "menu_path": "Configuration", + "extra_classes": "", + "refresh_model_inputs": False + }) + + requested_parameters.append({ + "uitype": "slider", + "unit": "float", + "label": "NTK alpha", + "id": "ntk_alpha", + "min": 1, + "max": 32, + "step": 0.25, + "default": 1, + "tooltip": "NTK alpha value", + "menu_path": "Configuration", + "extra_classes": "", + "refresh_model_inputs": False + }) + + return requested_parameters + + def set_input_parameters(self, parameters): + gpu_count = torch.cuda.device_count() + + self.model_config.max_seq_len = parameters["max_ctx"] + self.model_config.compress_pos_emb = parameters["compress_emb"] + self.model_config.alpha_value = parameters["ntk_alpha"] + + # Disable half2 for HIP + self.model_config.rmsnorm_no_half2 = bool(torch.version.hip) + self.model_config.rope_no_half2 = bool(torch.version.hip) + self.model_config.matmul_no_half2 = bool(torch.version.hip) + self.model_config.silu_no_half2 = bool(torch.version.hip) + + # Disable scaled_dot_product_attention if torch version < 2 + if torch.__version__.startswith("1."): + self.model_config.sdp_thd = 0 + + 
self.model_name = parameters['custom_model_name'] if 'custom_model_name' in parameters else parameters['id'] + self.path = parameters['path'] if 'path' in parameters else None \ No newline at end of file From e99789a51b01887e2ed5ac300afc33f9b38de7f2 Mon Sep 17 00:00:00 2001 From: Henk Date: Thu, 28 Sep 2023 03:19:03 +0200 Subject: [PATCH 11/18] Flash Attention (Linux) --- environments/huggingface.yml | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/environments/huggingface.yml b/environments/huggingface.yml index 7f834906..682e8051 100644 --- a/environments/huggingface.yml +++ b/environments/huggingface.yml @@ -1,7 +1,7 @@ name: koboldai channels: - pytorch - - nvidia + - nvidia/label/cuda-11.8.0 - conda-forge - defaults dependencies: @@ -13,6 +13,7 @@ dependencies: - pytorch=2.0.* - python=3.8.* - pytorch-cuda=11.8 + - cuda-nvcc=11.8 - eventlet=0.33.3 - dnspython=2.2.1 - markdown @@ -59,3 +60,4 @@ dependencies: - windows-curses; sys_platform == 'win32' - pynvml - xformers==0.0.21 + - https://github.com/Dao-AILab/flash-attention/releases/download/v2.3.0/flash_attn-2.3.0+cu118torch2.0cxx11abiTRUE-cp38-cp38-linux_x86_64.whl; sys_platform == 'linux' From 04cc322d7cdc066f12287e2faa550b9d54b7cc9a Mon Sep 17 00:00:00 2001 From: Henk Date: Thu, 28 Sep 2023 03:24:01 +0200 Subject: [PATCH 12/18] New dependencies --- requirements.txt | 3 +++ 1 file changed, 3 insertions(+) diff --git a/requirements.txt b/requirements.txt index 65e68b07..c76044ed 100644 --- a/requirements.txt +++ b/requirements.txt @@ -47,3 +47,6 @@ https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.1/auto_gptq-0.4.1+cu https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.1/auto_gptq-0.4.1+cu118-cp38-cp38-win_amd64.whl; sys_platform == 'win32' and python_version == '3.8' windows-curses; sys_platform == 'win32' pynvml +flash_attn==2.3.0 +xformers==0.0.21 +exllamav2==0.0.4 \ No newline at end of file From e238a1c9f6775756e7eec5d4bc0a057364a806ab Mon Sep 17 00:00:00 2001 From: Henk Date: Thu, 28 Sep 2023 09:09:04 +0200 Subject: [PATCH 13/18] Ship exllamav2 --- environments/huggingface.yml | 3 +++ 1 file changed, 3 insertions(+) diff --git a/environments/huggingface.yml b/environments/huggingface.yml index 682e8051..265e813f 100644 --- a/environments/huggingface.yml +++ b/environments/huggingface.yml @@ -14,6 +14,7 @@ dependencies: - python=3.8.* - pytorch-cuda=11.8 - cuda-nvcc=11.8 + - cuda-libraries-dev=11.8 - eventlet=0.33.3 - dnspython=2.2.1 - markdown @@ -57,6 +58,8 @@ dependencies: - scipy - https://github.com/0cc4m/exllama/releases/download/0.0.7/exllama-0.0.7-cp38-cp38-linux_x86_64.whl; sys_platform == 'linux' - https://github.com/0cc4m/exllama/releases/download/0.0.7/exllama-0.0.7-cp38-cp38-win_amd64.whl; sys_platform == 'win32' + - https://github.com/henk717/exllamav2/releases/download/0.4/exllamav2-0.0.4-cp38-cp38-linux_x86_64.whl; sys_platform == 'linux' + - https://github.com/henk717/exllamav2/releases/download/0.4/exllamav2-0.0.4-cp38-cp38-win_amd64.whl; sys_platform == 'win32' - windows-curses; sys_platform == 'win32' - pynvml - xformers==0.0.21 From fa8d9e65ffea258e5723f098023826d7f481f5bb Mon Sep 17 00:00:00 2001 From: Henk Date: Thu, 28 Sep 2023 09:51:09 +0200 Subject: [PATCH 14/18] Fix flash-attn --- environments/huggingface.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/environments/huggingface.yml b/environments/huggingface.yml index 265e813f..3d031194 100644 --- a/environments/huggingface.yml +++ b/environments/huggingface.yml @@ -63,4 +63,4 @@ dependencies: 
- windows-curses; sys_platform == 'win32' - pynvml - xformers==0.0.21 - - https://github.com/Dao-AILab/flash-attention/releases/download/v2.3.0/flash_attn-2.3.0+cu118torch2.0cxx11abiTRUE-cp38-cp38-linux_x86_64.whl; sys_platform == 'linux' + - https://github.com/Dao-AILab/flash-attention/releases/download/v2.3.0/flash_attn-2.3.0+cu118torch2.0cxx11abiFALSE-cp38-cp38-linux_x86_64.whl; sys_platform == 'linux' From b141ee015566ad1206e93d995acba9dbc213ad64 Mon Sep 17 00:00:00 2001 From: Henk Date: Thu, 28 Sep 2023 18:01:34 +0200 Subject: [PATCH 15/18] Universal downloader for more backends --- modeling/inference_models/basic_hf/class.py | 7 +++++++ modeling/inference_models/exllama/class.py | 6 ++++++ modeling/inference_models/exllamav2/class.py | 7 ++++++- 3 files changed, 19 insertions(+), 1 deletion(-) diff --git a/modeling/inference_models/basic_hf/class.py b/modeling/inference_models/basic_hf/class.py index afca13ee..5ae2aa0d 100644 --- a/modeling/inference_models/basic_hf/class.py +++ b/modeling/inference_models/basic_hf/class.py @@ -148,6 +148,13 @@ class model_backend(InferenceModel): self.get_local_model_path(ignore_existance=True), ) + if not self.get_local_model_path(): + print(self.get_local_model_path()) + from huggingface_hub import snapshot_download + target_dir = "models/" + self.model_name.replace("/", "_") + print(self.model_name) + snapshot_download(self.model_name, local_dir=target_dir, local_dir_use_symlinks=False, cache_dir="cache/", revision=utils.koboldai_vars.revision) + self.init_model_config() self.model = AutoModelForCausalLM.from_pretrained( diff --git a/modeling/inference_models/exllama/class.py b/modeling/inference_models/exllama/class.py index 4539b7a3..f688d611 100644 --- a/modeling/inference_models/exllama/class.py +++ b/modeling/inference_models/exllama/class.py @@ -128,6 +128,12 @@ class model_backend(InferenceModel): return config def _load(self, save_model: bool, initial_load: bool) -> None: + if not self.get_local_model_path(): + from huggingface_hub import snapshot_download + target_dir = "models/" + self.model_name.replace("/", "_") + print(self.model_name) + snapshot_download(self.model_name, local_dir=target_dir, local_dir_use_symlinks=False, cache_dir="cache/", revision=utils.koboldai_vars.revision) + self.model = self._get_model(self.get_local_model_path(), {}) self.tokenizer = self._get_tokenizer(self.get_local_model_path()) diff --git a/modeling/inference_models/exllamav2/class.py b/modeling/inference_models/exllamav2/class.py index 95795506..15b91c8d 100644 --- a/modeling/inference_models/exllamav2/class.py +++ b/modeling/inference_models/exllamav2/class.py @@ -36,7 +36,7 @@ try: except: load_failed = True -model_backend_type = "Exl2" +model_backend_type = "GPTQ" model_backend_name = "ExLlama V2" # When set to true, messages will appear in the console if samplers are not @@ -99,6 +99,11 @@ class model_backend(InferenceModel): return config def _load(self, save_model: bool, initial_load: bool) -> None: + if not self.get_local_model_path(): + from huggingface_hub import snapshot_download + target_dir = "models/" + self.model_name.replace("/", "_") + print(self.model_name) + snapshot_download(self.model_name, local_dir=target_dir, local_dir_use_symlinks=False, cache_dir="cache/", revision=utils.koboldai_vars.revision) self.model = self._get_model(self.get_local_model_path(), {}) #TODO support GPU split self.model.load(None) From 02d3b00ff120d7dc8b1bd61e2e3e629c78c69184 Mon Sep 17 00:00:00 2001 From: Henk Date: Wed, 4 Oct 2023 00:18:21 +0200 Subject: 
[PATCH 16/18] HF 4.34 --- environments/huggingface.yml | 8 ++++---- environments/ipex.yml | 6 +++--- environments/rocm.yml | 7 ++++--- 3 files changed, 11 insertions(+), 10 deletions(-) diff --git a/environments/huggingface.yml b/environments/huggingface.yml index 3d031194..8bba67be 100644 --- a/environments/huggingface.yml +++ b/environments/huggingface.yml @@ -33,9 +33,9 @@ dependencies: - flask-ngrok - flask-cors - lupa==1.10 - - transformers[sentencepiece]==4.33.1 + - transformers[sentencepiece]==4.34.0 - huggingface_hub==0.16.4 - - optimum[onnxruntime]==1.12.0 + - optimum[onnxruntime]==1.13.2 - safetensors==0.3.3 - accelerate==0.21.0 - git+https://github.com/VE-FORBRYDERNE/mkultra @@ -51,8 +51,8 @@ dependencies: - git+https://github.com/0cc4m/hf_bleeding_edge/ - https://github.com/0cc4m/GPTQ-for-LLaMa/releases/download/0.0.6/gptq_koboldai-0.0.6-cp38-cp38-linux_x86_64.whl; sys_platform == 'linux' - https://github.com/0cc4m/GPTQ-for-LLaMa/releases/download/0.0.6/gptq_koboldai-0.0.6-cp38-cp38-win_amd64.whl; sys_platform == 'win32' - - https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.1/auto_gptq-0.4.1+cu118-cp38-cp38-linux_x86_64.whl; sys_platform == 'linux' - - https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.1/auto_gptq-0.4.1+cu118-cp38-cp38-win_amd64.whl; sys_platform == 'win32' + - https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.2/auto_gptq-0.4.2+cu118-cp38-cp38-linux_x86_64.whl; sys_platform == 'linux' + - https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.2/auto_gptq-0.4.2+cu118-cp38-cp38-win_amd64.whl; sys_platform == 'win32' - einops - peft==0.3.0 - scipy diff --git a/environments/ipex.yml b/environments/ipex.yml index 73b6025d..2dd0bb3e 100644 --- a/environments/ipex.yml +++ b/environments/ipex.yml @@ -33,7 +33,7 @@ dependencies: - flask-ngrok - flask-cors - lupa==1.10 - - transformers[sentencepiece]==4.33.1 + - transformers[sentencepiece]==4.34.0 - huggingface_hub==0.16.4 - optimum[openvino,nncf,neural-compressor]==1.12.0 - safetensors==0.3.3 @@ -49,8 +49,8 @@ dependencies: - git+https://github.com/0cc4m/hf_bleeding_edge/ - https://github.com/0cc4m/GPTQ-for-LLaMa/releases/download/0.0.6/gptq_koboldai-0.0.6-cp38-cp38-linux_x86_64.whl; sys_platform == 'linux' - https://github.com/0cc4m/GPTQ-for-LLaMa/releases/download/0.0.6/gptq_koboldai-0.0.6-cp38-cp38-win_amd64.whl; sys_platform == 'win32' - - https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.1/auto_gptq-0.4.1+cu118-cp38-cp38-linux_x86_64.whl; sys_platform == 'linux' - - https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.1/auto_gptq-0.4.1+cu118-cp38-cp38-win_amd64.whl; sys_platform == 'win32' + - https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.2/auto_gptq-0.4.2+cu118-cp38-cp38-linux_x86_64.whl; sys_platform == 'linux' + - https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.2/auto_gptq-0.4.2+cu118-cp38-cp38-win_amd64.whl; sys_platform == 'win32' - einops - peft==0.3.0 - scipy diff --git a/environments/rocm.yml b/environments/rocm.yml index 5b56bef7..814a682f 100644 --- a/environments/rocm.yml +++ b/environments/rocm.yml @@ -29,9 +29,9 @@ dependencies: - flask-ngrok - flask-cors - lupa==1.10 - - transformers[sentencepiece]==4.33.1 + - transformers[sentencepiece]==4.34.0 - huggingface_hub==0.16.4 - - optimum[onnxruntime]==1.12.0 + - optimum[onnxruntime]==1.13.2 - safetensors==0.3.3 - accelerate==0.21.0 - git+https://github.com/VE-FORBRYDERNE/mkultra @@ -45,4 +45,5 @@ dependencies: - einops - peft==0.3.0 - windows-curses; sys_platform == 'win32' - - 
pynvml \ No newline at end of file + - pynvml + - https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.2/auto_gptq-0.4.2+rocm5.4.2-cp38-cp38-linux_x86_64.whl \ No newline at end of file From caa040b416c3d3467d99de2a055e707e4af36398 Mon Sep 17 00:00:00 2001 From: Henk Date: Wed, 4 Oct 2023 00:21:32 +0200 Subject: [PATCH 17/18] HF 4.34 part 2 --- requirements.txt | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/requirements.txt b/requirements.txt index c76044ed..5a19a292 100644 --- a/requirements.txt +++ b/requirements.txt @@ -1,6 +1,6 @@ -transformers[sentencepiece]==4.33.1 +transformers[sentencepiece]==4.34.0 huggingface_hub==0.16.4 -optimum[onnxruntime]==1.12.0 +optimum[onnxruntime]==1.13.2 safetensors==0.3.3 Flask==2.3.3 Flask-SocketIO==5.3.2 @@ -41,10 +41,10 @@ git+https://github.com/0cc4m/hf_bleeding_edge/ einops peft==0.3.0 scipy -https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.1/auto_gptq-0.4.1+cu118-cp310-cp310-linux_x86_64.whl; sys_platform == 'linux' and python_version == '3.10' -https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.1/auto_gptq-0.4.1+cu118-cp310-cp310-win_amd64.whl; sys_platform == 'win32' and python_version == '3.10' -https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.1/auto_gptq-0.4.1+cu118-cp38-cp38-linux_x86_64.whl; sys_platform == 'linux' and python_version == '3.8' -https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.1/auto_gptq-0.4.1+cu118-cp38-cp38-win_amd64.whl; sys_platform == 'win32' and python_version == '3.8' +https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.2/auto_gptq-0.4.2+cu118-cp310-cp310-linux_x86_64.whl; sys_platform == 'linux' and python_version == '3.10' +https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.2/auto_gptq-0.4.2+cu118-cp310-cp310-win_amd64.whl; sys_platform == 'win32' and python_version == '3.10' +https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.2/auto_gptq-0.4.2+cu118-cp38-cp38-linux_x86_64.whl; sys_platform == 'linux' and python_version == '3.8' +https://github.com/PanQiWei/AutoGPTQ/releases/download/v0.4.2/auto_gptq-0.4.2+cu118-cp38-cp38-win_amd64.whl; sys_platform == 'win32' and python_version == '3.8' windows-curses; sys_platform == 'win32' pynvml flash_attn==2.3.0 From 5a3986fb06266b4a84ac7a35e30782c709da6bab Mon Sep 17 00:00:00 2001 From: Disty0 Date: Wed, 4 Oct 2023 01:32:36 +0300 Subject: [PATCH 18/18] IPEX Optimizations --- environments/ipex.yml | 4 ++-- modeling/ipex/__init__.py | 9 +++++++-- modeling/ipex/attention.py | 33 +++++++++++++++++++-------------- modeling/ipex/diffusers.py | 9 +++++---- 4 files changed, 33 insertions(+), 22 deletions(-) diff --git a/environments/ipex.yml b/environments/ipex.yml index 2dd0bb3e..88c1d140 100644 --- a/environments/ipex.yml +++ b/environments/ipex.yml @@ -23,7 +23,7 @@ dependencies: - Pillow - psutil - pip: - - -f https://developer.intel.com/ipex-whl-stable-xpu + - --extra-index-url https://pytorch-extension.intel.com/release-whl/stable/xpu/us/ - torch==2.0.1a0; sys_platform == 'linux' - torch==2.0.0a0; sys_platform == 'win32' - intel_extension_for_pytorch==2.0.110+xpu; sys_platform == 'linux' @@ -35,7 +35,7 @@ dependencies: - lupa==1.10 - transformers[sentencepiece]==4.34.0 - huggingface_hub==0.16.4 - - optimum[openvino,nncf,neural-compressor]==1.12.0 + - optimum[onnxruntime,openvino,nncf,neural-compressor]==1.13.2 - safetensors==0.3.3 - accelerate==0.21.0 - git+https://github.com/VE-FORBRYDERNE/mkultra diff --git a/modeling/ipex/__init__.py b/modeling/ipex/__init__.py index 
9ec69012..43accd9f 100644 --- a/modeling/ipex/__init__.py +++ b/modeling/ipex/__init__.py @@ -16,7 +16,6 @@ def ipex_init(): # pylint: disable=too-many-statements torch.cuda.device = torch.xpu.device torch.cuda.device_count = torch.xpu.device_count torch.cuda.device_of = torch.xpu.device_of - torch.cuda.getDeviceIdListForCard = torch.xpu.getDeviceIdListForCard torch.cuda.get_device_name = torch.xpu.get_device_name torch.cuda.get_device_properties = torch.xpu.get_device_properties torch.cuda.init = torch.xpu.init @@ -145,7 +144,7 @@ def ipex_init(): # pylint: disable=too-many-statements ipex._C._DeviceProperties.minor = 2 #Fix functions with ipex: - torch.cuda.mem_get_info = lambda device=None: [(torch.xpu.get_device_properties(device).total_memory - torch.xpu.memory_allocated(device)), torch.xpu.get_device_properties(device).total_memory] + torch.cuda.mem_get_info = lambda device=None: [(torch.xpu.get_device_properties(device).total_memory - torch.xpu.memory_reserved(device)), torch.xpu.get_device_properties(device).total_memory] torch._utils._get_available_device_type = lambda: "xpu" torch.has_cuda = True torch.cuda.has_half = True @@ -157,6 +156,12 @@ def ipex_init(): # pylint: disable=too-many-statements torch.cuda.get_device_properties.minor = 7 torch.cuda.ipc_collect = lambda *args, **kwargs: None torch.cuda.utilization = lambda *args, **kwargs: 0 + if hasattr(torch.xpu, 'getDeviceIdListForCard'): + torch.cuda.getDeviceIdListForCard = torch.xpu.getDeviceIdListForCard + torch.cuda.get_device_id_list_per_card = torch.xpu.getDeviceIdListForCard + else: + torch.cuda.getDeviceIdListForCard = torch.xpu.get_device_id_list_per_card + torch.cuda.get_device_id_list_per_card = torch.xpu.get_device_id_list_per_card ipex_hijacks() attention_init() diff --git a/modeling/ipex/attention.py b/modeling/ipex/attention.py index e38689f2..84848b6a 100644 --- a/modeling/ipex/attention.py +++ b/modeling/ipex/attention.py @@ -10,13 +10,15 @@ def torch_bmm(input, mat2, *, out=None): #ARC GPUs can't allocate more than 4GB to a single block, Slice it: batch_size_attention, input_tokens, mat2_shape = input.shape[0], input.shape[1], mat2.shape[2] - block_multiply = 2.4 if input.dtype == torch.float32 else 1.2 - block_size = (batch_size_attention * input_tokens * mat2_shape) / 1024 * block_multiply #MB + block_multiply = input.element_size() + slice_block_size = input_tokens * mat2_shape / 1024 / 1024 * block_multiply + block_size = batch_size_attention * slice_block_size + split_slice_size = batch_size_attention - if block_size >= 4000: + if block_size > 4: do_split = True #Find something divisible with the input_tokens - while ((split_slice_size * input_tokens * mat2_shape) / 1024 * block_multiply) > 4000: + while (split_slice_size * slice_block_size) > 4: split_slice_size = split_slice_size // 2 if split_slice_size <= 1: split_slice_size = 1 @@ -24,12 +26,12 @@ def torch_bmm(input, mat2, *, out=None): else: do_split = False - split_block_size = (split_slice_size * input_tokens * mat2_shape) / 1024 * block_multiply #MB split_2_slice_size = input_tokens - if split_block_size >= 4000: + if split_slice_size * slice_block_size > 4: + slice_block_size2 = split_slice_size * mat2_shape / 1024 / 1024 * block_multiply do_split_2 = True #Find something divisible with the input_tokens - while ((split_slice_size * split_2_slice_size * mat2_shape) / 1024 * block_multiply) > 4000: + while (split_2_slice_size * slice_block_size2) > 4: split_2_slice_size = split_2_slice_size // 2 if split_2_slice_size <= 1: split_2_slice_size = 
1 @@ -71,13 +73,16 @@ def scaled_dot_product_attention(query, key, value, attn_mask=None, dropout_p=0. else: shape_one, batch_size_attention, query_tokens, shape_four = query.shape no_shape_one = False - block_multiply = 3.6 if query.dtype == torch.float32 else 1.8 - block_size = (shape_one * batch_size_attention * query_tokens * shape_four) / 1024 * block_multiply #MB + + block_multiply = query.element_size() + slice_block_size = shape_one * query_tokens * shape_four / 1024 / 1024 * block_multiply + block_size = batch_size_attention * slice_block_size + split_slice_size = batch_size_attention - if block_size >= 4000: + if block_size > 4: do_split = True #Find something divisible with the shape_one - while ((shape_one * split_slice_size * query_tokens * shape_four) / 1024 * block_multiply) > 4000: + while (split_slice_size * slice_block_size) > 4: split_slice_size = split_slice_size // 2 if split_slice_size <= 1: split_slice_size = 1 @@ -85,12 +90,12 @@ def scaled_dot_product_attention(query, key, value, attn_mask=None, dropout_p=0. else: do_split = False - split_block_size = (shape_one * split_slice_size * query_tokens * shape_four) / 1024 * block_multiply #MB split_2_slice_size = query_tokens - if split_block_size >= 4000: + if split_slice_size * slice_block_size > 4: + slice_block_size2 = shape_one * split_slice_size * shape_four / 1024 / 1024 * block_multiply do_split_2 = True #Find something divisible with the batch_size_attention - while ((shape_one * split_slice_size * split_2_slice_size * shape_four) / 1024 * block_multiply) > 4000: + while (split_2_slice_size * slice_block_size2) > 4: split_2_slice_size = split_2_slice_size // 2 if split_2_slice_size <= 1: split_2_slice_size = 1 diff --git a/modeling/ipex/diffusers.py b/modeling/ipex/diffusers.py index 4c39896e..005ee49f 100644 --- a/modeling/ipex/diffusers.py +++ b/modeling/ipex/diffusers.py @@ -55,13 +55,14 @@ class SlicedAttnProcessor: # pylint: disable=too-few-public-methods ) #ARC GPUs can't allocate more than 4GB to a single block, Slice it: - block_multiply = 2.4 if query.dtype == torch.float32 else 1.2 - block_size = (batch_size_attention * query_tokens * shape_three) / 1024 * block_multiply #MB + block_multiply = query.element_size() + slice_block_size = self.slice_size * shape_three / 1024 / 1024 * block_multiply + block_size = query_tokens * slice_block_size split_2_slice_size = query_tokens - if block_size >= 4000: + if block_size > 4: do_split_2 = True #Find something divisible with the query_tokens - while ((self.slice_size * split_2_slice_size * shape_three) / 1024 * block_multiply) > 4000: + while (split_2_slice_size * slice_block_size) > 4: split_2_slice_size = split_2_slice_size // 2 if split_2_slice_size <= 1: split_2_slice_size = 1
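
The IPEX hunks in this last patch repeatedly apply one idea: pick a split size so that no single slice of a batched matmul or attention call exceeds Arc's per-allocation limit, then compute the result piecewise into a preallocated output. Below is a minimal sketch of that strategy, not the module's API: the helper names (pick_split_size, sliced_bmm) are invented, the budget constant simply mirrors the literal `> 4` comparison the hunks make on `element_size * elements / 1024 / 1024`, and the second-level split over the token dimension that the patch adds when a single batch slice is still too large is omitted for brevity.

# Minimal sketch (assumed names, not the patched module's API) of the slicing
# strategy used in modeling/ipex/attention.py above.
import torch

def pick_split_size(batch: int, per_item_cost: float, budget: float = 4.0) -> int:
    # Same shape as the patch's loop: keep halving until one slice fits (minimum 1).
    split = batch
    while split * per_item_cost > budget and split > 1:
        split //= 2
    return max(split, 1)

def sliced_bmm(a: torch.Tensor, b: torch.Tensor, budget: float = 4.0) -> torch.Tensor:
    # a: (B, N, K), b: (B, K, M) -> (B, N, M), computed slice-by-slice over B.
    batch, tokens, _ = a.shape
    out_cols = b.shape[2]
    # Cost of one batch element of the output, in the same units the patch
    # compares against 4 (element_size * elements / 1024 / 1024).
    per_item_cost = tokens * out_cols * a.element_size() / 1024 / 1024
    split = pick_split_size(batch, per_item_cost, budget)
    out = torch.empty((batch, tokens, out_cols), dtype=a.dtype, device=a.device)
    for start in range(0, batch, split):
        out[start:start + split] = torch.bmm(a[start:start + split], b[start:start + split])
    return out

The patch applies this same pattern to torch_bmm, scaled_dot_product_attention, and the diffusers SlicedAttnProcessor, switching from hard-coded dtype multipliers to element_size() so the cost estimate holds for any precision.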