Add koboldcpp as Text Completion source

This commit is contained in:
Cohee 2023-11-19 17:14:53 +02:00
parent 1dc1b926c4
commit 96caddfd71
5 changed files with 45 additions and 11 deletions

View File

@ -1467,10 +1467,10 @@
<div class="flex-container flexFlowColumn"> <div class="flex-container flexFlowColumn">
<div id="main-API-selector-block"> <div id="main-API-selector-block">
<select id="main_api"> <select id="main_api">
<option value="kobold"><span data-i18n="KoboldAI">KoboldAI</span></option> <option value="kobold"><span data-i18n="KoboldAI">KoboldAI Classic</span></option>
<option value="koboldhorde"><span data-i18n="KoboldAI Horde">KoboldAI Horde</span></option> <option value="koboldhorde"><span data-i18n="KoboldAI Horde">KoboldAI Horde</span></option>
<option value="novel"><span data-i18n="NovelAI">NovelAI</span></option> <option value="novel"><span data-i18n="NovelAI">NovelAI</span></option>
<option value="textgenerationwebui"><span data-i18n="Text Completion">Text Completion (ooba, Mancer, Aphrodite)</span></option> <option value="textgenerationwebui"><span data-i18n="Text Completion">Text Completion (ooba, Mancer, Aphrodite, KoboldCpp)</span></option>
<option value="openai"><span data-i18n="Chat Completion (OpenAI, Claude, Window/OpenRouter, Scale, AI21)">Chat Completion (OpenAI, Claude, Window, OpenRouter, Scale, AI21, PaLM)</span></option> <option value="openai"><span data-i18n="Chat Completion (OpenAI, Claude, Window/OpenRouter, Scale, AI21)">Chat Completion (OpenAI, Claude, Window, OpenRouter, Scale, AI21, PaLM)</span></option>
</select> </select>
</div> </div>
@ -1600,6 +1600,7 @@
<option value="mancer">Mancer</option> <option value="mancer">Mancer</option>
<option value="aphrodite">Aphrodite</option> <option value="aphrodite">Aphrodite</option>
<option value="tabby">TabbyAPI</option> <option value="tabby">TabbyAPI</option>
<option value="koboldcpp">KoboldCpp</option>
</select> </select>
</div> </div>
<div data-tg-type="mancer" class="flex-container flexFlowColumn"> <div data-tg-type="mancer" class="flex-container flexFlowColumn">
@ -1681,8 +1682,20 @@
<input id="tabby_api_url_text" class="text_pole wide100p" maxlength="500" value="" autocomplete="off" data-server-history="tabby"> <input id="tabby_api_url_text" class="text_pole wide100p" maxlength="500" value="" autocomplete="off" data-server-history="tabby">
</div> </div>
</div> </div>
<div data-tg-type="koboldcpp">
<div class="flex-container flexFlowColumn">
<a href="https://github.com/LostRuins/koboldcpp" target="_blank">
LostRuins/koboldcpp
</a>
</div>
<div class="flex1">
<h4 data-i18n="API url">API URL</h4>
<small data-i18n="Example: http://127.0.0.1:5001">Example: http://127.0.0.1:5001</small>
<input id="koboldcpp_api_url_text" class="text_pole wide100p" maxlength="500" value="" autocomplete="off" data-server-history="koboldcpp">
</div>
</div>
<div class="flex-container"> <div class="flex-container">
<div id="api_button_textgenerationwebui" class="api_button menu_button" type="submit" data-i18n="Connect" data-server-connect="ooba_blocking,aphrodite,tabby">Connect</div> <div id="api_button_textgenerationwebui" class="api_button menu_button" type="submit" data-i18n="Connect" data-server-connect="ooba_blocking,aphrodite,tabby,koboldcpp">Connect</div>
<div class="api_loading menu_button" data-i18n="Cancel">Cancel</div> <div class="api_loading menu_button" data-i18n="Cancel">Cancel</div>
</div> </div>
<label class="checkbox_label margin-bot-10px" for="legacy_api_textgenerationwebui"> <label class="checkbox_label margin-bot-10px" for="legacy_api_textgenerationwebui">

View File

@ -24,6 +24,7 @@ import {
textgenerationwebui_banned_in_macros, textgenerationwebui_banned_in_macros,
isOoba, isOoba,
MANCER_SERVER, MANCER_SERVER,
isKoboldCpp,
} from "./scripts/textgen-settings.js"; } from "./scripts/textgen-settings.js";
import { import {
@ -886,6 +887,7 @@ async function getStatus() {
use_aphrodite: main_api == "textgenerationwebui" ? isAphrodite() : false, use_aphrodite: main_api == "textgenerationwebui" ? isAphrodite() : false,
use_ooba: main_api == "textgenerationwebui" ? isOoba() : false, use_ooba: main_api == "textgenerationwebui" ? isOoba() : false,
use_tabby: main_api == "textgenerationwebui" ? isTabby() : false, use_tabby: main_api == "textgenerationwebui" ? isTabby() : false,
use_koboldcpp: main_api == "textgenerationwebui" ? isKoboldCpp() : false,
legacy_api: main_api == "textgenerationwebui" ? textgenerationwebui_settings.legacy_api && !isMancer() : false, legacy_api: main_api == "textgenerationwebui" ? textgenerationwebui_settings.legacy_api && !isMancer() : false,
}), }),
signal: abortStatusCheck.signal, signal: abortStatusCheck.signal,
@ -5505,6 +5507,7 @@ async function getSettings() {
$("#textgenerationwebui_api_url_text").val(api_server_textgenerationwebui); $("#textgenerationwebui_api_url_text").val(api_server_textgenerationwebui);
$("#aphrodite_api_url_text").val(api_server_textgenerationwebui); $("#aphrodite_api_url_text").val(api_server_textgenerationwebui);
$("#tabby_api_url_text").val(api_server_textgenerationwebui); $("#tabby_api_url_text").val(api_server_textgenerationwebui);
$('#koboldcpp_api_url_text').val(api_server_textgenerationwebui);
selected_button = settings.selected_button; selected_button = settings.selected_button;

View File

@ -28,7 +28,8 @@ export const textgen_types = {
OOBA: 'ooba', OOBA: 'ooba',
MANCER: 'mancer', MANCER: 'mancer',
APHRODITE: 'aphrodite', APHRODITE: 'aphrodite',
TABBY: 'tabby' TABBY: 'tabby',
KOBOLDCPP: 'koboldcpp',
}; };
// Maybe let it be configurable in the future? // Maybe let it be configurable in the future?
@ -292,6 +293,10 @@ export function isOoba() {
return textgenerationwebui_settings.type === textgen_types.OOBA; return textgenerationwebui_settings.type === textgen_types.OOBA;
} }
export function isKoboldCpp() {
return textgenerationwebui_settings.type === textgen_types.KOBOLDCPP;
}
export function getTextGenUrlSourceId() { export function getTextGenUrlSourceId() {
switch (textgenerationwebui_settings.type) { switch (textgenerationwebui_settings.type) {
case textgen_types.OOBA: case textgen_types.OOBA:
@ -300,6 +305,8 @@ export function getTextGenUrlSourceId() {
return "#aphrodite_api_url_text"; return "#aphrodite_api_url_text";
case textgen_types.TABBY: case textgen_types.TABBY:
return "#tabby_api_url_text"; return "#tabby_api_url_text";
case textgen_types.KOBOLDCPP:
return "#koboldcpp_api_url_text";
} }
} }
@ -559,6 +566,7 @@ export function getTextGenGenerationData(finalPrompt, this_amount_gen, isImperso
'use_mancer': isMancer(), 'use_mancer': isMancer(),
'use_aphrodite': isAphrodite(), 'use_aphrodite': isAphrodite(),
'use_tabby': isTabby(), 'use_tabby': isTabby(),
'use_koboldcpp': isKoboldCpp(),
'use_ooba': isOoba(), 'use_ooba': isOoba(),
'api_server': isMancer() ? MANCER_SERVER : api_server_textgenerationwebui, 'api_server': isMancer() ? MANCER_SERVER : api_server_textgenerationwebui,
'legacy_api': textgenerationwebui_settings.legacy_api && !isMancer(), 'legacy_api': textgenerationwebui_settings.legacy_api && !isMancer(),

View File

@ -4,7 +4,7 @@ import { chat_completion_sources, model_list, oai_settings } from "./openai.js";
import { groups, selected_group } from "./group-chats.js"; import { groups, selected_group } from "./group-chats.js";
import { getStringHash } from "./utils.js"; import { getStringHash } from "./utils.js";
import { kai_flags } from "./kai-settings.js"; import { kai_flags } from "./kai-settings.js";
import { isMancer, isTabby, textgenerationwebui_settings } from "./textgen-settings.js"; import { isKoboldCpp, isMancer, isTabby, textgenerationwebui_settings } from "./textgen-settings.js";
export const CHARACTERS_PER_TOKEN_RATIO = 3.35; export const CHARACTERS_PER_TOKEN_RATIO = 3.35;
const TOKENIZER_WARNING_KEY = 'tokenizationWarningShown'; const TOKENIZER_WARNING_KEY = 'tokenizationWarningShown';
@ -369,7 +369,8 @@ function getRemoteTokenizationParams(str) {
api: main_api, api: main_api,
url: getAPIServerUrl(), url: getAPIServerUrl(),
legacy_api: main_api === 'textgenerationwebui' && textgenerationwebui_settings.legacy_api && !isMancer(), legacy_api: main_api === 'textgenerationwebui' && textgenerationwebui_settings.legacy_api && !isMancer(),
use_tabby: isTabby() use_tabby: main_api === 'textgenerationwebui' && isTabby(),
use_koboldcpp: main_api === 'textgenerationwebui' && isKoboldCpp(),
}; };
} }

View File

@ -539,6 +539,9 @@ app.post("/api/textgenerationwebui/status", jsonParser, async function (request,
else if (request.body.use_tabby) { else if (request.body.use_tabby) {
url += "/v1/model/list" url += "/v1/model/list"
} }
else if (request.body.use_koboldcpp) {
url += "/v1/models";
}
const modelsReply = await fetch(url, args); const modelsReply = await fetch(url, args);
@ -629,7 +632,7 @@ app.post("/api/textgenerationwebui/generate", jsonParser, async function (reques
if (request.body.legacy_api) { if (request.body.legacy_api) {
url += "/v1/generate"; url += "/v1/generate";
} }
else if (request.body.use_aphrodite || request.body.use_ooba || request.body.use_tabby) { else if (request.body.use_aphrodite || request.body.use_ooba || request.body.use_tabby || request.body.use_koboldcpp) {
url += "/v1/completions"; url += "/v1/completions";
} }
else if (request.body.use_mancer) { else if (request.body.use_mancer) {
@ -3445,10 +3448,16 @@ app.post("/tokenize_via_api", jsonParser, async function (request, response) {
if (legacyApi) { if (legacyApi) {
url += '/v1/token-count'; url += '/v1/token-count';
args.body = JSON.stringify({ "prompt": text }); args.body = JSON.stringify({ "prompt": text });
} else if (request.body.use_tabby) { }
else if (request.body.use_tabby) {
url += '/v1/token/encode'; url += '/v1/token/encode';
args.body = JSON.stringify({ "text": text }); args.body = JSON.stringify({ "text": text });
} else { }
else if (request.body.use_koboldcpp) {
url += '/api/extra/tokencount';
args.body = JSON.stringify({ "prompt": text });
}
else {
url += '/v1/internal/encode'; url += '/v1/internal/encode';
args.body = JSON.stringify({ "text": text }); args.body = JSON.stringify({ "text": text });
} }
@ -3461,8 +3470,8 @@ app.post("/tokenize_via_api", jsonParser, async function (request, response) {
} }
const data = await result.json(); const data = await result.json();
const count = legacyApi ? data?.results[0]?.tokens : data?.length; const count = legacyApi ? data?.results[0]?.tokens : (data?.length ?? data?.value);
const ids = legacyApi ? [] : data?.tokens; const ids = legacyApi ? [] : (data?.tokens ?? []);
return response.send({ count, ids }); return response.send({ count, ids });
} }