/*
 * Mirror of https://github.com/SillyTavern/SillyTavern.git
 * Synced 2025-02-10 17:10:45 +01:00
 * 217 lines, 7.3 KiB, JavaScript
 */
const { readSecret, SECRET_KEYS } = require("./secrets");
|
|
const fetch = require('node-fetch').default;
|
|
const FormData = require('form-data');
|
|
const fs = require('fs');
|
|
|
|
/**
 * Registers the OpenAI endpoints.
 *
 * All routes are POST handlers that proxy the request to an upstream API using
 * a key obtained via `readSecret`:
 * - `/api/openai/caption-image`    - multimodal chat completion (OpenAI or OpenRouter)
 * - `/api/openai/transcribe-audio` - audio transcription of an uploaded file
 * - `/api/openai/generate-voice`   - text-to-speech, responds with MP3 bytes
 * - `/api/openai/generate-image`   - image generation, request body is forwarded as-is
 *
 * Each handler answers 401 when no key is available, relays the upstream error
 * text with status 500 when the upstream call is not OK, and answers
 * 500 "Internal server error" on unexpected exceptions.
 *
 * @param {import("express").Express} app Express app
 * @param {any} jsonParser JSON parser
 * @param {any} urlencodedParser Form data parser
 */
function registerEndpoints(app, jsonParser, urlencodedParser) {
    app.post('/api/openai/caption-image', jsonParser, async (request, response) => {
        try {
            let key = '';

            if (request.body.api === 'openai') {
                key = readSecret(SECRET_KEYS.OPENAI);
            }

            if (request.body.api === 'openrouter') {
                key = readSecret(SECRET_KEYS.OPENROUTER);
            }

            // Also covers an unknown `api` value: the key stays empty.
            if (!key) {
                console.log('No key found for API', request.body.api);
                return response.sendStatus(401);
            }

            const body = {
                model: request.body.model,
                messages: [
                    {
                        role: "user",
                        content: [
                            { type: "text", text: request.body.prompt },
                            { type: "image_url", image_url: { "url": request.body.image } }
                        ]
                    }
                ],
                max_tokens: 500
            };

            console.log('Multimodal captioning request', body);

            let apiUrl = '';
            let headers = {};

            if (request.body.api === 'openrouter') {
                apiUrl = 'https://openrouter.ai/api/v1/chat/completions';

                // Forward the referer only when the client sent one; an undefined
                // value would otherwise be stringified to the literal "undefined".
                if (request.headers.referer) {
                    headers['HTTP-Referer'] = request.headers.referer;
                }
            }

            if (request.body.api === 'openai') {
                apiUrl = 'https://api.openai.com/v1/chat/completions';
            }

            const result = await fetch(apiUrl, {
                method: 'POST',
                headers: {
                    'Content-Type': 'application/json',
                    Authorization: `Bearer ${key}`,
                    ...headers,
                },
                body: JSON.stringify(body),
                timeout: 0,
            });

            if (!result.ok) {
                const text = await result.text();
                console.log('Multimodal captioning request failed', result.statusText, text);
                return response.status(500).send(text);
            }

            const data = await result.json();
            console.log('Multimodal captioning response', data);

            // `choices` may be missing or empty in the upstream payload; guard the
            // index access so that case reports "No caption found" instead of throwing.
            const caption = data?.choices?.[0]?.message?.content;

            if (!caption) {
                return response.status(500).send('No caption found');
            }

            return response.json({ caption });
        }
        catch (error) {
            console.error(error);
            response.status(500).send('Internal server error');
        }
    });

    app.post('/api/openai/transcribe-audio', urlencodedParser, async (request, response) => {
        try {
            const key = readSecret(SECRET_KEYS.OPENAI);

            if (!key) {
                console.log('No OpenAI key found');
                return response.sendStatus(401);
            }

            // NOTE(review): `request.file` is presumably populated by an upload
            // middleware registered elsewhere - confirm against the app setup.
            if (!request.file) {
                console.log('No audio file found');
                return response.sendStatus(400);
            }

            const formData = new FormData();
            console.log('Processing audio file', request.file.path);
            formData.append('file', fs.createReadStream(request.file.path), { filename: 'audio.wav', contentType: 'audio/wav' });
            formData.append('model', request.body.model);

            if (request.body.language) {
                formData.append('language', request.body.language);
            }

            const result = await fetch('https://api.openai.com/v1/audio/transcriptions', {
                method: 'POST',
                headers: {
                    'Authorization': `Bearer ${key}`,
                    ...formData.getHeaders(),
                },
                body: formData,
            });

            if (!result.ok) {
                const text = await result.text();
                console.log('OpenAI request failed', result.statusText, text);
                return response.status(500).send(text);
            }

            const data = await result.json();
            console.log('OpenAI transcription response', data);
            return response.json(data);
        } catch (error) {
            console.error('OpenAI transcription failed', error);
            response.status(500).send('Internal server error');
        } finally {
            // Remove the uploaded file on every exit path (success, upstream error,
            // missing key, exception) so failed requests do not leak files on disk.
            const uploadedPath = request.file?.path;

            if (uploadedPath) {
                try {
                    fs.rmSync(uploadedPath, { force: true });
                } catch (cleanupError) {
                    // Cleanup is best-effort: the response has already been decided.
                    console.error('Failed to remove uploaded audio file', uploadedPath, cleanupError);
                }
            }
        }
    });

    app.post('/api/openai/generate-voice', jsonParser, async (request, response) => {
        try {
            const key = readSecret(SECRET_KEYS.OPENAI);

            if (!key) {
                console.log('No OpenAI key found');
                return response.sendStatus(401);
            }

            const result = await fetch('https://api.openai.com/v1/audio/speech', {
                method: 'POST',
                headers: {
                    'Content-Type': 'application/json',
                    Authorization: `Bearer ${key}`,
                },
                body: JSON.stringify({
                    input: request.body.text,
                    response_format: 'mp3',
                    voice: request.body.voice ?? 'alloy',
                    speed: request.body.speed ?? 1,
                    model: request.body.model ?? 'tts-1',
                }),
            });

            if (!result.ok) {
                const text = await result.text();
                console.log('OpenAI request failed', result.statusText, text);
                return response.status(500).send(text);
            }

            // The upstream body is binary audio; pass it through as a Buffer.
            const buffer = await result.arrayBuffer();
            response.setHeader('Content-Type', 'audio/mpeg');
            return response.send(Buffer.from(buffer));
        } catch (error) {
            console.error('OpenAI TTS generation failed', error);
            response.status(500).send('Internal server error');
        }
    });

    app.post('/api/openai/generate-image', jsonParser, async (request, response) => {
        try {
            const key = readSecret(SECRET_KEYS.OPENAI);

            if (!key) {
                console.log('No OpenAI key found');
                return response.sendStatus(401);
            }

            console.log('OpenAI request', request.body);

            // The client-supplied body is forwarded to the upstream API unchanged.
            const result = await fetch('https://api.openai.com/v1/images/generations', {
                method: 'POST',
                headers: {
                    'Content-Type': 'application/json',
                    Authorization: `Bearer ${key}`,
                },
                body: JSON.stringify(request.body),
                timeout: 0,
            });

            if (!result.ok) {
                const text = await result.text();
                console.log('OpenAI request failed', result.statusText, text);
                return response.status(500).send(text);
            }

            const data = await result.json();
            return response.json(data);
        } catch (error) {
            console.error(error);
            response.status(500).send('Internal server error');
        }
    });
}
|
|
|
|
// Public surface of this module: only the endpoint registration function is exported.
module.exports = { registerEndpoints };
|