SillyTavern/src/transformers.mjs

import path from 'node:path';
import fs from 'node:fs';
import process from 'node:process';
import { Buffer } from 'node:buffer';

import { pipeline, env, RawImage } from 'sillytavern-transformers';
import { getConfigValue } from './util.js';

// Apply the ONNX WASM backend settings as soon as this module is evaluated.
configureTransformers();

/**
 * Applies the ONNX WASM backend settings on the shared transformers.js `env` object.
 */
function configureTransformers() {
    const wasmSettings = env.backends.onnx.wasm;

    // A single thread avoids issues on Android
    wasmSettings.numThreads = 1;

    // Point at the local "dist" folder so the WASM files are not fetched from a CDN
    const localWasmDir = path.join(process.cwd(), 'dist');
    wasmSettings.wasmPaths = `${localWasmDir}${path.sep}`;
}

/**
 * Registry of the supported transformers.js tasks, keyed by task name.
 *
 * Each entry holds:
 * - defaultModel: model used when neither the caller nor the config names one
 * - pipeline: cached pipeline instance for the task, null until one is created
 * - currentModel: model the cached pipeline was created with, null until then
 * - configField: config key that may override the default model
 * - quantized: value passed to the pipeline factory as its `quantized` option
 */
const tasks = {
    'text-classification': {
        defaultModel: 'Cohee/distilbert-base-uncased-go-emotions-onnx',
        pipeline: null,
        currentModel: null,
        configField: 'extras.classificationModel',
        quantized: true,
    },
    'image-to-text': {
        defaultModel: 'Xenova/vit-gpt2-image-captioning',
        pipeline: null,
        currentModel: null,
        configField: 'extras.captioningModel',
        quantized: true,
    },
    'feature-extraction': {
        defaultModel: 'Xenova/all-mpnet-base-v2',
        pipeline: null,
        currentModel: null,
        configField: 'extras.embeddingModel',
        quantized: true,
    },
    'automatic-speech-recognition': {
        defaultModel: 'Xenova/whisper-small',
        pipeline: null,
        currentModel: null,
        configField: 'extras.speechToTextModel',
        quantized: true,
    },
    'text-to-speech': {
        defaultModel: 'Xenova/speecht5_tts',
        pipeline: null,
        currentModel: null,
        configField: 'extras.textToSpeechModel',
        quantized: false,
    },
};

/**
 * Gets a RawImage object from a base64-encoded image.
 * Decoding is best-effort: a failure is logged as a warning and reported to
 * the caller as `null` instead of being thrown.
 * @param {string} image Base64-encoded image
 * @returns {Promise<RawImage|null>} Object representing the image, or null if it could not be created
 */
export async function getRawImage(image) {
    try {
        // A Buffer is already a Uint8Array, so it can be handed to Blob without an extra copy
        const imageBytes = Buffer.from(image, 'base64');
        const blob = new Blob([imageBytes]);

        return await RawImage.fromBlob(blob);
    } catch (error) {
        // Keep the null contract for callers, but do not hide the reason for the failure
        console.warn('Failed to create a RawImage from the provided image data.', error);
        return null;
    }
}

/**
 * Gets the model to use for a given transformers.js task.
 * A model set under the task's config field takes precedence; the task's
 * default model is used when that value is empty or the config cannot be read.
 * @param {string} task The task to get the model for
 * @returns {string} The model to use for the given task
 */
function getModelForTask(task) {
    const { defaultModel, configField } = tasks[task];

    try {
        // `||` rather than `??`: an empty config value also falls back to the default
        return getConfigValue(configField, null) || defaultModel;
    } catch (error) {
        console.warn(`Failed to read config.yaml, using default model for task ${task}.`, error);
        return defaultModel;
    }
}

/**
 * Moves model cache entries from the "cache" folder in the working directory
 * into the "_cache" folder under the data root.
 * The destination folder is created when missing. An entry that cannot be
 * moved is skipped with a warning.
 * @returns {Promise<void>}
 */
async function migrateCacheToDataDir() {
    const legacyDir = path.join(process.cwd(), 'cache');
    const targetDir = path.join(global.DATA_ROOT, '_cache');

    if (!fs.existsSync(targetDir)) {
        fs.mkdirSync(targetDir, { recursive: true });
    }

    const hasLegacyDir = fs.existsSync(legacyDir) && fs.statSync(legacyDir).isDirectory();
    if (!hasLegacyDir) {
        return;
    }

    const entries = fs.readdirSync(legacyDir);
    if (entries.length === 0) {
        return;
    }

    console.log('Migrating model cache files to data directory. Please wait...');

    entries.forEach((entryName) => {
        try {
            const source = path.join(legacyDir, entryName);
            const destination = path.join(targetDir, entryName);
            // Copy first and delete afterwards, so the source is only removed once the copy succeeded
            fs.cpSync(source, destination, { recursive: true, force: true });
            fs.rmSync(source, { recursive: true, force: true });
        } catch (error) {
            console.warn('Failed to migrate cache file. The model will be re-downloaded.', error);
        }
    });
}

/**
 * Gets the transformers.js pipeline for a given task.
 * Pipelines are cached per task. The cached pipeline is returned unless a
 * different model is explicitly requested; in that case the cached pipeline
 * is disposed and a new one is created for the requested model.
 * @param {import('sillytavern-transformers').PipelineType} task The task to get the pipeline for
 * @param {string} [forceModel=''] The model to use for the pipeline, if any
 * @returns {Promise<import('sillytavern-transformers').Pipeline>} The transformers.js pipeline
 */
export async function getPipeline(task, forceModel = '') {
    await migrateCacheToDataDir();

    const entry = tasks[task];

    if (entry.pipeline) {
        if (forceModel === '' || entry.currentModel === forceModel) {
            return entry.pipeline;
        }
        console.log('Disposing transformers.js pipeline for task', task, 'with model', entry.currentModel);
        // Clear the cache before disposing: if disposal or the load below fails,
        // later calls must not be handed a pipeline that was already disposed.
        const stalePipeline = entry.pipeline;
        entry.pipeline = null;
        entry.currentModel = null;
        await stalePipeline.dispose();
    }

    const cacheDir = path.join(global.DATA_ROOT, '_cache');
    const model = forceModel || getModelForTask(task);
    const localOnly = getConfigValue('extras.disableAutoDownload', false);
    console.log('Initializing transformers.js pipeline for task', task, 'with model', model);
    const instance = await pipeline(task, model, {
        cache_dir: cacheDir,
        quantized: entry.quantized ?? true,
        local_files_only: localOnly,
    });
    entry.pipeline = instance;
    entry.currentModel = model;
    // @ts-ignore
    return instance;
}

// Default export bundling the module's public functions in one object
const transformersApi = { getRawImage, getPipeline };

export default transformersApi;
Node: Migrate to ES Modules 2024-10-10 21:37:22 +02:00			`import path from 'node:path';`
			`import fs from 'node:fs';`
Explicitly import node process 2024-10-11 09:43:29 +02:00			`import process from 'node:process';`
Explicitly import Buffer. Specify jsdoc local extensions 2024-10-10 22:36:22 +02:00			`import { Buffer } from 'node:buffer';`
Node: Migrate to ES Modules 2024-10-10 21:37:22 +02:00
[chore] Fix type errors 2024-10-11 20:33:36 +02:00			`import { pipeline, env, RawImage } from 'sillytavern-transformers';`
Add alternative local vectors source. x5 speed boost!! 2023-09-14 22:40:13 +02:00			`import { getConfigValue } from './util.js';`
Refactor transformers.js usage 2023-09-14 22:12:33 +02:00
			`configureTransformers();`

			`function configureTransformers() {`
			`// Limit the number of threads to 1 to avoid issues on Android`
Revert WASM worker threading 2024-07-17 17:02:27 +02:00			`env.backends.onnx.wasm.numThreads = 1;`
Refactor transformers.js usage 2023-09-14 22:12:33 +02:00			`// Use WASM from a local folder to avoid CDN connections`
			`env.backends.onnx.wasm.wasmPaths = path.join(process.cwd(), 'dist') + path.sep;`
			`}`

			`const tasks = {`
			`'text-classification': {`
			`defaultModel: 'Cohee/distilbert-base-uncased-go-emotions-onnx',`
			`pipeline: null,`
			`configField: 'extras.classificationModel',`
Add endpoint for transformers.js TTS 2024-02-02 00:51:02 +01:00			`quantized: true,`
Refactor transformers.js usage 2023-09-14 22:12:33 +02:00			`},`
			`'image-to-text': {`
			`defaultModel: 'Xenova/vit-gpt2-image-captioning',`
			`pipeline: null,`
			`configField: 'extras.captioningModel',`
Add endpoint for transformers.js TTS 2024-02-02 00:51:02 +01:00			`quantized: true,`
Refactor transformers.js usage 2023-09-14 22:12:33 +02:00			`},`
			`'feature-extraction': {`
			`defaultModel: 'Xenova/all-mpnet-base-v2',`
			`pipeline: null,`
			`configField: 'extras.embeddingModel',`
Add endpoint for transformers.js TTS 2024-02-02 00:51:02 +01:00			`quantized: true,`
Refactor transformers.js usage 2023-09-14 22:12:33 +02:00			`},`
Add backend for transformers.js whisper 2024-02-01 23:36:40 +01:00			`'automatic-speech-recognition': {`
			`defaultModel: 'Xenova/whisper-small',`
			`pipeline: null,`
			`configField: 'extras.speechToTextModel',`
Add endpoint for transformers.js TTS 2024-02-02 00:51:02 +01:00			`quantized: true,`
			`},`
			`'text-to-speech': {`
			`defaultModel: 'Xenova/speecht5_tts',`
			`pipeline: null,`
			`configField: 'extras.textToSpeechModel',`
			`quantized: false,`
Add backend for transformers.js whisper 2024-02-01 23:36:40 +01:00			`},`
Move transformers.js model cache under the data root 2024-08-16 13:59:41 +02:00			`};`
Refactor transformers.js usage 2023-09-14 22:12:33 +02:00
Add SD prompt expansion 2023-10-20 14:03:26 +02:00			`/**`
			`* Gets a RawImage object from a base64-encoded image.`
			`* @param {string} image Base64-encoded image`
			`* @returns {Promise<RawImage\|null>} Object representing the image`
			`*/`
Node: Migrate to ES Modules 2024-10-10 21:37:22 +02:00			`export async function getRawImage(image) {`
Fix server crash on local captioning 2023-09-22 22:04:26 +02:00			`try {`
			`const buffer = Buffer.from(image, 'base64');`
			`const byteArray = new Uint8Array(buffer);`
			`const blob = new Blob([byteArray]);`
Refactor transformers.js usage 2023-09-14 22:12:33 +02:00
Fix server crash on local captioning 2023-09-22 22:04:26 +02:00			`const rawImage = await RawImage.fromBlob(blob);`
			`return rawImage;`
			`} catch {`
			`return null;`
			`}`
Refactor transformers.js usage 2023-09-14 22:12:33 +02:00			`}`

Add SD prompt expansion 2023-10-20 14:03:26 +02:00			`/**`
			`* Gets the model to use for a given transformers.js task.`
			`* @param {string} task The task to get the model for`
			`* @returns {string} The model to use for the given task`
			`*/`
Refactor transformers.js usage 2023-09-14 22:12:33 +02:00			`function getModelForTask(task) {`
			`const defaultModel = tasks[task].defaultModel;`

			`try {`
Add alternative local vectors source. x5 speed boost!! 2023-09-14 22:40:13 +02:00			`const model = getConfigValue(tasks[task].configField, null);`
Refactor transformers.js usage 2023-09-14 22:12:33 +02:00			`return model \|\| defaultModel;`
			`} catch (error) {`
Migrate to config.yaml 2023-11-25 22:45:33 +01:00			`console.warn('Failed to read config.yaml, using default classification model.');`
Refactor transformers.js usage 2023-09-14 22:12:33 +02:00			`return defaultModel;`
			`}`
			`}`

Move transformers.js model cache under the data root 2024-08-16 13:59:41 +02:00			`async function migrateCacheToDataDir() {`
			`const oldCacheDir = path.join(process.cwd(), 'cache');`
			`const newCacheDir = path.join(global.DATA_ROOT, '_cache');`

			`if (!fs.existsSync(newCacheDir)) {`
			`fs.mkdirSync(newCacheDir, { recursive: true });`
			`}`

			`if (fs.existsSync(oldCacheDir) && fs.statSync(oldCacheDir).isDirectory()) {`
			`const files = fs.readdirSync(oldCacheDir);`

			`if (files.length === 0) {`
			`return;`
			`}`

			`console.log('Migrating model cache files to data directory. Please wait...');`

			`for (const file of files) {`
			`try {`
			`const oldPath = path.join(oldCacheDir, file);`
			`const newPath = path.join(newCacheDir, file);`
			`fs.cpSync(oldPath, newPath, { recursive: true, force: true });`
			`fs.rmSync(oldPath, { recursive: true, force: true });`
			`} catch (error) {`
			`console.warn('Failed to migrate cache file. The model will be re-downloaded.', error);`
			`}`
			`}`
			`}`
			`}`

Add SD prompt expansion 2023-10-20 14:03:26 +02:00			`/**`
			`* Gets the transformers.js pipeline for a given task.`
Add backend for transformers.js whisper 2024-02-01 23:36:40 +01:00			`* @param {import('sillytavern-transformers').PipelineType} task The task to get the pipeline for`
			`* @param {string} forceModel The model to use for the pipeline, if any`
[chore] Fix type errors 2024-10-11 20:33:36 +02:00			`* @returns {Promise<import('sillytavern-transformers').Pipeline>} The transformers.js pipeline`
Add SD prompt expansion 2023-10-20 14:03:26 +02:00			`*/`
Node: Migrate to ES Modules 2024-10-10 21:37:22 +02:00			`export async function getPipeline(task, forceModel = '') {`
Move transformers.js model cache under the data root 2024-08-16 13:59:41 +02:00			`await migrateCacheToDataDir();`

Refactor transformers.js usage 2023-09-14 22:12:33 +02:00			`if (tasks[task].pipeline) {`
fix transformers model changes 2024-07-08 20:09:42 +02:00			`if (forceModel === '' \|\| tasks[task].currentModel === forceModel) {`
			`return tasks[task].pipeline;`
			`}`
			`console.log('Disposing transformers.js pipeline for for task', task, 'with model', tasks[task].currentModel);`
			`await tasks[task].pipeline.dispose();`
Refactor transformers.js usage 2023-09-14 22:12:33 +02:00			`}`

Move transformers.js model cache under the data root 2024-08-16 13:59:41 +02:00			`const cacheDir = path.join(global.DATA_ROOT, '_cache');`
Add backend for transformers.js whisper 2024-02-01 23:36:40 +01:00			`const model = forceModel \|\| getModelForTask(task);`
Add alternative local vectors source. x5 speed boost!! 2023-09-14 22:40:13 +02:00			`const localOnly = getConfigValue('extras.disableAutoDownload', false);`
Refactor transformers.js usage 2023-09-14 22:12:33 +02:00			`console.log('Initializing transformers.js pipeline for task', task, 'with model', model);`
Move transformers.js model cache under the data root 2024-08-16 13:59:41 +02:00			`const instance = await pipeline(task, model, { cache_dir: cacheDir, quantized: tasks[task].quantized ?? true, local_files_only: localOnly });`
Refactor transformers.js usage 2023-09-14 22:12:33 +02:00			`tasks[task].pipeline = instance;`
fix transformers model changes 2024-07-08 20:09:42 +02:00			`tasks[task].currentModel = model;`
[chore] Fix type errors 2024-10-11 20:33:36 +02:00			`// @ts-ignore`
Refactor transformers.js usage 2023-09-14 22:12:33 +02:00			`return instance;`
			`}`

			`export default {`
			`getRawImage,`
Node: Migrate to ES Modules 2024-10-10 21:37:22 +02:00			`getPipeline,`
Allow WASM threading for non-Android. Fix eslint for transformers.mjs 2024-07-17 14:48:59 +02:00			`};`