import fetch from 'node-fetch';

import { setAdditionalHeadersByType } from '../additional-headers.js';
import { TEXTGEN_TYPES } from '../constants.js';
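
/**
 * Fetches embeddings for a batch of texts from a vLLM server's
 * OpenAI-compatible /v1/embeddings endpoint.
 * Parameter notes below are inferred from how the values are used in this module.
 * @param {string[]} texts - Texts to embed
 * @param {string} apiUrl - Base URL of the vLLM server
 * @param {string} model - Name of the embedding model to use
 * @param {object} directories - Per-user directories object forwarded to setAdditionalHeadersByType
 * @returns {Promise<number[][]>} One embedding vector per input text, in input order
 */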
export async function getVllmBatchVector(texts, apiUrl, model, directories) {
    const url = new URL(apiUrl);
    url.pathname = '/v1/embeddings';

    const headers = {};
    setAdditionalHeadersByType(headers, TEXTGEN_TYPES.VLLM, apiUrl, directories);

    const response = await fetch(url, {
        method: 'POST',
        headers: {
            'Content-Type': 'application/json',
            ...headers,
        },
        body: JSON.stringify({ input: texts, model }),
    });

    if (!response.ok) {
        const responseText = await response.text();
        throw new Error(`VLLM: Failed to get vector for text: ${response.statusText} ${responseText}`);
    }

    const data = await response.json();

    if (!Array.isArray(data?.data)) {
        throw new Error('API response was not an array');
    }

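    // Sort by index so the returned vectors line up with the order of the input texts.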
    data.data.sort((a, b) => a.index - b.index);

    const vectors = data.data.map(x => x.embedding);
    return vectors;
}
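
/**
 * Fetches the embedding for a single text by delegating to getVllmBatchVector.
 * @param {string} text - Text to embed
 * @param {string} apiUrl - Base URL of the vLLM server
 * @param {string} model - Name of the embedding model to use
 * @param {object} directories - Per-user directories object forwarded to setAdditionalHeadersByType
 * @returns {Promise<number[]>} The embedding vector for the text
 * @example
 * // Illustrative only: the URL and model name are placeholders for your own deployment.
 * const vector = await getVllmVector('hello world', 'http://localhost:8000', 'my-embedding-model', directories);
 */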
export async function getVllmVector(text, apiUrl, model, directories) {
    const vectors = await getVllmBatchVector([text], apiUrl, model, directories);
    return vectors[0];
}