Spaces:

duzhong
/

intern-creative-platform

Paused

App Files Files Community

intern-creative-platform / public /scripts /extensions /tts /gpt-sovits-v2.js

duzhong's picture

Upload folder using huggingface_hub

84602ce verified 2 months ago

history blame contribute delete

6.34 kB

	import { saveTtsProviderSettings } from './index.js';

	export { GptSovitsV2Provider };

	class GptSovitsV2Provider {
	//########//
	// Config //
	//########//

	settings;
	ready = false;
	voices = [];
	separator = '. ';
	audioElement = document.createElement('audio');

	/**
	* Perform any text processing before passing to TTS engine.
	* @param {string} text Input text
	* @returns {string} Processed text
	*/
	processText(text) {
	return text;
	}

	audioFormats = ['wav', 'ogg', 'silk', 'mp3', 'flac'];

	languageLabels = {
	'Auto': 'auto',
	};

	langKey2LangCode = {
	'zh': 'zh-CN',
	'en': 'en-US',
	'ja': 'ja-JP',
	'ko': 'ko-KR',
	};


	defaultSettings = {
	provider_endpoint: 'http://localhost:9880',
	format: 'wav',
	lang: 'auto',
	streaming: false,
	text_lang: 'zh',
	prompt_lang: 'zh',

	};

	get settingsHtml() {
	let html = `

	<label for="tts_endpoint">Provider Endpoint:</label>
	<input id="tts_endpoint" type="text" class="text_pole" maxlength="250" height="300" value="${this.defaultSettings.provider_endpoint}"/>
	<span>Use <a target="_blank" href="https://github.com/v3ucn/GPT-SoVITS-V2">GPT-SoVITS-V2</a>(Unofficial).</span><br/>
	<label for="text_lang">Text Lang(Inference text language):</label>
	<input id="text_lang" type="text" class="text_pole" maxlength="250" height="300" value="${this.defaultSettings.text_lang}"/>
	<label for="text_lang">Prompt Lang(Reference audio text language):</label>
	<input id="prompt_lang" type="text" class="text_pole" maxlength="250" height="300" value="${this.defaultSettings.prompt_lang}"/>
	<br/>

	`;

	return html;
	}

	onSettingsChange() {
	// Used when provider settings are updated from UI
	this.settings.provider_endpoint = $('#tts_endpoint').val();
	this.settings.text_lang = $('#text_lang').val();
	this.settings.prompt_lang = $('#prompt_lang').val();


	saveTtsProviderSettings();
	this.changeTTSSettings();
	}

	async loadSettings(settings) {
	// Pupulate Provider UI given input settings
	if (Object.keys(settings).length == 0) {
	console.info('Using default TTS Provider settings');
	}

	// Only accept keys defined in defaultSettings
	this.settings = this.defaultSettings;

	for (const key in settings) {
	if (key in this.settings) {
	this.settings[key] = settings[key];
	} else {
	console.debug(`Ignoring non-user-configurable setting: ${key}`);
	}
	}

	// Set initial values from the settings
	$('#tts_endpoint').val(this.settings.provider_endpoint).on('change', this.onSettingsChange.bind(this));
	$('#text_lang').val(this.settings.text_lang).on('change', this.onSettingsChange.bind(this));
	$('#prompt_lang').val(this.settings.prompt_lang).on('change', this.onSettingsChange.bind(this));

	await this.checkReady();

	console.info('ITS: Settings loaded');
	}

	// Perform a simple readiness check by trying to fetch voiceIds
	async checkReady() {
	await Promise.allSettled([this.fetchTtsVoiceObjects(), this.changeTTSSettings()]);
	}

	async onRefreshClick() {
	return await this.checkReady();
	}

	//#################//
	// TTS Interfaces //
	//#################//

	async getVoice(voiceName) {



	if (this.voices.length == 0) {
	this.voices = await this.fetchTtsVoiceObjects();
	}



	const match = this.voices.filter(
	v => v.name == voiceName,
	)[0];
	console.log(match);
	if (!match) {
	throw `TTS Voice name ${voiceName} not found`;
	}
	return match;
	}



	async generateTts(text, voiceId) {
	const response = await this.fetchTtsGeneration(text, voiceId);
	return response;
	}

	//###########//
	// API CALLS //
	//###########//
	async fetchTtsVoiceObjects() {
	const response = await fetch(`${this.settings.provider_endpoint}/speakers`);
	console.info(response);

	if (!response.ok) {
	throw new Error(`HTTP ${response.status}: ${await response.json()}`);
	}
	const responseJson = await response.json();


	this.voices = responseJson;

	return responseJson;
	}

	// Each time a parameter is changed, we change the configuration
	async changeTTSSettings() {
	}

	/**
	* Fetch TTS generation from the API.
	* @param {string} inputText Text to generate TTS for
	* @param {string} voiceId Voice ID to use (model_type&speaker_id))
	* @returns {Promise<Response\|string>} Fetch response
	*/




	async fetchTtsGeneration(inputText, voiceId, lang = null, forceNoStreaming = false) {
	console.info(`Generating new TTS for voice_id ${voiceId}`);

	function replaceSpeaker(text) {
	return text.replace(/\[.*?\]/gu, '');
	}

	let prompt_text = replaceSpeaker(voiceId);

	const params = {
	text: inputText,
	prompt_text: prompt_text,
	ref_audio_path: './参考音频/' + voiceId + '.wav',
	text_lang: this.settings.text_lang,
	prompt_lang: this.settings.prompt_lang,
	text_split_method: 'cut5',
	batch_size: 1,
	media_type: 'ogg',
	streaming_mode: 'true',
	};


	const url = `${this.settings.provider_endpoint}/`;

	const response = await fetch(
	url,
	{
	method: 'POST',
	headers: {
	'Content-Type': 'application/json',
	},
	body: JSON.stringify(params), // Convert parameter objects to JSON strings
	},
	);
	if (!response.ok) {
	toastr.error(response.statusText, 'TTS Generation Failed');
	throw new Error(`HTTP ${response.status}: ${await response.text()}`);
	}
	return response;
	}



	// Interface not used
	async fetchTtsFromHistory(history_item_id) {
	return Promise.resolve(history_item_id);
	}
	}