Spaces:

NeuroSenko
/

rus-edge-tts-webui

Running

App Files Files Community

rus-edge-tts-webui / app.py

NeuroSenko

added info about original repo

7179888 about 2 years ago

raw

history blame contribute delete

4.56 kB

	import gradio as gr
	import edge_tts
	import asyncio
	import os
	# https://speech.platform.bing.com/consumer/speech/synthesize/readaloud/voices/list?trustedclienttoken=6A5AA1D4EAFF4E9FB37E23D68491D6F4 - там голоса брать. думаю поймете. ShortName короче
	SUPPORTED_VOICES = {
	'DmitryNeural-Руский(муж.)': 'ru-RU-DmitryNeural',
	'SvetlanaNeural-Русский(жен.)': 'ru-RU-SvetlanaNeural',
	'OstapNeural-Украинский(муж.)': 'uk-UA-OstapNeural',
	'PolinaNeural-Украинский(жен.)': 'uk-UA-PolinaNeural'
	}

	# Смена голоса
	def changeVoice(voices):
	example = SUPPORTED_VOICES[voices]
	example_file = os.path.join(os.path.dirname(__file__), "example/"+example+".wav")
	return example_file

	# Преобразование текста в речь
	async def textToSpeech(text, voices, rate, volume):
	output_file = "output.mp3"
	voices = SUPPORTED_VOICES[voices]
	if (rate >= 0):
	rates = rate = "+" + str(rate) + "%"
	else:
	rates = str(rate) + "%"
	if (volume >= 0):
	volumes = "+" + str(volume) + "%"
	else:
	volumes = str(volume) + "%"
	communicate = edge_tts.Communicate(text,
	voices,
	rate=rates,
	volume=volumes,
	proxy=None)
	await communicate.save(output_file)
	audio_file = os.path.join(os.path.dirname(__file__), "output.mp3")
	if (os.path.exists(audio_file)):
	return audio_file
	else:
	raise gr.Error("Преобразование не удалось！")
	return FileNotFoundError


	# Сбросить результат конвертации
	def clearSpeech():
	output_file = os.path.join(os.path.dirname(__file__), "output.mp3")
	if (os.path.exists(output_file)):
	os.remove(output_file)
	return None, None


	with gr.Blocks(css="style.css", title="Преобразование текста в речь") as demo:
	gr.Markdown("""
	# Преобразование текста в речь через Microsoft Edge
	""")
	with gr.Row():
	with gr.Column():
	text = gr.TextArea(label="Текст", elem_classes="text-area")
	btn = gr.Button("Сгенерировать", elem_id="submit-btn")
	gr.Markdown(
	"Original repository: https://github.com/hinaichigo-fox/rus-edge-tts-webui"
	)
	with gr.Column():
	voices = gr.Dropdown(choices=[
	"DmitryNeural-Руский(муж.)", "SvetlanaNeural-Русский(жен.)", "OstapNeural-Украинский(муж.)", "PolinaNeural-Украинский(жен.)"
	],
	value="DmitryNeural-Руский(муж.)",
	label="Голос",
	info="Пожалуйста, выберите голос",
	interactive=True)

	example = gr.Audio(label="Пример голоса",
	value="example/ru-RU-DmitryNeural.wav",
	interactive=False,
	elem_classes="example")

	voices.change(fn=changeVoice,inputs=voices,outputs=example)
	rate = gr.Slider(-100,
	100,
	step=1,
	value=0,
	label="Увеличение / уменьшение скорости речи",
	info="Скорость речи быстрее / медленнее",
	interactive=True)

	volume = gr.Slider(-100,
	100,
	step=1,
	value=0,
	label="Увеличение / уменьшение громкости звука",
	info="Увеличить / уменьшить громкость звука",
	interactive=True)
	audio = gr.Audio(label="Результат",
	interactive=False,
	elem_classes="audio")
	btn.click(fn=textToSpeech,
	inputs=[text, voices, rate, volume],
	outputs=[audio])

	if __name__ == "__main__":
	demo.launch()