text-generation-webui/extensions/elevenlabs_tts/script.py

import re
from pathlib import Path

import gradio as gr
from elevenlabslib import ElevenLabsUser
from elevenlabslib.helpers import save_bytes_to_path

import modules.shared as shared

# Extension settings. The UI callbacks registered in ui() overwrite these
# values whenever the user edits the corresponding control.
params = dict(
    activate=True,
    api_key='12345',
    selected_voice='None',
)

# Choices offered by the voice dropdown when it is first built.
initial_voice = ['None']
# Counter used to number the generated audio files.
wav_idx = 0
# Subscription data stored by check_valid_api(); None until it has run.
user_info = None
# ElevenLabs client built from the default key held in params.
user = ElevenLabsUser(params['api_key'])

# Refuse to load unless the --no-stream flag was given.
if not shared.args.no_stream:
    print("Please add --no-stream. This extension is not meant to be used with streaming.")
    raise ValueError

# Check if the API is valid and refresh the UI accordingly.


def check_valid_api():
    """
    Rebuild the ElevenLabs client and report the connection status.

    A new ElevenLabsUser is created from params['api_key'] and the result of
    its _get_subscription_data() call is stored in the module-level
    user_info. Both happen even when the extension is deactivated.

    Returns a Gradio update that sets the status text to 'Connected' when the
    extension is activated and user_info is not None, and to 'Disconnected'
    otherwise.
    """

    global user, user_info

    user = ElevenLabsUser(params['api_key'])
    user_info = user._get_subscription_data()
    print('checking api')

    # A deactivated extension always reports 'Disconnected', without logging
    # whether the key was accepted.
    if not params['activate']:
        return gr.update(value='Disconnected')

    if user_info is None:
        print('Incorrect API Key')
        status = 'Disconnected'
    else:
        print('Got an API Key!')
        status = 'Connected'

    return gr.update(value=status)

# Once the API is verified, get the available voices and update the dropdown list


def refresh_voices():
    """
    Build the voice dropdown choices from the connected account.

    Returns a Gradio dropdown update whose choices are the 'None' placeholder
    followed by the initialName of every voice returned by
    user.get_available_voices(). Returns None when user_info is None, i.e.
    when no subscription data has been stored by check_valid_api().
    """

    if user_info is None:
        return None

    # The placeholder is the string 'None', matching initial_voice and the
    # default params['selected_voice'], so the dropdown's current value is
    # still one of its choices after the refresh.
    your_voices = ['None']
    your_voices.extend(voice.initialName for voice in user.get_available_voices())
    return gr.Dropdown.update(choices=your_voices)


def remove_surrounded_chars(string):
    """
    Return `string` with every asterisk-delimited span removed.

    A span starts at an asterisk and runs to the next asterisk (inclusive),
    or to the end of the string when no closing asterisk follows.
    """
    # this expression matches to 'as few symbols as possible (0 upwards) between any asterisks' OR
    # 'as few symbols as possible (0 upwards) between an asterisk and the end of the string'
    # Raw string: '\*' is not a valid escape sequence in a normal literal.
    return re.sub(r'\*[^\*]*?(\*|$)', '', string)


def input_modifier(string):
    """
    Hook applied to the user's text input before it reaches the model.

    This extension does not alter the input, so `string` is returned
    unchanged.
    """

    return string


def output_modifier(string):
    """
    This function is applied to the model outputs.

    When the extension is activated, subscription data has been stored by
    check_valid_api() and the selected voice exists, the reply is cleaned up,
    sent to that voice, saved under extensions/elevenlabs_tts/outputs/ and
    replaced by an HTML <audio> element pointing at the saved file.
    Otherwise `string` is returned unchanged.
    """

    global wav_idx

    if not params['activate'] or user_info is None:
        return string

    # With the default 'None' selection (or a name the account does not
    # have) there is nothing to index into; keep the text reply instead of
    # failing with IndexError. Assumes an unmatched name yields an empty
    # sequence -- TODO confirm against elevenlabslib.
    matching_voices = user.get_voices_by_name(params['selected_voice'])
    if not matching_voices:
        print(f"No ElevenLabs voice named {params['selected_voice']!r} is available; returning the text reply.")
        return string

    # Drop *asterisk-delimited* spans and quote marks (straight and both
    # curly forms), then flatten the reply onto a single line.
    text = remove_surrounded_chars(string)
    for quote_mark in ('"', '“', '”'):
        text = text.replace(quote_mark, '')
    text = text.replace('\n', ' ').strip()

    if text == '':
        text = 'empty reply, try regenerating'

    # Build the path once and make sure its directory exists before saving.
    output_file = Path(f'extensions/elevenlabs_tts/outputs/{wav_idx:06d}.wav')
    output_file.parent.mkdir(parents=True, exist_ok=True)

    audio_data = matching_voices[0].generate_audio_bytes(text)
    save_bytes_to_path(output_file, audio_data)

    # Only advance the counter once a file has actually been written.
    wav_idx += 1
    return f'<audio src="file/{output_file.as_posix()}" controls></audio>'


def ui():
    """
    Build the extension's Gradio controls and wire up their events.

    Creates the activation checkbox, connection status box, voice dropdown,
    API key box and Connect button, then registers callbacks that copy edits
    into `params` and run the connection check and voice refresh on click.
    """

    def store_in_params(key):
        # Callback factory: the returned function writes the component's new
        # value into params under `key`.
        return lambda x: params.update({key: x})

    # Gradio elements
    with gr.Row():
        activate = gr.Checkbox(value=params['activate'], label='Activate TTS')
        connection_status = gr.Textbox(value='Disconnected', label='Connection Status')
    voice = gr.Dropdown(value=params['selected_voice'], choices=initial_voice, label='TTS Voice')
    with gr.Row():
        api_key = gr.Textbox(placeholder="Enter your API key.", label='API Key')
        connect = gr.Button(value='Connect')

    # Event functions to update the parameters in the backend
    activate.change(store_in_params('activate'), activate, None)
    voice.change(store_in_params('selected_voice'), voice, None)
    api_key.change(store_in_params('api_key'), api_key, None)

    # NOTE(review): refresh_voices reads the user_info that check_valid_api
    # sets; this presumably relies on the two click handlers running in
    # registration order -- confirm.
    connect.click(check_valid_api, [], connection_status)
    connect.click(refresh_voices, [], voice)
Minor changes 2023-03-22 19:55:03 +01:00			`import re`
Rename the folder 2023-03-06 23:38:36 +01:00			`from pathlib import Path`
Move new extension to a separate file 2023-03-06 23:28:53 +01:00
Rename the folder 2023-03-06 23:38:36 +01:00			`import gradio as gr`
Remove unused imports 2023-03-16 14:18:34 +01:00			`from elevenlabslib import ElevenLabsUser`
			`from elevenlabslib.helpers import save_bytes_to_path`
Move new extension to a separate file 2023-03-06 23:28:53 +01:00
Sort imports 2023-04-07 19:42:03 +02:00			`import modules.shared as shared`

Move new extension to a separate file 2023-03-06 23:28:53 +01:00			`params = {`
			`'activate': True,`
			`'api_key': '12345',`
			`'selected_voice': 'None',`
			`}`
Improve readability 2023-03-06 23:46:46 +01:00
Move new extension to a separate file 2023-03-06 23:28:53 +01:00			`initial_voice = ['None']`
			`wav_idx = 0`
			`user = ElevenLabsUser(params['api_key'])`
			`user_info = None`

Exit elevenlabs_tts if streaming is enabled 2023-03-20 15:49:42 +01:00			`if not shared.args.no_stream:`
			`print("Please add --no-stream. This extension is not meant to be used with streaming.")`
			`raise ValueError`
Make the code more like PEP8 for readability (#862) 2023-04-07 05:15:45 +02:00
Improve readability 2023-03-06 23:46:46 +01:00			`# Check if the API is valid and refresh the UI accordingly.`
Make the code more like PEP8 for readability (#862) 2023-04-07 05:15:45 +02:00

Move new extension to a separate file 2023-03-06 23:28:53 +01:00			`def check_valid_api():`
Make the code more like PEP8 for readability (#862) 2023-04-07 05:15:45 +02:00
Move new extension to a separate file 2023-03-06 23:28:53 +01:00			`global user, user_info, params`

			`user = ElevenLabsUser(params['api_key'])`
			`user_info = user._get_subscription_data()`
			`print('checking api')`
Make the code more like PEP8 for readability (#862) 2023-04-07 05:15:45 +02:00			`if not params['activate']:`
Move new extension to a separate file 2023-03-06 23:28:53 +01:00			`return gr.update(value='Disconnected')`
			`elif user_info is None:`
			`print('Incorrect API Key')`
			`return gr.update(value='Disconnected')`
			`else:`
			`print('Got an API Key!')`
			`return gr.update(value='Connected')`
Make the code more like PEP8 for readability (#862) 2023-04-07 05:15:45 +02:00
Improve readability 2023-03-06 23:46:46 +01:00			`# Once the API is verified, get the available voices and update the dropdown list`
Make the code more like PEP8 for readability (#862) 2023-04-07 05:15:45 +02:00

Move new extension to a separate file 2023-03-06 23:28:53 +01:00			`def refresh_voices():`
Make the code more like PEP8 for readability (#862) 2023-04-07 05:15:45 +02:00
Move new extension to a separate file 2023-03-06 23:28:53 +01:00			`global user, user_info`
Make the code more like PEP8 for readability (#862) 2023-04-07 05:15:45 +02:00
Move new extension to a separate file 2023-03-06 23:28:53 +01:00			`your_voices = [None]`
			`if user_info is not None:`
			`for voice in user.get_available_voices():`
			`your_voices.append(voice.initialName)`
Make the code more like PEP8 for readability (#862) 2023-04-07 05:15:45 +02:00			`return gr.Dropdown.update(choices=your_voices)`
Move new extension to a separate file 2023-03-06 23:28:53 +01:00			`else:`
			`return`

Make the code more like PEP8 for readability (#862) 2023-04-07 05:15:45 +02:00
Move new extension to a separate file 2023-03-06 23:28:53 +01:00			`def remove_surrounded_chars(string):`
Extensions performance & memory optimisations Reworked remove_surrounded_chars() to use regular expression ( https://regexr.com/7alb5 ) instead of repeated string concatenations for elevenlab_tts, silero_tts, sd_api_pictures. This should be both faster and more robust in handling asterisks. Reduced the memory footprint of send_pictures and sd_api_pictures by scaling the images in the chat to 300 pixels max-side wise. (The user already has the original in case of the sent picture and there's an option to save the SD generation). This should fix history growing annoyingly large with multiple pictures present 2023-03-22 05:47:54 +01:00			`# this expression matches to 'as few symbols as possible (0 upwards) between any asterisks' OR`
			`# 'as few symbols as possible (0 upwards) between an asterisk and the end of the string'`
Make the code more like PEP8 for readability (#862) 2023-04-07 05:15:45 +02:00			`return re.sub('\*[^\*]*?(\*|$)', '', string)`

Move new extension to a separate file 2023-03-06 23:28:53 +01:00
			`def input_modifier(string):`
			`"""`
			`This function is applied to your text inputs before`
			`they are fed into the model.`
			`"""`

			`return string`

Make the code more like PEP8 for readability (#862) 2023-04-07 05:15:45 +02:00
Move new extension to a separate file 2023-03-06 23:28:53 +01:00			`def output_modifier(string):`
			`"""`
			`This function is applied to the model outputs.`
			`"""`
Improve readability 2023-03-06 23:46:46 +01:00
Move new extension to a separate file 2023-03-06 23:28:53 +01:00			`global params, wav_idx, user, user_info`
Make the code more like PEP8 for readability (#862) 2023-04-07 05:15:45 +02:00
			`if not params['activate']:`
Move new extension to a separate file 2023-03-06 23:28:53 +01:00			`return string`
Make the code more like PEP8 for readability (#862) 2023-04-07 05:15:45 +02:00			`elif user_info is None:`
Move new extension to a separate file 2023-03-06 23:28:53 +01:00			`return string`

			`string = remove_surrounded_chars(string)`
			`string = string.replace('"', '')`
			`string = string.replace('“', '')`
			`string = string.replace('\n', ' ')`
			`string = string.strip()`

			`if string == '':`
			`string = 'empty reply, try regenerating'`
Make the code more like PEP8 for readability (#862) 2023-04-07 05:15:45 +02:00
Improve readability 2023-03-06 23:46:46 +01:00			`output_file = Path(f'extensions/elevenlabs_tts/outputs/{wav_idx:06d}.wav'.format(wav_idx))`
Move new extension to a separate file 2023-03-06 23:28:53 +01:00			`voice = user.get_voices_by_name(params['selected_voice'])[0]`
			`audio_data = voice.generate_audio_bytes(string)`
Improve readability 2023-03-06 23:46:46 +01:00			`save_bytes_to_path(Path(f'extensions/elevenlabs_tts/outputs/{wav_idx:06d}.wav'), audio_data)`
Move new extension to a separate file 2023-03-06 23:28:53 +01:00
			`string = f'<audio src="file/{output_file.as_posix()}" controls></audio>'`
			`wav_idx += 1`
			`return string`

Make the code more like PEP8 for readability (#862) 2023-04-07 05:15:45 +02:00
Move new extension to a separate file 2023-03-06 23:28:53 +01:00			`def ui():`
Improve readability 2023-03-06 23:46:46 +01:00
Move new extension to a separate file 2023-03-06 23:28:53 +01:00			`# Gradio elements`
			`with gr.Row():`
			`activate = gr.Checkbox(value=params['activate'], label='Activate TTS')`
			`connection_status = gr.Textbox(value='Disconnected', label='Connection Status')`
			`voice = gr.Dropdown(value=params['selected_voice'], choices=initial_voice, label='TTS Voice')`
			`with gr.Row():`
			`api_key = gr.Textbox(placeholder="Enter your API key.", label='API Key')`
			`connect = gr.Button(value='Connect')`
Improve readability 2023-03-06 23:46:46 +01:00
Move new extension to a separate file 2023-03-06 23:28:53 +01:00			`# Event functions to update the parameters in the backend`
			`activate.change(lambda x: params.update({'activate': x}), activate, None)`
			`voice.change(lambda x: params.update({'selected_voice': x}), voice, None)`
			`api_key.change(lambda x: params.update({'api_key': x}), api_key, None)`
			`connect.click(check_valid_api, [], connection_status)`
Make the code more like PEP8 for readability (#862) 2023-04-07 05:15:45 +02:00			`connect.click(refresh_voices, [], voice)`