openaitts

Sleeping

File size: 1,858 Bytes

aa95dd5
 
 
530748c
aa95dd5
99bdf0c
aa95dd5
2240547
7d0efdb
 
 
 
e92c6df
7d0efdb
 
a7f8c36
 
 
7d0efdb
 
 
 
 
 
aa95dd5
 
 
 
 
 
 
 
 
 
 
 
99bdf0c
2240547
7ebcd98
 
aa95dd5
2240547
ae677e4
aa95dd5
 
7d0efdb
 
aa95dd5
c594df9

import gradio as gr
import os
import tempfile
from openai import OpenAI

# OpenAI API key, read once at import time from the 'apikey' environment
# variable; the value is None when that variable is not set.
api_key = os.environ.get('apikey')

def tts(text, model, voice, api_key):
    """Generate speech for *text* via the OpenAI API and return an MP3 file path.

    Args:
        text: The text to convert to speech.
        model: OpenAI TTS model name, e.g. "tts-1" or "tts-1-hd".
        voice: Voice name, e.g. 'alloy', 'echo', 'fable', 'onyx', 'nova',
            'shimmer'.
        api_key: OpenAI API key used to construct the client.

    Returns:
        Path of a temporary ``.mp3`` file containing the generated audio.
        The file is created with ``delete=False``, so it is not removed
        automatically.

    Raises:
        gr.Error: If no API key is supplied, or if creating the client or
            the speech request fails for any reason.
    """
    # Truthiness also rejects None, which os.getenv yields for an unset
    # variable; comparing against '' alone would let None through.
    if not api_key:
        raise gr.Error('Please enter your OpenAI API Key')

    try:
        client = OpenAI(api_key=api_key)
        response = client.audio.speech.create(
            model=model,
            voice=voice,
            input=text,
        )
    except Exception as error:
        # Log the underlying failure *before* raising; a statement placed
        # after the raise would never run.
        print(str(error))
        raise gr.Error("An error occurred while generating speech. Please check your API key and try again.") from error

    # Persist the audio bytes to a temp file that outlives this function so
    # the caller can read it by path.
    with tempfile.NamedTemporaryFile(suffix=".mp3", delete=False) as temp_file:
        temp_file.write(response.content)

    return temp_file.name


def _tts_with_env_key(text, model, voice):
    """Call `tts` with the module-level `api_key` supplied as the key.

    Event-listener `inputs` must be Gradio components, so the plain-string
    API key is bound here instead of being listed as an input.
    """
    return tts(text, model, voice, api_key)


# Build the UI: model/voice selectors, a text box, a trigger button and an
# audio player for the generated speech.
with gr.Blocks() as demo:
    gr.Markdown("## OpenAI Text-To-Speech")
    with gr.Row(variant='panel'):
        model = gr.Dropdown(choices=['tts-1','tts-1-hd'], label='Model', value='tts-1')
        voice = gr.Dropdown(choices=['alloy', 'echo', 'fable', 'onyx', 'nova', 'shimmer'], label='Voice Options', value='alloy')

    text = gr.Textbox(label="Input text", placeholder="Enter your text and then click on the 'Text-To-Speech' button, or simply press the Enter key.")
    btn = gr.Button("Text-To-Speech")
    output_audio = gr.Audio(label="Speech Output")

    # Pressing Enter in the text box and clicking the button trigger the
    # same handler; only real components are passed as inputs.
    text.submit(fn=_tts_with_env_key, inputs=[text, model, voice], outputs=output_audio, api_name="tts_enter_key", concurrency_limit=None)
    btn.click(fn=_tts_with_env_key, inputs=[text, model, voice], outputs=output_audio, api_name="tts_button", concurrency_limit=None)

demo.launch()