Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
import gradio as gr | |
import cohere | |
import os | |
import re | |
import uuid | |
import secrets | |
cohere_api_key = os.getenv("COHERE_API_KEY") | |
AYA_MODEL_NAME = os.getenv("AYA_MODEL_NAME") | |
co = cohere.Client(cohere_api_key, client_name="huggingface-aya-23") | |
def trigger_example(example): | |
chat, updated_history = generate_response(example) | |
return chat, updated_history | |
def generate_response(user_message, cid, token, history=None): | |
if not token: | |
raise gr.Error("Error loading.") | |
if history is None: | |
history = [] | |
if cid == "" or None: | |
cid = str(uuid.uuid4()) | |
print(f"cid: {cid} prompt:{user_message}") | |
history.append(user_message) | |
stream = co.chat_stream(message=user_message, conversation_id=cid, model=AYA_MODEL_NAME, connectors=[], temperature=0.3) | |
#stream = co.generate(prompt=user_message, model='c4ai-aya-23') | |
output = "" | |
for idx, response in enumerate(stream): | |
if response.event_type == "text-generation": | |
output += response.text | |
if idx == 0: | |
history.append(" " + output) | |
else: | |
history[-1] = output | |
chat = [ | |
(history[i].strip(), history[i + 1].strip()) | |
for i in range(0, len(history) - 1, 2) | |
] | |
yield chat, history, cid | |
return chat, history, cid | |
def clear_chat(): | |
return [], [], str(uuid.uuid4()) | |
examples = [ | |
"Explain the relativity theory in French", | |
"Como sair de um helicóptero que caiu na água?", | |
"¿Cómo le explicarías el aprendizaje automático a un extraterrestre?", | |
"Explain gravity to a chicken.", | |
"Descrivi il processo di creazione di un capolavoro, come se fossi un artista del Rinascimento a Firenze.", | |
"Anneme onu ne kadar sevdiğimi anlatan bir mektup yaz", | |
"Explique-moi le sens de la vie selon un grand auteur littéraire.", | |
"Give me an example of an endangered species and let me know what I can do to help preserve it", | |
"یک پاراگراف در مورد زیباییهای طبیعت در فصل پاییز بنویس", | |
"Wie kann ich lernen, selbstbewusster zu werden?", | |
"Formally introduce the transformer architecture with notation.", | |
] | |
custom_css = """ | |
#logo-img { | |
border: none !important; | |
} | |
#chat-message { | |
font-size: 14px; | |
min-height: 300px; | |
} | |
""" | |
with gr.Blocks(analytics_enabled=False, css=custom_css) as demo: | |
cid = gr.State("") | |
token = gr.State(value=None) | |
with gr.Row(): | |
with gr.Column(scale=1): | |
gr.Image("aya-logo.png", elem_id="logo-img", show_label=False, show_share_button=False, show_download_button=False) | |
with gr.Column(scale=3): | |
gr.Markdown("""C4AI Aya 23 is a research open weights release of an 8 and 35 billion parameter with highly advanced instruction fine-tuned model, covering 23 languages: Arabic, Chinese (simplified & traditional), Czech, Dutch, English, French, German, Greek, Hebrew, Hindi, Indonesian, Italian, Japanese, Korean, Persian, Polish, Portuguese, Romanian, Russian, Spanish, Turkish, Ukrainian, and Vietnamese. | |
<br/> | |
**Note**: Aya 23 is a single-turn instruction-following model and it is not optimized for chat mode use. | |
<br/> | |
**Model**: [aya-23-35B](https://huggingface.co./CohereForAI/aya-23-35B) | |
<br/> | |
**Developed by**: [Cohere for AI](https://cohere.com/research) and [Cohere](https://cohere.com/) | |
<br/> | |
**License**: [CC-BY-NC](https://cohere.com/c4ai-cc-by-nc-license), requires also adhering to [C4AI's Acceptable Use Policy](https://docs.cohere.com/docs/c4ai-acceptable-use-policy) | |
""" | |
) | |
with gr.Column(): | |
with gr.Row(): | |
chatbot = gr.Chatbot(show_label=False, show_share_button=False, show_copy_button=True) | |
with gr.Row(): | |
user_message = gr.Textbox(lines=1, placeholder="Ask anything ...", label="Input", show_label=False) | |
with gr.Row(): | |
submit_button = gr.Button("Submit") | |
clear_button = gr.Button("Clear chat") | |
history = gr.State([]) | |
user_message.submit(fn=generate_response, inputs=[user_message, cid, token, history], outputs=[chatbot, history, cid], concurrency_limit=32) | |
submit_button.click(fn=generate_response, inputs=[user_message, cid, token, history], outputs=[chatbot, history, cid], concurrency_limit=32) | |
clear_button.click(fn=clear_chat, inputs=None, outputs=[chatbot, history, cid], concurrency_limit=32) | |
user_message.submit(lambda x: gr.update(value=""), None, [user_message], queue=False) | |
submit_button.click(lambda x: gr.update(value=""), None, [user_message], queue=False) | |
clear_button.click(lambda x: gr.update(value=""), None, [user_message], queue=False) | |
with gr.Row(): | |
gr.Examples( | |
examples=examples, | |
inputs=user_message, | |
cache_examples=False, | |
fn=trigger_example, | |
outputs=[chatbot], | |
examples_per_page=100 | |
) | |
demo.load(lambda: secrets.token_hex(16), None, token) | |
if __name__ == "__main__": | |
# demo.launch(debug=True) | |
try: | |
demo.queue(api_open=False, max_size=40).launch(show_api=False) | |
except Exception as e: | |
print(f"Error: {e}") |