Spaces:

way2call
/

Testing-Way2CALL-models

Sleeping

Update app.py

341548b verified 3 months ago

1.52 kB

	import gradio as gr
	from openai import OpenAI

	BASE_URL = "https://w0xtwbf2fdxe1q-8000.proxy.runpod.net/v1/chat/completions"
	API_KEY="SOMEHOW"

	# Create an OpenAI client to interact with the API server
	client = OpenAI(
	base_url=BASE_URL,
	api_key=API_KEY
	)

	def predict(message, history):
	# Convert chat history to OpenAI format
	history_openai_format = [{
	"role": "system",
	"content": "Tu es un excellent assistant IA développé par WAY2CALL pour faire des évaluations en JSON des audios transcrits."
	}]
	for i, (human, assistant) in enumerate(history):
	if i % 2 == 0:
	history_openai_format.append({"role": "user", "content": human})
	else:
	history_openai_format.append({"role": "assistant", "content": assistant})
	history_openai_format.append({"role": "user", "content": message})

	# Create a chat completion request and send it to the API server
	stream = client.chat.completions.create(
	model="way2call/way2call-7b-evaluation-instruct", # Model name to use
	messages=history_openai_format, # Chat history
	temperature=0.1, # Temperature for text generation
	stream=True, # Stream response
	)

	# Read and return generated text from response stream
	partial_message = ""
	for chunk in stream:
	partial_message += (chunk.choices[0].delta.content or "")
	yield partial_message

	# Create and launch a chat interface with Gradio
	gr.ChatInterface(predict).queue().launch()