Spaces:

Iblouse
/

image-captioning-api

Sleeping

image-captioning-api / app.py

Update app.py

973104b verified 4 months ago

987 Bytes

	import os
	import gradio as gr
	from transformers import pipeline

	# Model to load: a Hugging Face Hub model ID (a local checkpoint directory
	# would also be accepted by pipeline()).
	# NOTE: a Hub ID is not a filesystem path, so it must not be gated on
	# os.path.exists() -- that check fails on any machine without a same-named
	# local directory and prevents the app from starting. pipeline() resolves
	# the identifier itself and reports its own error if it cannot be loaded.
	model_path = "Salesforce/blip-image-captioning-base"

	# Build the image-to-text pipeline once at startup so every request reuses it.
	pipe = pipeline("image-to-text", model=model_path)

	def launch(input):
	    """
	    Generate a caption for an image.

	    Args:
	        input (PIL.Image): Input image for captioning. May be ``None`` when
	            the request is submitted without an image.

	    Returns:
	        str: Generated caption for the input image, or an empty string when
	            no image was supplied or the pipeline produced no result.
	    """
	    # The parameter name shadows the builtin ``input`` but is kept so that
	    # existing keyword callers keep working.
	    if input is None:
	        # Nothing to caption; avoid handing None to the pipeline.
	        return ""

	    out = pipe(input)
	    if not out:
	        # Guard against an empty result list before indexing into it.
	        return ""
	    return out[0]['generated_text']

	# Wire the captioning callback into an image-in, text-out Gradio UI.
	image_input = gr.Image(type='pil')  # the callback receives a PIL image
	iface = gr.Interface(fn=launch, inputs=image_input, outputs="text")

	# Start serving the interface.
	iface.launch()