Spaces:

Iblouse
/

image-captioning-api

Sleeping

image-captioning-api / app.py

Update app.py

e1ec791 verified 5 months ago

771 Bytes

	import os
	import gradio as gr
	from transformers import pipeline

	# Initialize the image-to-text pipeline with the specified model
	pipe = pipeline("image-to-text", model="Salesforce/blip-image-captioning-base")

	def launch(input):
	"""
	Function to generate image caption.

	Args:
	input (PIL.Image): Input image for captioning.

	Returns:
	str: Generated caption for the input image.
	"""
	out = pipe(input)
	return out[0]['generated_text']

	# Create a Gradio interface for the image-to-text pipeline
	iface = gr.Interface(
	fn=launch, # Function to generate captions
	inputs=gr.Image(type='pil'), # Input type: Image (PIL format)
	outputs="text" # Output type: Text
	)

	# Launch the Gradio interface
	iface.launch()