Spaces:

jjz5463
/

Diary-AI

Paused

App Files Files Community

Diary-AI / app.py

jjz5463

cache_dir

80db327 3 months ago

raw

history blame

2.7 kB

	import gradio as gr
	import openai
	import json
	from PIL import Image
	from google.oauth2 import service_account
	from baseline_utils import detect_text_in_image, summarize_diary_text, analyze_writer_image, generate_comic_book
	import glob
	import os

	# Load secrets from Hugging Face Spaces environment.
	# The two API keys are read as plain strings; os.getenv yields None when a
	# variable is unset, and the value is handed as-is to the helper calls.
	openai_api_key = os.getenv("OPENAI_API_KEY")

	# GOOGLE_SERVICE_ACCOUNT holds the service-account key as a JSON string.
	# json.loads(None) would fail with an opaque TypeError, so fail fast with a
	# message that names the missing secret instead.
	_google_service_account_json = os.getenv("GOOGLE_SERVICE_ACCOUNT")
	if _google_service_account_json is None:
	    raise RuntimeError(
	        "GOOGLE_SERVICE_ACCOUNT environment variable is not set; "
	        "it must contain the Google service account JSON."
	    )
	google_service_account_info = json.loads(_google_service_account_json)

	gemini_api_key = os.getenv("GEMINI_API_KEY")

	# Local-development alternative (kept for reference): instead of reading the
	# environment, load the secrets from the local keys/ package.
	# from keys.keys import *
	# openai_api_key = open_ai_keys
	# with open('keys/service_account_credentials.json') as f:
	#     google_service_account_info = json.load(f)
	# gemini_api_key = gemini_keys

	def get_google_credentials():
	    """Build Google service-account credentials from the loaded key info.

	    Returns:
	        The credentials object produced by
	        ``service_account.Credentials.from_service_account_info`` for the
	        module-level ``google_service_account_info`` mapping.
	    """
	    credentials_cls = service_account.Credentials
	    return credentials_cls.from_service_account_info(google_service_account_info)


	def _comic_page_sort_key(page_path):
	    """Return a sort key that orders ``page_<n>.png`` files by page number."""
	    stem = os.path.splitext(os.path.basename(page_path))[0]
	    suffix = stem.rpartition("_")[2]
	    if suffix.isdecimal():
	        return (0, int(suffix), page_path)
	    # Names without a numeric suffix sort after the numbered pages.
	    return (1, 0, page_path)


	def process_images(diary_image, writer_image):
	    """Turn a diary image and a writer photo into comic book page files.

	    The two images are written to ``temp_upload_images/``, the diary text is
	    detected and summarized, the writer photo is analyzed, and a four-page
	    comic book is generated from the two summaries.

	    Args:
	        diary_image: Image of the handwritten diary; must provide a
	            ``save(path)`` method (the UI passes PIL images).
	        writer_image: Photo of the writer; same requirement.

	    Returns:
	        A list of file paths matching ``comic_book/page_*.png``, ordered by
	        page number (so ``page_10`` follows ``page_9`` rather than ``page_1``).

	    Raises:
	        ValueError: If either image is ``None`` (nothing was uploaded).
	    """
	    # Fail early with a clear message instead of an AttributeError on .save().
	    if diary_image is None or writer_image is None:
	        raise ValueError("Both a diary image and a writer image are required.")

	    # Save the uploaded images as files so the helpers can read them by path.
	    # NOTE(review): the file names are fixed, so overlapping requests would
	    # overwrite each other's uploads -- confirm requests are serialized.
	    diary_image_path = "temp_upload_images/temp_diary_image.png"
	    writer_image_path = "temp_upload_images/temp_writer_image.png"
	    os.makedirs("temp_upload_images", exist_ok=True)
	    diary_image.save(diary_image_path)
	    writer_image.save(writer_image_path)

	    # Detect text from the diary image, then summarize it.
	    google_credentials = get_google_credentials()
	    detected_text = detect_text_in_image(diary_image_path, google_credentials)
	    summarized_text = summarize_diary_text(detected_text, openai_api_key)

	    # Analyze the writer's image using the Gemini API key.
	    writer_summary = analyze_writer_image(writer_image_path, gemini_api_key)

	    # Generate the comic book based on the two summaries.
	    generate_comic_book(summarized_text, writer_summary, num_pages=4)

	    # Assumes the generated pages are saved as 'comic_book/page_1.png',
	    # 'comic_book/page_2.png', etc. -- TODO confirm in generate_comic_book.
	    # NOTE(review): pages left over from an earlier run would be picked up as
	    # well -- confirm generate_comic_book clears or overwrites the directory.
	    return sorted(glob.glob("comic_book/page_*.png"), key=_comic_page_sort_key)


	# Define the Gradio interface
	def gradio_interface(diary_image, writer_image):
	    """Gradio callback: build the comic book and return its pages as images.

	    Args:
	        diary_image: PIL image of the handwritten diary, or ``None`` when the
	            user did not upload one.
	        writer_image: PIL image of the writer, or ``None`` when missing.

	    Returns:
	        A list of PIL images, one per generated comic book page, in the order
	        returned by ``process_images``.

	    Raises:
	        gr.Error: If either image is missing, so the UI shows a readable
	            message instead of a generic failure.
	    """
	    if diary_image is None or writer_image is None:
	        raise gr.Error("Please upload both the diary image and the writer photo.")

	    # Process the images and generate comic book pages
	    page_paths = process_images(diary_image, writer_image)

	    # Image.open is lazy and keeps the file handle open; copy each page into
	    # memory inside a context manager so the handle is closed right away.
	    pages = []
	    for page_path in page_paths:
	        with Image.open(page_path) as page:
	            pages.append(page.copy())
	    return pages


	# Build the Gradio UI: two image uploads in, a gallery of comic pages out.
	# The components are created in the same order as before (inputs first,
	# then the output gallery) and handed to gr.Interface by name.
	diary_upload = gr.Image(label="Upload your handwritten diary image", type="pil")
	writer_upload = gr.Image(label="Upload a photo of the writer", type="pil")
	comic_gallery = gr.Gallery(label="Generated Comic Book Pages")

	interface = gr.Interface(
	    fn=gradio_interface,
	    inputs=[diary_upload, writer_upload],
	    outputs=comic_gallery,
	    title="Handwritten Diary to Comic Book",
	)

	# Start serving the app
	interface.launch()