Spaces:

Hieucyber2208
/

know-flow

Sleeping

App Files Files Community

know-flow / src /image_gen.py

Hieucyber2208

Update src/image_gen.py

e3ec604 verified 3 months ago

raw

history blame

5.58 kB

	from huggingface_hub import InferenceClient
	import os
	import glob
	from collections import defaultdict
	import google.generativeai as genai
	from tqdm import tqdm
	from huggingface_hub.utils import HfHubHTTPError
	import random
	import time
	from dotenv import load_dotenv

	load_dotenv()
	HF_TOKEN = os.getenv("HF_TOKEN")
	GOOGLE_API_KEY = os.getenv("GOOGLE_API_KEY")
	genai.configure(api_key=GOOGLE_API_KEY)
	client = InferenceClient(provider="hf-inference", api_key=HF_TOKEN)

	def split_text_for_images(number_of_images):
	with open("./text/text.txt", "r", encoding="utf-8") as file:
	text = file.read().strip()

	total_length = len(text)
	chunk_size = total_length // number_of_images # Độ dài trung bình của mỗi đoạn

	chunks = []
	start = 0

	for i in range(number_of_images):
	# Xác định điểm kết thúc gần nhất tại dấu câu (nếu có)
	end = start + chunk_size
	if i < number_of_images - 1:
	while end < total_length and text[end] not in ".!?":
	end += 1 # Mở rộng đến dấu câu gần nhất để tránh cắt ngang câu
	if end < total_length - 1:
	end += 1 # Bao gồm cả dấu câu vào đoạn

	chunk = text[start:end].strip()
	chunks.append(chunk)
	start = end # Bắt đầu đoạn tiếp theo từ đây

	return chunks
	def describe_image(description, detail_level="short", perspective="neutral", emotion=None, time_setting=None, art_style=None):
	"""
	Nhận một đoạn văn mô tả chi tiết và trả về một câu mô tả hình ảnh theo các tùy chỉnh.

	Args:
	description (str): Đoạn văn mô tả chi tiết.
	detail_level (str): Mức độ chi tiết ("short" hoặc "detailed").
	perspective (str): Góc nhìn ("subjective" hoặc "neutral").
	emotion (str, optional): Cảm xúc chủ đạo (nếu có, ví dụ: "mysterious", "romantic").
	time_setting (str, optional): Bối cảnh thời gian (ví dụ: "modern", "medieval", "futuristic").
	art_style (str, optional): Phong cách nghệ thuật (ví dụ: "realistic", "abstract", "sketch").

	Returns:
	str: Một câu mô tả hình ảnh theo yêu cầu.
	"""

	prompt = f"""
	Bạn là chuyên gia mô tả hình ảnh. Hãy đọc đoạn mô tả dưới đây và tạo một mô tả hình ảnh theo các tiêu chí sau:
	- Mức độ chi tiết: {"Ngắn gọn" if detail_level == "short" else "Chi tiết"}.
	- Góc nhìn: {"Chủ quan" if perspective == "subjective" else "Trung lập"}.
	{f"- Cảm xúc chủ đạo: {emotion}." if emotion else ""}
	{f"- Bối cảnh thời gian: {time_setting}." if time_setting else ""}
	{f"- Phong cách nghệ thuật: {art_style}." if art_style else ""}

	Đoạn mô tả:
	{description}

	Hãy tạo một mô tả hình ảnh phù hợp với yêu cầu trên bằng Tiếng Anh.
	"""

	try:
	model = genai.GenerativeModel("gemini-pro")
	response = model.generate_content(prompt)
	return response.text.strip()
	except Exception as e:
	print(f"Lỗi khi gọi API Gemini: {e}")
	return ""
	def generate_image(prompt, output_path, style=None, color_palette=None):
	model="stabilityai/stable-diffusion-3.5-large"
	"""
	Tạo hình ảnh từ mô tả văn bản với các tùy chỉnh linh hoạt.

	:param prompt: Mô tả hình ảnh đầu vào.
	:param output_path: Đường dẫn lưu ảnh đầu ra.
	:param model: Mô hình AI sử dụng để tạo ảnh.
	:param style: Phong cách hình ảnh (nếu có, ví dụ: 'realistic', 'anime', 'cyberpunk').
	:param color_palette: Bảng màu ưu tiên (nếu có, ví dụ: 'vibrant', 'monochrome').
	"""
	custom_prompt = prompt

	if style:
	custom_prompt += f" in {style} style"
	if color_palette:
	custom_prompt += f" with {color_palette} color scheme"

	image = client.text_to_image(custom_prompt, model=model)
	image.save(output_path)
	print(f"✅Image saved at {output_path}")
	def image_gen(number_of_images = 3,detail_level = "short", perspective="neutral", emotion=None, time_setting=None, art_style=None, style=None, color_palette=None):
	texts = split_text_for_images(number_of_images)
	index = 0
	for text in tqdm(texts, desc="Processing", unit="image"):
	output_path = f"./image/{index}.png"
	prompt = describe_image(text, detail_level, perspective, emotion, time_setting, art_style)
	print(prompt)

	# Cơ chế retry với backoff
	max_retries = 5
	retry_count = 0

	while retry_count < max_retries:
	try:
	generate_image(prompt, output_path, style, color_palette)
	time.sleep(60) # Chờ sau khi tạo ảnh thành công
	break # Nếu thành công thì thoát khỏi vòng lặp retry
	except HfHubHTTPError as e:
	print(f"Lỗi khi gọi API: {e}")
	retry_count += 1
	wait_time = 2 ** retry_count + random.uniform(0, 1) # Exponential backoff
	print(f"Thử lại sau {wait_time:.2f} giây...")
	time.sleep(wait_time)
	index += 1
	os.remove("./text/text.txt")
	if __name__ == "__main__":
	image_gen(number_of_images = 3, detail_level="short", perspective="neutral", emotion="sad", time_setting="classic", art_style="realistic", style="anime", color_palette="monochrome")