# Scraped page header (Hugging Face Spaces): salomonsky / flux3 -- status: Running
# File size: 5,216 Bytes
# The page also listed short hex identifiers next to the source lines
# (apparently per-line commit hashes from a blame view). Distinct values:
#   0cfb4a5 d4fba6d 0dec378 757da8f 2fc432b d95dbe9 32fdddd 219d097 471c590
#   52a0784 481dde5 1a52ee5 68ef0f8 2f35681 ffe0681 e3be785 d8f32ab 2713519
#   3b4ee8c 450c3d6

import asyncio
import logging
import os
import random
import tempfile

import gradio as gr
import numpy as np
from gradio_client import Client, handle_file
from gradio_imageslider import ImageSlider
from huggingface_hub import AsyncInferenceClient, InferenceClient
from PIL import Image

# Largest signed 32-bit integer; used as the upper bound for random seeds.
MAX_SEED = np.iinfo(np.int32).max
# Access tokens read from the environment (None when the variable is unset).
# NOTE(review): HF_TOKEN is not referenced again in the visible code -- confirm
# whether the inference clients below are expected to receive it explicitly.
HF_TOKEN = os.environ.get("HF_TOKEN")
# Passed as `hf_token` to the upscaler Space client in get_upscale_finegrain.
HF_TOKEN_UPSCALER = os.environ.get("HF_TOKEN_UPSCALER")

# Async inference client used for text-to-image requests (no explicit arguments).
client = AsyncInferenceClient()
# Synchronous client bound to the Mixtral instruct model; used by improve_prompt.
llm_client = InferenceClient("mistralai/Mixtral-8x7B-Instruct-v0.1")

def enable_lora(lora_add, basemodel):
    """Choose the model identifier to generate with.

    Args:
        lora_add: LoRA model identifier. Any falsy value (``None``, ``""``)
            is treated as "no LoRA selected".
        basemodel: Base model identifier used as the fallback.

    Returns:
        ``lora_add`` when it is truthy, otherwise ``basemodel``.
    """
    if lora_add:
        return lora_add
    return basemodel

async def generate_image(prompt, model, lora_word, width, height, scales, steps, seed):
    """Generate an image from text via the module-level async inference client.

    Args:
        prompt: Text description of the desired image.
        model: Model identifier forwarded to ``client.text_to_image``.
        lora_word: Optional trigger word appended to the prompt after a comma.
            Skipped when empty so the prompt does not end in a dangling comma.
        width: Requested image width, forwarded unchanged.
        height: Requested image height, forwarded unchanged.
        scales: Guidance scale, forwarded as ``guidance_scale``.
        steps: Number of inference steps, forwarded as ``num_inference_steps``.
        seed: Seed for the request. ``-1`` or ``None`` draws a random seed in
            ``[0, MAX_SEED]``.

    Returns:
        ``(image, seed)`` on success, where ``seed`` is the integer seed that
        was actually sent. On any failure, ``(message, None)`` where
        ``message`` is a string starting with ``"Error al generar imagen"``;
        callers detect failure by checking for that string.
    """
    try:
        if seed is None or seed == -1:
            seed = random.randint(0, MAX_SEED)
        seed = int(seed)
        text = f"{prompt},{lora_word}" if lora_word else prompt
        # The seed must be sent with the request; otherwise the value returned
        # to the caller has no relation to the image that was produced.
        image = await client.text_to_image(
            prompt=text,
            height=height,
            width=width,
            guidance_scale=scales,
            num_inference_steps=steps,
            model=model,
            seed=seed,
        )
        return image, seed
    except Exception as e:
        # Deliberate best-effort boundary: the failure is reported as a value.
        return f"Error al generar imagen: {e}", None

def get_upscale_finegrain(prompt, img_path, upscale_factor):
    """Upscale an image through the ``finegrain/finegrain-image-enhancer`` Space.

    This is a best-effort call: any failure is logged and reported as ``None``
    so the caller can fall back to the original image.

    Args:
        prompt: Prompt forwarded to the enhancer.
        img_path: Path of the image to upscale (wrapped with ``handle_file``).
        upscale_factor: Upscale factor forwarded to the enhancer.

    Returns:
        The second element of the Space's ``/process`` result, which the
        caller opens as an image file, or ``None`` when the call fails.
    """
    try:
        # Named `upscaler` so it does not shadow the module-level `client`.
        upscaler = Client("finegrain/finegrain-image-enhancer", hf_token=HF_TOKEN_UPSCALER)
        result = upscaler.predict(
            input_image=handle_file(img_path),
            prompt=prompt,
            negative_prompt="",
            seed=42,
            upscale_factor=upscale_factor,
            controlnet_scale=0.6,
            controlnet_decay=1,
            condition_scale=6,
            tile_width=112,
            tile_height=144,
            denoise_strength=0.35,
            num_inference_steps=18,
            solver="DDIM",
            api_name="/process",
        )
        return result[1]
    except Exception:
        # Keep the None fallback, but leave a trace instead of failing silently.
        logging.getLogger(__name__).exception("Upscaling failed for %r", img_path)
        return None

def _save_as_jpeg(image):
    """Write *image* to a uniquely named JPEG in the temp directory; return its path."""
    # JPEG cannot store alpha or palette data, so normalise such images first.
    if image.mode not in ("RGB", "L"):
        image = image.convert("RGB")
    # delete=False: the file is read after this function returns. A unique
    # name per call keeps concurrent requests from overwriting each other.
    with tempfile.NamedTemporaryFile(suffix=".jpg", delete=False) as handle:
        image.save(handle, format="JPEG")
        return handle.name


async def gen(prompt, basemodel, width, height, scales, steps, seed, upscale_factor, process_upscale, lora_model, process_lora):
    """Generate an image and, optionally, an upscaled version of it.

    Args:
        prompt: Text prompt for generation (also forwarded to the upscaler).
        basemodel: Base model identifier.
        width: Requested image width.
        height: Requested image height.
        scales: Guidance scale.
        steps: Number of inference steps.
        seed: Seed forwarded to ``generate_image``.
        upscale_factor: Factor forwarded to ``get_upscale_finegrain``.
        process_upscale: When truthy, attempt to upscale the generated image.
        lora_model: LoRA model identifier, used only when ``process_lora``.
        process_lora: When truthy, select the model via ``enable_lora``.

    Returns:
        A two-item list of JPEG file paths ``[generated, upscaled]``. The
        second item equals the first when upscaling is disabled or fails.

    Raises:
        gr.Error: When image generation fails; carries the error message.
    """
    model = enable_lora(lora_model, basemodel) if process_lora else basemodel
    image, seed = await generate_image(prompt, model, "", width, height, scales, steps, seed)

    if isinstance(image, str):
        # generate_image reports failures as a message string. Surface it as a
        # UI error rather than handing a non-image value to the output component.
        raise gr.Error(image)

    image_path = _save_as_jpeg(image)
    if not process_upscale:
        return [image_path, image_path]

    # The upscaler is a blocking remote call; run it in the default executor
    # so the event loop stays free for other requests.
    loop = asyncio.get_running_loop()
    upscaled_source = await loop.run_in_executor(
        None, get_upscale_finegrain, prompt, image_path, upscale_factor
    )
    if upscaled_source is None:
        return [image_path, image_path]

    with Image.open(upscaled_source) as upscaled:
        upscaled_path = _save_as_jpeg(upscaled)
    return [image_path, upscaled_path]

def improve_prompt(prompt):
    """Ask the LLM client to expand *prompt* into a richer text-to-image prompt.

    Args:
        prompt: The user's original idea.

    Returns:
        The generated text with surrounding whitespace stripped. On any
        failure, a string starting with ``"Error mejorando el prompt:"``.
    """
    try:
        instruction = "Mejora mi prompt y desarrolla mi idea para texto a imagen en inglés con estilo para el modelo FLUX, cinematografía, cámaras, atmósfera e iluminación para la mejor calidad, de máximo 200 palabras."
        formatted_prompt = f"{instruction}: {prompt}"
        response = llm_client.text_generation(formatted_prompt, max_new_tokens=200)

        # Dispatch on the response type. A membership test on a plain string is
        # a substring search, which would misfire whenever the generated text
        # itself contains the words "generated_text".
        if isinstance(response, str):
            generated = response
        elif isinstance(response, dict):
            generated = response["generated_text"]
        else:
            generated = response.generated_text
        return generated.strip()
    except Exception as e:
        # Deliberate best-effort boundary: the failure is reported as text.
        return f"Error mejorando el prompt: {e}"

# Custom CSS: centers the element with id "col-container" and caps its width.
css = """
#col-container{ margin: 0 auto; max-width: 1024px;}
"""

# Build the UI: an image slider on the left, the controls on the right.
with gr.Blocks(css=css, theme="Nymbo/Nymbo_Theme") as demo:
    with gr.Column(elem_id="col-container"):
        with gr.Row():
            with gr.Column(scale=3):
                # Receives the two-item list returned by `gen`.
                output_res = ImageSlider(label="Flux / Upscaled")
            with gr.Column(scale=2):
                prompt = gr.Textbox(label="Descripción de imágen")
                # Read-only box filled by `improve_prompt`.
                improved_prompt = gr.Textbox(label="Mejorada mi idea", interactive=False)
                improve_btn = gr.Button("Mejora mi prompt")
                basemodel_choice = gr.Dropdown(label="Modelo", choices=["black-forest-labs/FLUX.1-schnell", "black-forest-labs/FLUX.1-DEV"], value="black-forest-labs/FLUX.1-schnell")
                lora_model_choice = gr.Dropdown(label="LORA Realismo", choices=["Shakker-Labs/FLUX.1-dev-LoRA-add-details", "XLabs-AI/flux-RealismLora"], value="XLabs-AI/flux-RealismLora")
                process_lora = gr.Checkbox(label="Procesar LORA")
                process_upscale = gr.Checkbox(label="Procesar Escalador")
                upscale_factor = gr.Radio(label="Factor de Escala", choices=[2, 4, 8], value=2)
                # Rewrite the user's prompt and show the result in `improved_prompt`.
                improve_btn.click(fn=improve_prompt, inputs=[prompt], outputs=improved_prompt)
                
                with gr.Accordion(label="Opciones Avanzadas", open=False):
                    width = gr.Slider(label="Ancho", minimum=512, maximum=1280, step=8, value=1280)
                    height = gr.Slider(label="Alto", minimum=512, maximum=1280, step=8, value=768)
                    scales = gr.Slider(label="Escalado", minimum=1, maximum=20, step=1, value=10)
                    steps = gr.Slider(label="Pasos", minimum=1, maximum=100, step=1, value=20)
                    # -1 makes generate_image draw a random seed.
                    seed = gr.Number(label="Semilla", value=-1)
    
                btn = gr.Button("Generar")
                # The input order must match the parameter order of `gen`.
                # NOTE(review): generation reads `improved_prompt`, not `prompt`, so
                # it looks like the prompt is empty until "Mejora mi prompt" has
                # been used -- confirm this is intended.
                btn.click(fn=gen, inputs=[improved_prompt, basemodel_choice, width, height, scales, steps, seed, upscale_factor, process_upscale, lora_model_choice, process_lora], outputs=output_res)
    # NOTE(review): launch() is called inside the Blocks context -- confirm intended.
    demo.launch()