sdafd committed · verified · Commit c23b561 · 1 Parent(s): e59f7e5

Update app.py

Files changed (1): app.py (+179 −597)

app.py CHANGED
@@ -1,621 +1,203 @@
  import gradio as gr
- import google.generativeai as genai
- import os
- import mimetypes
  from PIL import Image
- import io
- import magic # python-magic library
- from dotenv import load_dotenv
-
- # (Optional) Load environment variables for local testing if you have a .env file
- # load_dotenv()
- # TEST_API_KEY = os.getenv("GEMINI_API_KEY") # Use this ONLY for your local testing
-
- # --- Constants ---
- # Define available models (expand this list as needed)
- # Include models supporting different modalities and versions
- AVAILABLE_MODELS = [
-     "gemini-1.5-flash-latest",
-     "gemini-1.5-pro-latest",
-     "gemini-1.0-pro",
-     "gemini-pro-vision", # Example vision model
-     # "gemini-experimental", # Add other relevant models
  ]

- # Define parameters for each model (Example structure)
- # This needs meticulous mapping based on official Gemini documentation
- MODEL_PARAMS = {
-     "gemini-1.5-flash-latest": {
-         "temperature": {"type": "slider", "min": 0.0, "max": 2.0, "step": 0.1, "default": 1.0},
-         "top_p": {"type": "slider", "min": 0.0, "max": 1.0, "step": 0.01, "default": 0.95},
-         "top_k": {"type": "slider", "min": 1, "max": 100, "step": 1, "default": 40},
-         "max_output_tokens": {"type": "number", "min": 1, "step": 1, "default": 8192},
-         "stop_sequences": {"type": "textbox", "lines": 1, "placeholder": "e.g., END,STOP", "default": ""},
-         # Safety settings could be added here too (as dropdowns or checkboxes)
-     },
-     "gemini-1.5-pro-latest": {
-         # Similar params, possibly different defaults or ranges
-         "temperature": {"type": "slider", "min": 0.0, "max": 2.0, "step": 0.1, "default": 1.0},
-         "top_p": {"type": "slider", "min": 0.0, "max": 1.0, "step": 0.01, "default": 0.95},
-         "top_k": {"type": "slider", "min": 1, "max": 100, "step": 1, "default": 40},
-         "max_output_tokens": {"type": "number", "min": 1, "step": 1, "default": 8192},
-         "stop_sequences": {"type": "textbox", "lines": 1, "placeholder": "e.g., END,STOP", "default": ""},
-     },
-     "gemini-1.0-pro": {
-         # Params for older model might differ slightly
-         "temperature": {"type": "slider", "min": 0.0, "max": 1.0, "step": 0.1, "default": 0.9}, # Different max/default maybe
-         "top_p": {"type": "slider", "min": 0.0, "max": 1.0, "step": 0.01, "default": 0.95},
-         "top_k": {"type": "slider", "min": 1, "max": 100, "step": 1, "default": 40},
-         "max_output_tokens": {"type": "number", "min": 1, "step": 1, "default": 2048}, # Different default
-         "stop_sequences": {"type": "textbox", "lines": 1, "placeholder": "e.g., END,STOP", "default": ""},
-     },
-     "gemini-pro-vision": {
-         # Vision models might have fewer text-generation params or different ones
-         "temperature": {"type": "slider", "min": 0.0, "max": 1.0, "step": 0.1, "default": 0.4},
-         "top_p": {"type": "slider", "min": 0.0, "max": 1.0, "step": 0.01, "default": 0.95},
-         "top_k": {"type": "slider", "min": 1, "max": 100, "step": 1, "default": 32},
-         "max_output_tokens": {"type": "number", "min": 1, "step": 1, "default": 2048},
-         # No stop sequences typically needed here? Check docs.
-     }
  }

- # --- Helper Functions ---
-
- def get_mime_type(file_path):
-     """Get MIME type using python-magic for reliability."""
-     try:
-         mime = magic.Magic(mime=True)
-         return mime.from_file(file_path)
-     except Exception:
-         # Fallback to mimetypes if magic fails
-         return mimetypes.guess_type(file_path)[0]
-
- def convert_file_to_text(file_obj):
-     """
-     Attempts to convert various file types to text.
-     Returns (text_content, original_filename) or (None, original_filename) if conversion fails.
-     """
-     file_path = file_obj.name
-     filename = os.path.basename(file_path)
-     mime_type = get_mime_type(file_path)
-     print(f"Processing file: {filename}, MIME type: {mime_type}") # Debugging
-
-     try:
-         if mime_type is None:
-             # If MIME type is unknown, try reading as text
-             print(f"Warning: Unknown MIME type for {filename}. Attempting to read as text.")
-             with open(file_path, 'r', encoding='utf-8', errors='ignore') as f:
-                 return f.read(), filename
-         elif mime_type.startswith("text/"):
-             with open(file_path, 'r', encoding='utf-8', errors='ignore') as f:
-                 return f.read(), filename
-         elif mime_type == "application/pdf":
-             # Placeholder for PDF conversion (requires pypdf or similar)
-             print(f"PDF conversion not implemented yet for {filename}.")
-             # from pypdf import PdfReader # Example
-             # reader = PdfReader(file_path)
-             # text = ""
-             # for page in reader.pages:
-             #     text += page.extract_text() + "\n"
-             # return text, filename
-             return f"[Unsupported PDF: {filename} - Conversion not implemented]", filename # Temporary
-         elif mime_type in ["application/msword", "application/vnd.openxmlformats-officedocument.wordprocessingml.document"]:
-             # Placeholder for DOCX conversion (requires python-docx or similar)
-             print(f"DOCX conversion not implemented yet for {filename}.")
-             # import docx # Example
-             # doc = docx.Document(file_path)
-             # text = "\n".join([para.text for para in doc.paragraphs])
-             # return text, filename
-             return f"[Unsupported Word Doc: {filename} - Conversion not implemented]", filename # Temporary
-         else:
-             # For other unsupported types, return a marker
-             print(f"Unsupported file type: {mime_type} for {filename}. Skipping content.")
-             return f"[Unsupported file type: {mime_type} - {filename}]", filename
-
-     except Exception as e:
-         print(f"Error converting file {filename}: {e}")
-         return f"[Error converting file: {filename}]", filename
-
- def prepare_gemini_input(prompt, files):
-     """Prepares the input list for Gemini, handling text and images."""
-     gemini_parts = []
-     if prompt:
-         gemini_parts.append(prompt)
-
-     if files:
-         for file_obj in files:
-             file_path = file_obj.name
-             mime_type = get_mime_type(file_path)
-             filename = os.path.basename(file_path)
-
-             print(f"Preparing file for Gemini: {filename}, MIME: {mime_type}")
-
-             if mime_type and mime_type.startswith("image/"):
-                 try:
-                     img = Image.open(file_path)
-                     # Convert image to bytes (e.g., PNG or JPEG)
-                     # Gemini API directly accepts PIL Images usually
-                     gemini_parts.append(img)
-                     print(f"Added image: {filename}")
-                 except Exception as e:
-                     print(f"Error processing image {filename}: {e}")
-                     gemini_parts.append(f"[Error processing image: {filename}]")
-             elif mime_type and mime_type.startswith("video/"): # Gemini 1.5 Pro can handle video
-                 # Upload file via File API first (more complex, needs google.ai.generativelanguage)
-                 # For simplicity here, we'll just note it's a video
-                 # or provide a basic text representation if conversion isn't implemented
-                 print(f"Video file detected: {filename}. Full video processing requires File API.")
-                 gemini_parts.append(f"[Video file: {filename} - Requires File API upload]")
-                 # Placeholder: Add text conversion if feasible for your use case
-                 # text_content, _ = convert_file_to_text(file_obj)
-                 # if text_content:
-                 #     gemini_parts.append(f"--- Content of video file {filename} (extracted as text) ---\n{text_content}")
-
-             elif mime_type and mime_type.startswith("audio/"): # Gemini 1.5 Pro can handle audio
-                 print(f"Audio file detected: {filename}. Full audio processing requires File API.")
-                 gemini_parts.append(f"[Audio file: {filename} - Requires File API upload]")
-                 # Placeholder: Add text conversion if feasible (e.g. transcript)
-                 # text_content, _ = convert_file_to_text(file_obj) # Needs specific audio-to-text logic
-                 # if text_content:
-                 #     gemini_parts.append(f"--- Content of audio file {filename} (extracted as text) ---\n{text_content}")
-
-             else: # Assume text or convertible to text
-                 text_content, original_filename = convert_file_to_text(file_obj)
-                 if text_content:
-                     # Add context marker
-                     gemini_parts.append(f"\n--- Content from file: {original_filename} ---\n{text_content}\n--- End of file: {original_filename} ---")
-                 else:
-                     gemini_parts.append(f"[Could not process file: {original_filename}]")
-
-     # Ensure there's at least one part (maybe an empty string if only files were given?)
-     if not gemini_parts:
-         gemini_parts.append("") # Avoid sending empty list
-
-     return gemini_parts
-
-
- # --- Gradio UI Functions ---
-
  def validate_api_key(api_key):
-     """Checks if the API key is potentially valid by trying to list models."""
-     if not api_key:
-         return "<p style='color: orange;'>Please enter an API Key.</p>"
      try:
-         genai.configure(api_key=api_key)
-         models = genai.list_models()
-         # Check if at least one desired model is available with this key
-         available_core_models = [m.name for m in models if 'generateContent' in m.supported_generation_methods]
-         if any(model_name.split('/')[-1] in AVAILABLE_MODELS for model_name in available_core_models):
-             return "<p style='color: green;'>API Key seems valid (can list models).</p>"
-         else:
-             return "<p style='color: orange;'>API Key is valid but might not have access to the required Gemini models.</p>"
-
      except Exception as e:
-         print(f"API Key validation error: {e}")
-         # Be careful not to leak too much error detail
-         if "API key not valid" in str(e):
-             return "<p style='color: red;'>API Key is invalid.</p>"
          else:
-             return f"<p style='color: red;'>API Key validation failed. Error: {str(e)}</p>"
-
-
- def update_parameter_visibility(model_name):
-     """Updates visibility and values of parameter controls based on selected model."""
-     updates = {}
-     params_for_model = MODEL_PARAMS.get(model_name, {})
-
-     # Define ALL possible parameter components used across models
-     all_param_keys = set(k for params in MODEL_PARAMS.values() for k in params)
-
-     for key in all_param_keys:
-         param_config = params_for_model.get(key)
-         if param_config:
-             # Parameter exists for this model: make visible and set defaults
-             updates[param_elements[key]] = gr.update(
-                 visible=True,
-                 label=key.replace("_", " ").title(), # Nicer label
-                 value=param_config.get("default") # Set default value
-                 # Add specific updates for slider ranges etc. if needed
-                 # minimum=param_config.get("min"),
-                 # maximum=param_config.get("max"),
-                 # step=param_config.get("step")
-             )
-         else:
-             # Parameter does NOT exist for this model: hide it
-             updates[param_elements[key]] = gr.update(visible=False, value=None) # Reset value when hiding
-
-     return updates
-
-
- def handle_chat(api_key, model_name, history, message, files, *params_tuple):
-     """Handles the chat interaction."""
-     # 1. Basic Validation
-     if not api_key:
-         gr.Warning("Gemini API Key is missing!")
-         return history, "" # Return unchanged history and empty textbox
-     if not message and not files:
-         gr.Warning("Please enter a message or upload files.")
-         return history, ""
-
-     # 2. Configure API Key
-     try:
-         genai.configure(api_key=api_key)
-     except Exception as e:
-         gr.Error(f"Failed to configure API Key: {e}")
-         return history, message # Keep message in textbox for retry
-
-     # 3. Prepare Generation Config from *params_tuple
-     param_keys = [key for key, config in MODEL_PARAMS.get(model_name, {}).items()]
-     generation_config_dict = {}
-     if len(params_tuple) == len(param_keys):
-         generation_config_dict = {key: val for key, val in zip(param_keys, params_tuple) if val is not None}
-         # Handle stop sequences (expecting comma-separated string)
-         if 'stop_sequences' in generation_config_dict and isinstance(generation_config_dict['stop_sequences'], str):
-             sequences = [s.strip() for s in generation_config_dict['stop_sequences'].split(',') if s.strip()]
-             if sequences:
-                 generation_config_dict['stop_sequences'] = sequences
-             else:
-                 del generation_config_dict['stop_sequences'] # Remove if empty/invalid
-         print(f"Using Generation Config: {generation_config_dict}") # Debug
      else:
-         print(f"Warning: Mismatch between expected params ({len(param_keys)}) and received params ({len(params_tuple)})")
-
-
-     # 4. Prepare Model Input
-     gemini_input_parts = prepare_gemini_input(message, files)
-     print(f"Prepared Gemini Input Parts: {gemini_input_parts}") # Debugging
-
-     # 5. Initialize Model and Chat
-     try:
-         # Add safety settings if needed/configured
-         # safety_settings = {...}
-         model = genai.GenerativeModel(model_name) #, safety_settings=safety_settings)
-
-         # Convert Gradio history (list of lists) to Gemini format (list of Content objects)
-         gemini_history = []
-         for user_msg, model_msg in history:
-             # Simple text history for now. Need enhancement for multimodal history.
-             if user_msg: gemini_history.append({'role': 'user', 'parts': [user_msg]})
-             if model_msg: gemini_history.append({'role': 'model', 'parts': [model_msg]})
-
-         chat = model.start_chat(history=gemini_history)
-         print(f"Starting chat with history (simplified): {gemini_history}") # Debugging
-
-     except Exception as e:
-         gr.Error(f"Failed to initialize model or chat: {e}")
-         return history, message # Keep message in textbox
-
-     # 6. Send Message and Get Response
-     response_text = ""
-     try:
-         # Use streaming for better UX in chat
-         response = chat.send_message(gemini_input_parts,
-                                      generation_config=genai.types.GenerationConfig(**generation_config_dict),
-                                      stream=True)
-
-         full_response_content = ""
-         for chunk in response:
-             # Check if the chunk has text content
-             if hasattr(chunk, 'text'):
-                 chunk_text = chunk.text
-                 print(f"Stream chunk: {chunk_text}") # Debug stream
-                 full_response_content += chunk_text
-                 # Yield intermediate updates to the chatbot
-                 current_history = history + [[message or "[Input files only]", full_response_content]]
-                 yield current_history, "" # Update chatbot, clear input
-             # Check for image data if model supports it (more complex parsing needed)
-             # elif chunk.parts and chunk.parts[0].inline_data:
-             #     # Handle potential image output - requires modification
-             #     pass
-
-         response_text = full_response_content # Final text response
-
-         # Check for blocked prompts or safety issues
-         if not response_text and response.prompt_feedback.block_reason:
-             block_reason = response.prompt_feedback.block_reason
-             safety_ratings = response.prompt_feedback.safety_ratings
-             gr.Warning(f"Request blocked. Reason: {block_reason}. Ratings: {safety_ratings}")
-             # Append a notice to history instead of an empty response
-             history.append([message or "[Input files only]", f"[Request blocked due to: {block_reason}]"])
-             return history, "" # Clear input box
-
-
-     except Exception as e:
-         gr.Error(f"Error during generation: {e}")
-         # Optionally add the error to history for context
-         history.append([message or "[Input files only]", f"[Error during generation: {str(e)}]"])
-         return history, "" # Clear input box
-
-     # 7. Update History and Clear Input
-     # The yielding above handles intermediate updates. This is the final state.
-     final_history = history + [[message or "[Input files only]", response_text or "[No text content received]"]]
-     return final_history, "" # Final update, clear input
-
-
- def handle_single_response(api_key, model_name, prompt, files, *params_tuple):
-     """Handles the single response interaction."""
-     # 1. Validations
-     if not api_key:
-         gr.Warning("Gemini API Key is missing!")
-         return "[Error: API Key Missing]", None # Text output, Image output
-     if not prompt and not files:
-         gr.Warning("Please enter a prompt or upload files.")
-         return "[Error: No input provided]", None
-
-     # 2. Configure API Key
      try:
-         genai.configure(api_key=api_key)
      except Exception as e:
-         gr.Error(f"Failed to configure API Key: {e}")
-         return f"[Error: API Key Config Failed: {e}]", None
-
-     # 3. Prepare Generation Config
-     param_keys = [key for key, config in MODEL_PARAMS.get(model_name, {}).items()]
-     generation_config_dict = {}
-     if len(params_tuple) == len(param_keys):
-         generation_config_dict = {key: val for key, val in zip(param_keys, params_tuple) if val is not None}
-         # Handle stop sequences
-         if 'stop_sequences' in generation_config_dict and isinstance(generation_config_dict['stop_sequences'], str):
-             sequences = [s.strip() for s in generation_config_dict['stop_sequences'].split(',') if s.strip()]
-             if sequences:
-                 generation_config_dict['stop_sequences'] = sequences
-             else:
-                 del generation_config_dict['stop_sequences']
-         print(f"Using Generation Config: {generation_config_dict}") # Debug
      else:
-         print(f"Warning: Mismatch between expected params ({len(param_keys)}) and received params ({len(params_tuple)})")
-
-
-     # 4. Prepare Model Input
-     gemini_input_parts = prepare_gemini_input(prompt, files)
-     print(f"Prepared Gemini Input Parts: {gemini_input_parts}") # Debugging
-
-
-     # 5. Initialize Model
-     try:
-         # Add safety settings if needed/configured
-         model = genai.GenerativeModel(model_name)
-     except Exception as e:
-         gr.Error(f"Failed to initialize model: {e}")
-         return f"[Error: Model Initialization Failed: {e}]", None
-
-     # 6. Generate Content (Non-streaming for single response usually)
-     output_text = "[No text content generated]"
-     output_image = None # Placeholder for image output
      try:
-         response = model.generate_content(
-             gemini_input_parts,
-             generation_config=genai.types.GenerationConfig(**generation_config_dict),
-             stream=False # Simpler for single turn unless very long output expected
-         )
-
-         # Check for blocked prompts or safety issues
-         if response.prompt_feedback.block_reason:
-             block_reason = response.prompt_feedback.block_reason
-             safety_ratings = response.prompt_feedback.safety_ratings
-             gr.Warning(f"Request blocked. Reason: {block_reason}. Ratings: {safety_ratings}")
-             return f"[Request blocked due to: {block_reason}]", None
-
-         # Process response parts (could contain text and/or images)
-         # This part needs refinement based on how Gemini API returns mixed content
-         # For now, prioritize text and assume first image part if present
-         response_text_parts = []
-         for part in response.parts:
-             if hasattr(part, 'text'):
-                 response_text_parts.append(part.text)
-             elif hasattr(part, 'inline_data') and part.inline_data.mime_type.startswith('image/'):
-                 if output_image is None: # Display the first image found
-                     try:
-                         image_data = part.inline_data.data
-                         img = Image.open(io.BytesIO(image_data))
-                         output_image = img
-                         print("Image received in response.")
-                     except Exception as img_err:
-                         print(f"Error decoding image from response: {img_err}")
-                         response_text_parts.append("[Error decoding image in response]")
-
-         if response_text_parts:
-             output_text = "\n".join(response_text_parts)
-         elif hasattr(response, 'text'): # Fallback if parts parsing fails but text attribute exists
-             output_text = response.text
-
-         # Check if only an image was returned (or intended)
-         if not response_text_parts and output_image is not None:
-             output_text = "[Image generated - see output below]"
-
-
      except Exception as e:
-         gr.Error(f"Error during generation: {e}")
-         output_text = f"[Error during generation: {str(e)}]"
-
-     # 7. Return results
-     return output_text, output_image
-
-
- # --- Build Gradio Interface ---
- with gr.Blocks(theme=gr.themes.Soft()) as demo:
-     gr.Markdown("# Gemini API Interface")
-     gr.Markdown("Interact with Google Gemini models using your own API key. Supports chat, single responses, file uploads, and model-specific parameters.")

      # API Key Section
-     with gr.Row():
-         api_key_input = gr.Textbox(
-             label="Gemini API Key",
-             placeholder="Enter your Gemini API Key here",
-             type="password",
-             scale=3
-         )
-         validate_button = gr.Button("Validate Key", scale=1)
-     api_key_status = gr.Markdown("<p style='color: gray;'>Enter your key and click Validate.</p>")
-
-     # Model Selection
-     model_dropdown = gr.Dropdown(
-         label="Select Gemini Model",
-         choices=AVAILABLE_MODELS,
-         value=AVAILABLE_MODELS[0], # Default model
-     )
-
-     # Dynamic Parameters Section (Initially hidden, updated by model selection)
-     param_elements = {} # Dictionary to hold parameter UI components
-     with gr.Accordion("Model Parameters", open=False) as params_accordion:
-         # Create UI elements for ALL possible parameters defined in MODEL_PARAMS
-         # They will be shown/hidden by the update_parameter_visibility function
-         all_possible_params = set(k for params in MODEL_PARAMS.values() for k in params)
-         for param_name in sorted(list(all_possible_params)): # Sort for consistent order
-             # Determine control type based on the first model that defines it (can be refined)
-             control_type = "textbox" # Default
-             config = {}
-             for model_cfg in MODEL_PARAMS.values():
-                 if param_name in model_cfg:
-                     config = model_cfg[param_name]
-                     control_type = config.get("type", "textbox")
-                     break # Found config for this param
-
-             if control_type == "slider":
-                 param_elements[param_name] = gr.Slider(
-                     label=param_name.replace("_", " ").title(),
-                     minimum=config.get("min", 0),
-                     maximum=config.get("max", 1),
-                     step=config.get("step", 0.1),
-                     value=config.get("default"),
-                     visible=False, # Initially hidden
-                     interactive=True
-                 )
-             elif control_type == "number":
-                 param_elements[param_name] = gr.Number(
-                     label=param_name.replace("_", " ").title(),
-                     minimum=config.get("min", 1),
-                     step=config.get("step", 1),
-                     value=config.get("default"),
-                     visible=False,
-                     interactive=True
-                 )
-             else: # Default to Textbox for stop_sequences etc.
-                 param_elements[param_name] = gr.Textbox(
-                     label=param_name.replace("_", " ").title(),
-                     lines=config.get("lines", 1),
-                     placeholder=config.get("placeholder", ""),
-                     value=config.get("default", ""),
-                     visible=False,
-                     interactive=True
-                 )
-
-     # Pack the parameter components into a list for function inputs/outputs
-     # IMPORTANT: The order here MUST match the order expected by handle_chat/handle_single_response
-     ordered_param_components = [param_elements[key] for key in sorted(param_elements.keys())]
-
-
-     # Main Interaction Area (Tabs)
-     with gr.Tabs():
-         # --- Chat Interface Tab ---
-         with gr.TabItem("Chat Interface"):
-             gr.Markdown("Have a conversation with the selected model. Upload files to include their content.")
-             chat_history_state = gr.State([]) # Holds the conversation history
-             chatbot_display = gr.Chatbot(label="Conversation", height=500)
-             with gr.Row():
-                 chat_file_upload = gr.File(label="Upload Files (Text, Images, etc.)", file_count="multiple")
-             with gr.Row():
-                 chat_message_input = gr.Textbox(label="Your Message", placeholder="Type your message here...", scale=4, lines=3)
-                 chat_submit_button = gr.Button("Send", variant="primary", scale=1)
-             clear_chat_button = gr.Button("Clear Chat History")
-
-
-         # --- Single Response Tab ---
          with gr.TabItem("Single Response"):
-             gr.Markdown("Send a prompt (and optionally files) to get a single response from the model.")
-             with gr.Row():
-                 with gr.Column(scale=2):
-                     single_prompt_input = gr.Textbox(label="Your Prompt", placeholder="Enter your prompt...", lines=5)
-                     single_file_upload = gr.File(label="Upload Files (Text, Images, etc.)", file_count="multiple")
-                     single_submit_button = gr.Button("Generate Response", variant="primary")
-                 with gr.Column(scale=2):
-                     gr.Markdown("**Output:**")
-                     single_output_text = gr.Textbox(label="Text Response", lines=10, interactive=False)
-                     single_output_image = gr.Image(label="Image Response", type="pil", interactive=False) # Display PIL images
-
-
-     # --- Event Wiring ---
-
-     # 1. API Key Validation
-     validate_button.click(
-         fn=validate_api_key,
          inputs=[api_key_input],
-         outputs=[api_key_status]
-     )
-
-     # 2. Update Parameters UI when Model Changes
-     model_dropdown.change(
-         fn=update_parameter_visibility,
-         inputs=[model_dropdown],
-         outputs=list(param_elements.values()) # Pass the actual components
-     )
-
-     # Trigger initial parameter visibility update on load
-     demo.load(
-         fn=update_parameter_visibility,
-         inputs=[model_dropdown],
-         outputs=list(param_elements.values())
-     )
-
-     # 3. Chat Submission Logic (using .then() for streaming if possible, or standard submit)
-     # Note: Gradio streaming with gr.Chatbot often uses yields
-     chat_submit_button.click(
-         fn=handle_chat,
-         inputs=[
-             api_key_input,
-             model_dropdown,
-             chat_history_state,
-             chat_message_input,
-             chat_file_upload
-         ] + ordered_param_components, # Add dynamic params
-         outputs=[chatbot_display, chat_message_input] # Update chatbot, clear input box
-     ).then(
-         # Update the state *after* the response is fully generated
-         lambda history: history, # Simple pass-through to get final history
-         inputs=chatbot_display,
-         outputs=chat_history_state
      )
-     # Allow submitting chat by pressing Enter in the textbox
-     chat_message_input.submit(
-         fn=handle_chat,
-         inputs=[
-             api_key_input,
-             model_dropdown,
-             chat_history_state,
-             chat_message_input,
-             chat_file_upload
-         ] + ordered_param_components,
-         outputs=[chatbot_display, chat_message_input]
-     ).then(
-         lambda history: history,
-         inputs=chatbot_display,
-         outputs=chat_history_state
-     )
-
-
-     # 4. Clear Chat Logic
-     def clear_chat_history_func():
-         return [], [] # Clears chatbot display and history state
-
-     clear_chat_button.click(
-         fn=clear_chat_history_func,
-         inputs=[],
-         outputs=[chatbot_display, chat_history_state]
      )
-
-     # 5. Single Response Submission Logic
-     single_submit_button.click(
-         fn=handle_single_response,
-         inputs=[
-             api_key_input,
-             model_dropdown,
-             single_prompt_input,
-             single_file_upload
-         ] + ordered_param_components, # Add dynamic params
-         outputs=[single_output_text, single_output_image]
      )

-
- # Launch the Gradio app
- if __name__ == "__main__":
-     demo.launch(debug=True) # Set debug=False for deployment
 
  import gradio as gr
+ import google.genai as genai
  from PIL import Image
+ import os
+ import textract
+
+ # List of available models (including experimental and recent ones)
+ models = [
+     "gemini-2.5-flash-preview-04-17",
+     "gemini-2.5-pro-preview-03-25",
+     "gemini-2.0-flash",
+     "gemini-2.0-flash-lite",
+     "gemini-2.0-flash-thinking-exp-01-21",
+     "gemini-1.5-pro",
+     "gemini-2.0-flash-exp-image-generation"
  ]

+ # Model types for handling inputs
+ model_types = {
+     "gemini-2.5-flash-preview-04-17": "text",
+     "gemini-2.5-pro-preview-03-25": "text",
+     "gemini-2.0-flash": "text",
+     "gemini-2.0-flash-lite": "text",
+     "gemini-2.0-flash-thinking-exp-01-21": "text",
+     "gemini-1.5-pro": "text",
+     "gemini-2.0-flash-exp-image-generation": "multimodal"
  }

+ # Function to validate API key
  def validate_api_key(api_key):
      try:
+         client = genai.Client(api_key=api_key)
+         client.models.list() # Validate by attempting to list models
+         return True, "API Key is valid."
      except Exception as e:
+         return False, f"Invalid API Key: {str(e)}"
+
+ # Function to process uploaded files
+ def process_files(files, model_type):
+     inputs = []
+     for file_path in files:
+         if model_type == "multimodal" and file_path.lower().endswith(('.png', '.jpg', '.jpeg', '.gif', '.bmp')):
+             img = Image.open(file_path)
+             inputs.append(img)
          else:
+             try:
+                 text = textract.process(file_path).decode('utf-8')
+                 inputs.append(text)
+             except Exception as e:
+                 inputs.append(f"Error extracting text from {os.path.basename(file_path)}: {str(e)}")
+     return inputs
+
+ # Chat submit function
+ def chat_submit_func(message, files, chat_history, model, temperature, top_p, max_tokens, api_key):
+     client = genai.Client(api_key=api_key)
+
+     # Prepare inputs
+     if model_types[model] == "text" and files:
+         chat_history.append((message, "Warning: Files are not supported for text-only models. Converting to text where possible."))
+         processed_inputs = process_files(files, "text")
+         inputs = [message] + processed_inputs
      else:
+         processed_inputs = process_files(files, model_types[model]) if files else []
+         inputs = [message] + processed_inputs
+
+     # Generation configuration
+     generation_config = {
+         "temperature": temperature,
+         "top_p": top_p,
+         "max_output_tokens": max_tokens,
+     }
+
      try:
+         # Generate through the client; client.models.get() only returns model metadata
+         response = client.models.generate_content(model=model, contents=inputs, config=generation_config)
+         response_text = ""
+         response_images = []
+
+         # Parse response
+         for candidate in response.candidates:
+             for part in candidate.content.parts:
+                 if hasattr(part, 'text') and part.text:
+                     response_text += part.text
+                 elif hasattr(part, 'file_data') and part.file_data:
+                     # Assuming file_data provides a URI; adjust if the model returns inline bytes instead
+                     image_url = part.file_data.file_uri
+                     response_images.append(image_url)
+
+         # Update chat history
+         user_message = message
+         if files:
+             user_message += "\nFiles: " + ", ".join([os.path.basename(f) for f in files])
+         chat_history.append((user_message, None))
+
+         bot_message = response_text
+         if response_images:
+             bot_message += "\n" + "\n".join([f"![image]({img})" for img in response_images])
+         chat_history.append((None, bot_message))
+
+         return chat_history, ""
      except Exception as e:
+         chat_history.append((message, f"Error: {str(e)}"))
+         return chat_history, ""
+
+ # Single response submit function
+ def single_submit_func(prompt, files, model, temperature, top_p, max_tokens, api_key):
+     client = genai.Client(api_key=api_key)
+
+     # Prepare inputs
+     if model_types[model] == "text" and files:
+         processed_inputs = process_files(files, "text")
+         inputs = [prompt] + processed_inputs
+         warning = "Warning: Files converted to text for text-only model."
      else:
+         processed_inputs = process_files(files, model_types[model]) if files else []
+         inputs = [prompt] + processed_inputs
+         warning = ""
+
+     # Generation configuration
+     generation_config = {
+         "temperature": temperature,
+         "top_p": top_p,
+         "max_output_tokens": max_tokens,
+     }
+
      try:
+         # Generate through the client; client.models.get() only returns model metadata
+         response = client.models.generate_content(model=model, contents=inputs, config=generation_config)
+         response_text = warning
+         response_images = []
+
+         # Parse response
+         for candidate in response.candidates:
+             for part in candidate.content.parts:
+                 if hasattr(part, 'text') and part.text:
+                     response_text += part.text
+                 elif hasattr(part, 'file_data') and part.file_data:
+                     image_url = part.file_data.file_uri
+                     response_images.append(image_url)
+
+         return response_text, response_images
      except Exception as e:
+         return f"Error: {str(e)}", []

+ # Gradio interface
+ with gr.Blocks(title="Gemini API Interface") as app:
      # API Key Section
+     api_key_input = gr.Textbox(label="Gemini API Key", type="password", placeholder="Enter your Gemini API Key")
+     validate_btn = gr.Button("Validate API Key")
+     key_status = gr.Textbox(label="API Key Status", interactive=False)
+     key_validated = gr.State(False)
+
+     # Model and Parameters Section (hidden until key is validated)
+     with gr.Group(visible=False) as config_group:
+         model_selector = gr.Dropdown(choices=models, label="Select Model", value=models[0])
+         temperature = gr.Slider(0, 1, value=0.7, label="Temperature", step=0.01)
+         top_p = gr.Slider(0, 1, value=0.9, label="Top P", step=0.01)
+         max_tokens = gr.Number(value=512, label="Max Tokens", minimum=1)
+
+     # Tabs for Chat and Single Response (hidden until key is validated)
+     with gr.Tabs(visible=False) as tabs:
+         with gr.TabItem("Chat"):
+             chat_display = gr.Chatbot(label="Chat History")
+             chat_input = gr.Textbox(label="Your Message", placeholder="Type your message here...")
+             chat_files = gr.File(label="Upload Files", file_count="multiple")
+             chat_submit_btn = gr.Button("Send")
+             chat_status = gr.Textbox(label="Status", interactive=False)
+
          with gr.TabItem("Single Response"):
+             single_input = gr.Textbox(label="Prompt", placeholder="Enter your prompt here...")
+             single_files = gr.File(label="Upload Files", file_count="multiple")
+             single_submit_btn = gr.Button("Generate")
+             single_text_output = gr.Textbox(label="Response Text", interactive=False)
+             single_image_output = gr.Gallery(label="Response Images")
+
+     # Validation logic
+     def on_validate_key(api_key):
+         is_valid, status = validate_api_key(api_key)
+         if is_valid:
+             return status, True, gr.update(visible=True), gr.update(visible=True)
+         return status, False, gr.update(visible=False), gr.update(visible=False)
+
+     validate_btn.click(
+         on_validate_key,
          inputs=[api_key_input],
+         outputs=[key_status, key_validated, config_group, tabs]
      )
+
+     # Chat submission
+     chat_submit_btn.click(
+         chat_submit_func,
+         inputs=[chat_input, chat_files, chat_display, model_selector, temperature, top_p, max_tokens, api_key_input],
+         outputs=[chat_display, chat_status]
      )
+
+     # Single response submission
+     single_submit_btn.click(
+         single_submit_func,
+         inputs=[single_input, single_files, model_selector, temperature, top_p, max_tokens, api_key_input],
+         outputs=[single_text_output, single_image_output]
      )
+ app.launch()
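
A note on the image-handling branch in the new code: part.file_data is only populated for file-backed content and exposes a file_uri rather than a raw URL, while gemini-2.0-flash-exp-image-generation typically returns generated images inline, as raw bytes in part.inline_data. Below is a minimal sketch of decoding such inline parts into PIL images (a list gr.Gallery accepts), assuming the google-genai response layout used above; the helper name extract_inline_images and the response_modalities setting are illustrative assumptions, not part of the committed code.

import io
from PIL import Image

def extract_inline_images(response):
    """Collect PIL images from inline_data parts of a generate_content response."""
    images = []
    for candidate in response.candidates:
        for part in candidate.content.parts:
            blob = getattr(part, "inline_data", None)  # Blob carrying mime_type and raw bytes
            if blob and blob.mime_type and blob.mime_type.startswith("image/"):
                images.append(Image.open(io.BytesIO(blob.data)))
    return images

# Usage sketch, reusing a client as in the functions above:
# client = genai.Client(api_key=api_key)
# response = client.models.generate_content(
#     model="gemini-2.0-flash-exp-image-generation",
#     contents=["Draw a red bicycle"],
#     config={"response_modalities": ["TEXT", "IMAGE"]},  # assumption: this model wants image output requested explicitly
# )
# images = extract_inline_images(response)  # suitable as a gr.Gallery value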