Spaces:

arad1367
/

GroqLLaVAMA_Econometrics_Agent

App Files Files Community

arad1367 committed on Sep 7

Commit

9e1902c

•

1 Parent(s): e7a21bc

Update app.py

Browse files

Files changed (1) hide show

app.py +7 -12

app.py CHANGED Viewed

@@ -1,25 +1,18 @@
-# 1. Imports and API setup
-import spaces
 import gradio as gr
 from groq import Groq
 import base64
 import os
-import subprocess
 # Define models used in the process
 llava_model = 'llava-v1.5-7b-4096-preview'
 llama31_model = 'llama-3.1-70b-versatile'
-# Install flash-attn if not already installed
-subprocess.run('pip install flash-attn --no-build-isolation', env={'FLASH_ATTENTION_SKIP_CUDA_BUILD': "TRUE"}, shell=True)
 # Image encoding function
 def encode_image(image_path):
     """Return the contents of the file at ``image_path`` as base64 text.

     The file is opened in binary mode and read in full; the base64 bytes
     are then decoded as UTF-8 so the caller receives a ``str``.
     """
     with open(image_path, "rb") as handle:
         raw_bytes = handle.read()
     encoded = base64.b64encode(raw_bytes)
     return encoded.decode('utf-8')
 # Image to text function
-@spaces.GPU()
 def image_to_text(client, model, base64_image, prompt):
     try:
         chat_completion = client.chat.completions.create(
@@ -46,7 +39,6 @@ def image_to_text(client, model, base64_image, prompt):
         return f"Error generating text from image: {str(e)}"
 # Technical review generation function
-@spaces.GPU()
 def technical_review_generation(client, image_description):
     keywords = ["econometrics", "finance", "marketing", "stock", "prediction", "chart", "graph", "time series"]
     if not any(keyword in image_description.lower() for keyword in keywords):
@@ -72,6 +64,7 @@ def technical_review_generation(client, image_description):
 # Main function for Gradio interface
 def process_image(api_key, image, prompt="Describe this image in detail."):
     try:
         os.environ["GROQ_API_KEY"] = api_key
         client = Groq()  # Initialize the Groq client with the provided key
@@ -94,6 +87,7 @@ def process_image(api_key, image, prompt="Describe this image in detail."):
     # Return both image description and the econometrics report
     return f"--- Image Description ---\n{image_description}", f"--- GroqLLaVA EconoMind Report ---\n{report}"
 css = """
     #title, #description {
         text-align: center;
@@ -121,7 +115,9 @@ css = """
 """
 # Gradio Interface
 def gradio_interface():
     footer = """
     <div id="footer">
         <a href="https://www.linkedin.com/in/pejman-ebrahimi-4a60151a7/" target="_blank">LinkedIn</a> |
@@ -140,7 +136,7 @@ def gradio_interface():
         with gr.Row():
             api_key_input = gr.Textbox(label="GROQ API Key", placeholder="Enter your GROQ API Key", type="password")
         with gr.Row():
-            image_input = gr.Image(type="filepath", label="Upload an Image")  # Changed type to 'filepath'
         with gr.Row():
             report_button = gr.Button("Generate Report")
         with gr.Row():
@@ -169,8 +165,7 @@ def gradio_interface():
                 outputs=[api_key_input, image_input, output_description, output_report]
             )
-    # Launch the interface
-    demo.launch()
 # Start the Gradio interface
-gradio_interface()

 import gradio as gr
 from groq import Groq
 import base64
 import os
 # Define models used in the process
 llava_model = 'llava-v1.5-7b-4096-preview'
 llama31_model = 'llama-3.1-70b-versatile'
 # Image encoding function
 def encode_image(image_path):
     """Load a file from disk and hand back its base64 representation.

     Reads the whole file as raw bytes, base64-encodes them, and decodes
     the result as UTF-8 so a plain ``str`` is returned.
     """
     with open(image_path, "rb") as source:
         payload = source.read()
     b64_bytes = base64.b64encode(payload)
     return b64_bytes.decode('utf-8')
 # Image to text function
 def image_to_text(client, model, base64_image, prompt):
     try:
         chat_completion = client.chat.completions.create(
         return f"Error generating text from image: {str(e)}"
 # Technical review generation function
 def technical_review_generation(client, image_description):
     keywords = ["econometrics", "finance", "marketing", "stock", "prediction", "chart", "graph", "time series"]
     if not any(keyword in image_description.lower() for keyword in keywords):
 # Main function for Gradio interface
 def process_image(api_key, image, prompt="Describe this image in detail."):
+    # Set the API key
     try:
         os.environ["GROQ_API_KEY"] = api_key
         client = Groq()  # Initialize the Groq client with the provided key
     # Return both image description and the econometrics report
     return f"--- Image Description ---\n{image_description}", f"--- GroqLLaVA EconoMind Report ---\n{report}"
+# Define CSS for centering elements and footer styling
 css = """
     #title, #description {
         text-align: center;
 """
 # Gradio Interface
+@gr.load(src="zerogpu")
 def gradio_interface():
+    # Define the footer HTML
     footer = """
     <div id="footer">
         <a href="https://www.linkedin.com/in/pejman-ebrahimi-4a60151a7/" target="_blank">LinkedIn</a> |
         with gr.Row():
             api_key_input = gr.Textbox(label="GROQ API Key", placeholder="Enter your GROQ API Key", type="password")
         with gr.Row():
+            image_input = gr.Image(type="filepath", label="Upload an Image")
         with gr.Row():
             report_button = gr.Button("Generate Report")
         with gr.Row():
                 outputs=[api_key_input, image_input, output_description, output_report]
             )
+    return demo
 # Start the Gradio interface
+app = gradio_interface()