Spaces:
Running
Running
Commit
·
b60841d
1
Parent(s):
5c2c847
added ultralytics
Browse files
app.py
CHANGED
@@ -91,7 +91,8 @@ def main():
|
|
91 |
st.session_state.visibility = "visible"
|
92 |
|
93 |
st.title("Computer Vision Agent :sunglasses:")
|
94 |
-
st.markdown("Use the CV agent to do Object Detection
|
|
|
95 |
st.markdown(
|
96 |
"""
|
97 |
<style>
|
@@ -107,12 +108,13 @@ def main():
|
|
107 |
st.header("About Project")
|
108 |
st.markdown(
|
109 |
"""
|
110 |
-
- Agent
|
111 |
-
- This application uses multiple tools like Image caption tool, DuckDuckGo search tool, Maskformer tool ,
|
|
|
112 |
""")
|
113 |
st.sidebar.subheader("Upload Image !")
|
114 |
option = st.sidebar.selectbox(
|
115 |
-
"Select
|
116 |
"gemma2-9b-it",
|
117 |
"llama-3.2-3b-preview",
|
118 |
"llama-3.2-1b-preview",
|
|
|
91 |
st.session_state.visibility = "visible"
|
92 |
|
93 |
st.title("Computer Vision Agent :sunglasses:")
|
94 |
+
st.markdown("Use the CV agent to do Object Detection , Panoptic Segementation,Image Segmentation , Image Descrption task using the latest foundation models available opensource.")
|
95 |
+
st.markdown('The CV Agent implements an Agent that decide what and when to use to provide the information related to the image asked my the user.')
|
96 |
st.markdown(
|
97 |
"""
|
98 |
<style>
|
|
|
108 |
st.header("About Project")
|
109 |
st.markdown(
|
110 |
"""
|
111 |
+
- CV Agent can perform check on images to detemine the image quality and can also find out the segementaion mask and panoptic mask .
|
112 |
+
- This application uses multiple tools like Image caption tool, DuckDuckGo search tool, Maskformer tool , Panoptic segementation tool to perform these tasks.
|
113 |
+
- The decision on how to use the certain tool and when to use it soely relies on the Reasoning power of the LLM.
|
114 |
""")
|
115 |
st.sidebar.subheader("Upload Image !")
|
116 |
option = st.sidebar.selectbox(
|
117 |
+
"Select your Large Language Model(LLM) ",("deepseek-r1-distill-llama-70b",
|
118 |
"gemma2-9b-it",
|
119 |
"llama-3.2-3b-preview",
|
120 |
"llama-3.2-1b-preview",
|