Update app.py
Browse files
app.py
CHANGED
@@ -170,7 +170,7 @@ def main():
|
|
170 |
model = AutoModelForVision2Seq.from_pretrained(ckpt, trust_remote_code=True).to("cuda")
|
171 |
processor = AutoProcessor.from_pretrained(ckpt, trust_remote_code=True)
|
172 |
|
173 |
-
def generate_predictions(image_input, text_input, do_sample, sampling_topp, sampling_temperature):
|
174 |
|
175 |
# Save the image and load it again to match the original Kosmos-2 demo.
|
176 |
# (https://github.com/microsoft/unilm/blob/f4695ed0244a275201fff00bee495f76670fbe70/kosmos-2/demo/gradio_app.py#L345-L346)
|
@@ -252,10 +252,6 @@ def main():
|
|
252 |
with gr.Column():
|
253 |
image_input = gr.Image(type="pil", label="Test Image")
|
254 |
text_input = gr.Radio(["Brief", "Detailed"], label="Description Type", value="Brief")
|
255 |
-
do_sample = gr.Checkbox(label="Enable Sampling", info="(Please enable it before adjusting sampling parameters below)", value=False)
|
256 |
-
with gr.Accordion("Sampling parameters", open=False) as sampling_parameters:
|
257 |
-
sampling_topp = gr.Slider(minimum=0.1, maximum=1, step=0.01, value=0.9, label="Sampling: Top-P")
|
258 |
-
sampling_temperature = gr.Slider(minimum=0.1, maximum=1, step=0.01, value=0.7, label="Sampling: Temperature")
|
259 |
|
260 |
run_button = gr.Button(label="Run", visible=True)
|
261 |
|
@@ -270,16 +266,16 @@ def main():
|
|
270 |
with gr.Row():
|
271 |
with gr.Column():
|
272 |
gr.Examples(examples=[
|
273 |
-
["images/two_dogs.jpg", "Detailed"
|
274 |
-
["images/snowman.png", "Brief"
|
275 |
-
["images/man_ball.png", "Detailed"
|
276 |
-
], inputs=[image_input, text_input
|
277 |
with gr.Column():
|
278 |
gr.Examples(examples=[
|
279 |
-
["images/six_planes.png", "Brief"
|
280 |
-
["images/quadrocopter.jpg", "Brief"
|
281 |
-
["images/carnaby_street.jpg", "Brief"
|
282 |
-
], inputs=[image_input, text_input
|
283 |
gr.Markdown(term_of_use)
|
284 |
|
285 |
# record which text span (label) is selected
|
@@ -304,7 +300,7 @@ def main():
|
|
304 |
selected.change(update_output_image, [image_input, image_output, entity_output, selected], [image_output])
|
305 |
|
306 |
run_button.click(fn=generate_predictions,
|
307 |
-
inputs=[image_input, text_input, do_sample, sampling_topp, sampling_temperature],
|
308 |
outputs=[image_output, text_output1, entity_output],
|
309 |
show_progress=True, queue=True)
|
310 |
|
|
|
170 |
model = AutoModelForVision2Seq.from_pretrained(ckpt, trust_remote_code=True).to("cuda")
|
171 |
processor = AutoProcessor.from_pretrained(ckpt, trust_remote_code=True)
|
172 |
|
173 |
+
def generate_predictions(image_input, text_input):
|
174 |
|
175 |
# Save the image and load it again to match the original Kosmos-2 demo.
|
176 |
# (https://github.com/microsoft/unilm/blob/f4695ed0244a275201fff00bee495f76670fbe70/kosmos-2/demo/gradio_app.py#L345-L346)
|
|
|
252 |
with gr.Column():
|
253 |
image_input = gr.Image(type="pil", label="Test Image")
|
254 |
text_input = gr.Radio(["Brief", "Detailed"], label="Description Type", value="Brief")
|
|
|
|
|
|
|
|
|
255 |
|
256 |
run_button = gr.Button(label="Run", visible=True)
|
257 |
|
|
|
266 |
with gr.Row():
|
267 |
with gr.Column():
|
268 |
gr.Examples(examples=[
|
269 |
+
["images/two_dogs.jpg", "Detailed"],
|
270 |
+
["images/snowman.png", "Brief"],
|
271 |
+
["images/man_ball.png", "Detailed"],
|
272 |
+
], inputs=[image_input, text_input])
|
273 |
with gr.Column():
|
274 |
gr.Examples(examples=[
|
275 |
+
["images/six_planes.png", "Brief"],
|
276 |
+
["images/quadrocopter.jpg", "Brief"],
|
277 |
+
["images/carnaby_street.jpg", "Brief"],
|
278 |
+
], inputs=[image_input, text_input])
|
279 |
gr.Markdown(term_of_use)
|
280 |
|
281 |
# record which text span (label) is selected
|
|
|
300 |
selected.change(update_output_image, [image_input, image_output, entity_output, selected], [image_output])
|
301 |
|
302 |
run_button.click(fn=generate_predictions,
|
303 |
+
inputs=[image_input, text_input],
|
304 |
outputs=[image_output, text_output1, entity_output],
|
305 |
show_progress=True, queue=True)
|
306 |
|