Update main.py
main.py
CHANGED
@@ -43,6 +43,7 @@ def generate_caption(processor, model, image, tokenizer=None):
 
     return generated_caption
 
+
 def generate_captions(image):
     caption_git_base = generate_caption(git_processor_base, git_model_base, image)
 
@@ -56,56 +57,21 @@ def generate_captions(image):
 
     return caption_git_base, caption_git_large, caption_blip_base, caption_blip_large, caption_vitgpt
 
-
-
+
+#examples = [["cats.jpg"], ["stop_sign.png"], ["astronaut.jpg"]]
+outputs = [gr.outputs.Textbox(label="Caption generated by GIT-base"), gr.outputs.Textbox(label="Caption generated by GIT-large"), gr.outputs.Textbox(label="Caption generated by BLIP-base"), gr.outputs.Textbox(label="Caption generated by BLIP-large"), gr.outputs.Textbox(label="Caption generated by ViT+GPT-2")]
 
 title = "Interactive demo: comparing image captioning models"
 description = "Gradio Demo to compare GIT, BLIP and ViT+GPT2, 3 state-of-the-art vision+language models. To use it, simply upload your image and click 'submit', or click one of the examples to load them. Read more at the links below."
 article = "<p style='text-align: center'><a href='https://huggingface.co/docs/transformers/main/model_doc/blip' target='_blank'>BLIP docs</a> | <a href='https://huggingface.co/docs/transformers/main/model_doc/git' target='_blank'>GIT docs</a></p>"
 
-css = """
-body {
-    background-color: #f2f2f2;
-    font-family: Arial, sans-serif;
-}
-
-.title {
-    color: #333333;
-    font-size: 24px;
-    font-weight: bold;
-    margin-bottom: 20px;
-}
-
-.description {
-    color: #666666;
-    font-size: 16px;
-    margin-bottom: 20px;
-}
-
-.article {
-    color: #666666;
-    font-size: 14px;
-    margin-bottom: 20px;
-    text-align: center;
-}
-
-.input {
-    margin-bottom: 20px;
-}
-
-.output {
-    margin-bottom: 20px;
-}
-"""
-
-iface = gr.Interface(fn=generate_captions,
+iface = gr.Interface(fn=generate_captions,
                      inputs=gr.inputs.Image(type="pil"),
                      outputs=outputs,
-                     examples=examples,
+                     examples=examples,
                      title=title,
                      description=description,
-                     article=article,
-                     css=css,
+                     article=article,
                      enable_queue=True)
 iface.launch(server_name="0.0.0.0", server_port=7860)
 
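Aside (not part of this commit): the updated main.py still uses the legacy gr.inputs / gr.outputs namespaces and the enable_queue argument, which newer Gradio releases no longer accept. A minimal sketch of the same Interface against the current component API could look roughly like the code below; generate_captions, title, description and article are assumed to be defined earlier in main.py as in the diff, and examples is dropped because this change comments out the #examples list.

import gradio as gr

# Sketch only, assuming a recent Gradio release and that generate_captions,
# title, description and article are defined earlier in main.py as shown above.
outputs = [
    gr.Textbox(label="Caption generated by GIT-base"),
    gr.Textbox(label="Caption generated by GIT-large"),
    gr.Textbox(label="Caption generated by BLIP-base"),
    gr.Textbox(label="Caption generated by BLIP-large"),
    gr.Textbox(label="Caption generated by ViT+GPT-2"),
]

iface = gr.Interface(
    fn=generate_captions,
    inputs=gr.Image(type="pil"),  # replaces gr.inputs.Image
    outputs=outputs,              # plain gr.Textbox instead of gr.outputs.Textbox
    title=title,
    description=description,
    article=article,
)

iface.queue()  # replaces the enable_queue=True keyword
iface.launch(server_name="0.0.0.0", server_port=7860)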