Spaces:

swaptr
/

image-captioning

Runtime error

swaptr committed on May 26, 2023

Commit

44eade1

•

1 Parent(s): f3f75c4

add code for image captioning

Files changed (9) hide show

README.md CHANGED Viewed

@@ -1,5 +1,5 @@
 ---
-title: Text Captioning
 emoji: 💻
 colorFrom: purple
 colorTo: green
@@ -9,4 +9,6 @@ app_file: app.py
 pinned: false
 ---
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

 ---
+title: Image Captioning
 emoji: 💻
 colorFrom: purple
 colorTo: green
 pinned: false
 ---
+Image Captioning
+This Space contains the code for image captioning. Upload an image and the system will generate a caption for it.

app.py ADDED Viewed

+import pandas as pd
+import gradio as gr
+import torch
+from torch.nn import functional as F
+from transformers import AutoTokenizer, ViTFeatureExtractor, VisionEncoderDecoderModel
+# Device used for inference; the model below and the pixel tensors built in
+# predict() are both moved to it.
+device="cpu"
+# Image preprocessor, tokenizer and encoder-decoder model are all loaded from
+# the same "nlpconnect/vit-gpt2-image-captioning" checkpoint.
+feature_extractor = ViTFeatureExtractor.from_pretrained("nlpconnect/vit-gpt2-image-captioning")
+# NOTE(review): "cat_tokenizer" is presumably a typo for "cap_tokenizer"; it is
+# the tokenizer predict() uses to decode generated caption ids.
+cat_tokenizer = AutoTokenizer.from_pretrained("nlpconnect/vit-gpt2-image-captioning")
+cap_model = VisionEncoderDecoderModel.from_pretrained("nlpconnect/vit-gpt2-image-captioning").to(device)
+def predict(image, max_length=64, num_beams=4):
+ image = image.convert('RGB')
+ image = feature_extractor(image, return_tensors="pt").pixel_values.to(device)
+ clean_text = lambda x: x.replace('<|endoftext|>','').split('\n')[0]
+ caption_ids = cap_model.generate(image, max_length=max_length)[0]
+ caption_text = clean_text(cat_tokenizer.decode(caption_ids))
+ return caption_text
+input = gr.components.Image(label="Upload Image", type = 'pil')
+caption = gr.components.Textbox(type="text", label="Captions")
+examples = [f"e{i}.jpg" for i in range(1,7)]
+title = "Image Caption"
+description = "Made by: Swapnil Tripathi"
+interface = gr.Interface(
+ fn=predict,
+ description=description,
+ inputs=input,
+ theme=gr.themes.Default(
+ primary_hue=gr.themes.colors.orange,
+ secondary_hue=gr.themes.colors.slate
+ ),
+ outputs=caption,
+ examples=examples,
+ title=title,
+)
+interface.launch(debug=True)

e1.jpg ADDED Viewed

e2.jpg ADDED Viewed

e3.jpg ADDED Viewed

e4.jpg ADDED Viewed

e5.jpg ADDED Viewed

e6.jpg ADDED Viewed

requirements.txt ADDED Viewed