Info-tools / app.py
Felguk's picture
Update app.py
4d49ad5 verified
raw
history blame contribute delete
7.17 kB
import gradio as gr
from PIL import Image
import requests
from bs4 import BeautifulSoup
import os
import subprocess
from huggingface_hub import ModelCard, SpaceCard, HfApi
# PNG Info Tool
def png_info(file):
img = Image.open(file)
metadata = img.info
metadata_str = "\n".join([f"{key}: {value}" for key, value in metadata.items()])
return metadata_str
# Web Info Tool
def web_info(url):
response = requests.get(url)
soup = BeautifulSoup(response.text, 'html.parser')
title = soup.title.string if soup.title else ""
meta_description = soup.find("meta", attrs={"name": "description"})
description = meta_description["content"] if meta_description else ""
meta_tags = soup.find_all("meta")
headers = {f"h{i}": len(soup.find_all(f"h{i}")) for i in range(1, 7)}
links = [a["href"] for a in soup.find_all("a", href=True)]
basic_info = f"Title: {title}\nDescription: {description}"
html_info = f"Meta Tags: {len(meta_tags)}\nHeaders: {headers}\nLinks: {len(links)}"
return f"{basic_info}\n\nHTML Info:\n{html_info}"
# View Source Info Tool
def view_source_info(url):
if url.startswith("view-source:"):
url = url.replace("view-source:", "").strip()
if not url.startswith(("http://", "https://")):
url = "https://" + url
response = requests.get(url)
return response.text
# Document Info Tool
def document_info(file):
file_extension = os.path.splitext(file.name)[1].lower()
content = ""
preview = None
if file_extension in [".txt", ".md"]:
with open(file.name, "r") as f:
content = f.read()
elif file_extension in [".png", ".jpg", ".jpeg", ".bmp", ".gif"]:
preview = file.name
else:
content = "Unsupported file format"
return content, preview
# Video Info Tool
def video_info(file):
video_display = file
result = subprocess.run(
["ffprobe", "-v", "error", "-show_format", "-show_streams", file],
stdout=subprocess.PIPE,
stderr=subprocess.PIPE,
text=True,
)
return video_display, result.stdout
# Model Info Tool
def model_info(model_id):
try:
card = ModelCard.load(model_id)
api = HfApi()
model_info = api.model_info(model_id)
by = model_info.author if model_info.author else ""
description = card.content if card.content else ""
related_spaces = model_info.siblings
related_spaces = [s.rfilename for s in related_spaces if s.rfilename.endswith(".py")]
related_spaces = "\n".join(related_spaces) if related_spaces else ""
install_instructions = f"pip install transformers\n\n# To use the model:\nfrom transformers import AutoModel, AutoTokenizer\nmodel = AutoModel.from_pretrained('{model_id}')\ntokenizer = AutoTokenizer.from_pretrained('{model_id}')"
return by, description, related_spaces, install_instructions
except Exception:
return "", "", "", ""
# Space Info Tool
def space_info(space_id):
try:
card = SpaceCard.load(space_id)
api = HfApi()
space_info = api.space_info(space_id)
makes = space_info.author if space_info.author else ""
description = card.content if card.content else ""
code_files = space_info.siblings
code_files = [s.rfilename for s in code_files if s.rfilename.endswith(".py")]
code = "\n".join(code_files) if code_files else ""
return makes, code, description
except Exception:
return "", "", ""
# Gradio Interface
with gr.Blocks() as demo:
gr.Markdown("## Information Extraction Tools")
with gr.Tab("PNG Info"):
png_input = gr.File(label="Upload PNG File")
png_output = gr.Textbox(label="PNG Metadata", lines=10)
png_button = gr.Button("Extract PNG Info")
png_button.click(png_info, inputs=png_input, outputs=png_output)
with gr.Tab("Web Info"):
web_input = gr.Textbox(label="Enter URL")
web_output = gr.Textbox(label="Web Info")
web_button = gr.Button("Extract Web Info")
web_button.click(web_info, inputs=web_input, outputs=web_output)
with gr.Tab("View Source Info"):
source_input = gr.Textbox(label="Enter URL (with or without 'view-source:')", placeholder="e.g., https://example.com or view-source:example.com")
source_output = gr.Textbox(label="HTML Source Code", lines=20)
source_button = gr.Button("View Source")
source_button.click(view_source_info, inputs=source_input, outputs=source_output)
with gr.Tab("Document Info"):
doc_input = gr.File(label="Upload Document")
content_output = gr.Textbox(label="Content", lines=10, visible=False)
preview_output = gr.Image(label="Preview (Image)", visible=False)
doc_button = gr.Button("Extract Document Info")
def update_output_components(file):
if file is None:
return gr.Textbox(visible=False), gr.Image(visible=False)
file_extension = os.path.splitext(file.name)[1].lower()
if file_extension in [".txt", ".md"]:
return gr.Textbox(visible=True), gr.Image(visible=False)
elif file_extension in [".png", ".jpg", ".jpeg", ".bmp", ".gif"]:
return gr.Textbox(visible=False), gr.Image(visible=True)
else:
return gr.Textbox(visible=True), gr.Image(visible=False)
doc_button.click(document_info, inputs=doc_input, outputs=[content_output, preview_output])
doc_input.change(update_output_components, inputs=doc_input, outputs=[content_output, preview_output])
with gr.Tab("Video Info"):
video_input = gr.Video(label="Upload Video")
video_output = gr.Video(label="Video Preview")
metadata_output = gr.Textbox(label="Video Metadata", lines=10)
video_button = gr.Button("Extract Video Info")
video_button.click(video_info, inputs=video_input, outputs=[video_output, metadata_output])
with gr.Tab("Model Info"):
model_input = gr.Textbox(label="Enter Model ID", placeholder="e.g., bert-base-uncased")
by_output = gr.Textbox(label="By", value="")
description_output = gr.Textbox(label="Description", value="", lines=5)
spaces_output = gr.Textbox(label="Related Spaces", value="", lines=3)
install_output = gr.Textbox(label="How to Install", value="", lines=5)
model_button = gr.Button("Fetch Model Info")
model_button.click(model_info, inputs=model_input, outputs=[by_output, description_output, spaces_output, install_output])
with gr.Tab("Space Info"):
space_input = gr.Textbox(label="Enter Space ID", placeholder="e.g., gradio/hello-world")
makes_output = gr.Textbox(label="Makes", value="")
code_output = gr.Textbox(label="Code", value="", lines=5)
description_output = gr.Textbox(label="Description", value="", lines=10)
space_button = gr.Button("Fetch Space Info")
space_button.click(space_info, inputs=space_input, outputs=[makes_output, code_output, description_output])
# Launch the Gradio app
demo.launch()