Info-tools / app.py
Felguk's picture
Update app.py
4d49ad5 verified
import gradio as gr
from PIL import Image
import requests
from bs4 import BeautifulSoup
import os
import subprocess
from huggingface_hub import ModelCard, SpaceCard, HfApi
# PNG Info Tool
def png_info(file):
img = Image.open(file)
metadata = img.info
metadata_str = "\n".join([f"{key}: {value}" for key, value in metadata.items()])
return metadata_str
# Web Info Tool
def web_info(url):
response = requests.get(url)
soup = BeautifulSoup(response.text, 'html.parser')
title = soup.title.string if soup.title else ""
meta_description = soup.find("meta", attrs={"name": "description"})
description = meta_description["content"] if meta_description else ""
meta_tags = soup.find_all("meta")
headers = {f"h{i}": len(soup.find_all(f"h{i}")) for i in range(1, 7)}
links = [a["href"] for a in soup.find_all("a", href=True)]
basic_info = f"Title: {title}\nDescription: {description}"
html_info = f"Meta Tags: {len(meta_tags)}\nHeaders: {headers}\nLinks: {len(links)}"
return f"{basic_info}\n\nHTML Info:\n{html_info}"
# View Source Info Tool
def view_source_info(url):
if url.startswith("view-source:"):
url = url.replace("view-source:", "").strip()
if not url.startswith(("http://", "https://")):
url = "https://" + url
response = requests.get(url)
return response.text
# Document Info Tool
def document_info(file):
file_extension = os.path.splitext(file.name)[1].lower()
content = ""
preview = None
if file_extension in [".txt", ".md"]:
with open(file.name, "r") as f:
content = f.read()
elif file_extension in [".png", ".jpg", ".jpeg", ".bmp", ".gif"]:
preview = file.name
else:
content = "Unsupported file format"
return content, preview
# Video Info Tool
def video_info(file):
video_display = file
result = subprocess.run(
["ffprobe", "-v", "error", "-show_format", "-show_streams", file],
stdout=subprocess.PIPE,
stderr=subprocess.PIPE,
text=True,
)
return video_display, result.stdout
# Model Info Tool
def model_info(model_id):
try:
card = ModelCard.load(model_id)
api = HfApi()
model_info = api.model_info(model_id)
by = model_info.author if model_info.author else ""
description = card.content if card.content else ""
related_spaces = model_info.siblings
related_spaces = [s.rfilename for s in related_spaces if s.rfilename.endswith(".py")]
related_spaces = "\n".join(related_spaces) if related_spaces else ""
install_instructions = f"pip install transformers\n\n# To use the model:\nfrom transformers import AutoModel, AutoTokenizer\nmodel = AutoModel.from_pretrained('{model_id}')\ntokenizer = AutoTokenizer.from_pretrained('{model_id}')"
return by, description, related_spaces, install_instructions
except Exception:
return "", "", "", ""
# Space Info Tool
def space_info(space_id):
try:
card = SpaceCard.load(space_id)
api = HfApi()
space_info = api.space_info(space_id)
makes = space_info.author if space_info.author else ""
description = card.content if card.content else ""
code_files = space_info.siblings
code_files = [s.rfilename for s in code_files if s.rfilename.endswith(".py")]
code = "\n".join(code_files) if code_files else ""
return makes, code, description
except Exception:
return "", "", ""
# Gradio Interface
with gr.Blocks() as demo:
gr.Markdown("## Information Extraction Tools")
with gr.Tab("PNG Info"):
png_input = gr.File(label="Upload PNG File")
png_output = gr.Textbox(label="PNG Metadata", lines=10)
png_button = gr.Button("Extract PNG Info")
png_button.click(png_info, inputs=png_input, outputs=png_output)
with gr.Tab("Web Info"):
web_input = gr.Textbox(label="Enter URL")
web_output = gr.Textbox(label="Web Info")
web_button = gr.Button("Extract Web Info")
web_button.click(web_info, inputs=web_input, outputs=web_output)
with gr.Tab("View Source Info"):
source_input = gr.Textbox(label="Enter URL (with or without 'view-source:')", placeholder="e.g., https://example.com or view-source:example.com")
source_output = gr.Textbox(label="HTML Source Code", lines=20)
source_button = gr.Button("View Source")
source_button.click(view_source_info, inputs=source_input, outputs=source_output)
with gr.Tab("Document Info"):
doc_input = gr.File(label="Upload Document")
content_output = gr.Textbox(label="Content", lines=10, visible=False)
preview_output = gr.Image(label="Preview (Image)", visible=False)
doc_button = gr.Button("Extract Document Info")
def update_output_components(file):
if file is None:
return gr.Textbox(visible=False), gr.Image(visible=False)
file_extension = os.path.splitext(file.name)[1].lower()
if file_extension in [".txt", ".md"]:
return gr.Textbox(visible=True), gr.Image(visible=False)
elif file_extension in [".png", ".jpg", ".jpeg", ".bmp", ".gif"]:
return gr.Textbox(visible=False), gr.Image(visible=True)
else:
return gr.Textbox(visible=True), gr.Image(visible=False)
doc_button.click(document_info, inputs=doc_input, outputs=[content_output, preview_output])
doc_input.change(update_output_components, inputs=doc_input, outputs=[content_output, preview_output])
with gr.Tab("Video Info"):
video_input = gr.Video(label="Upload Video")
video_output = gr.Video(label="Video Preview")
metadata_output = gr.Textbox(label="Video Metadata", lines=10)
video_button = gr.Button("Extract Video Info")
video_button.click(video_info, inputs=video_input, outputs=[video_output, metadata_output])
with gr.Tab("Model Info"):
model_input = gr.Textbox(label="Enter Model ID", placeholder="e.g., bert-base-uncased")
by_output = gr.Textbox(label="By", value="")
description_output = gr.Textbox(label="Description", value="", lines=5)
spaces_output = gr.Textbox(label="Related Spaces", value="", lines=3)
install_output = gr.Textbox(label="How to Install", value="", lines=5)
model_button = gr.Button("Fetch Model Info")
model_button.click(model_info, inputs=model_input, outputs=[by_output, description_output, spaces_output, install_output])
with gr.Tab("Space Info"):
space_input = gr.Textbox(label="Enter Space ID", placeholder="e.g., gradio/hello-world")
makes_output = gr.Textbox(label="Makes", value="")
code_output = gr.Textbox(label="Code", value="", lines=5)
description_output = gr.Textbox(label="Description", value="", lines=10)
space_button = gr.Button("Fetch Space Info")
space_button.click(space_info, inputs=space_input, outputs=[makes_output, code_output, description_output])
# Launch the Gradio app
demo.launch()