Spaces:
Runtime error
Runtime error
fix styling
Browse files
- .DS_Store +0 -0
- app.py +15 -9
- requirements.txt +2 -1
.DS_Store
CHANGED
|
Binary files a/.DS_Store and b/.DS_Store differ
|
|
|
app.py
CHANGED
|
@@ -1,4 +1,5 @@
|
|
| 1 |
import torch
|
|
|
|
| 2 |
import gradio as gr
|
| 3 |
import numpy as np
|
| 4 |
from PIL import Image, ImageDraw, ImageFont
|
|
@@ -19,19 +20,24 @@ def query_image(img, text_queries):
|
|
| 19 |
results = processor.post_process(outputs=outputs, target_sizes=target_sizes)
|
| 20 |
boxes, scores, labels = results[0]["boxes"], results[0]["scores"], results[0]["labels"]
|
| 21 |
|
| 22 |
-
|
| 23 |
-
|
|
|
|
|
|
|
| 24 |
|
| 25 |
-
score_threshold = 0.1
|
| 26 |
for box, score, label in zip(boxes, scores, labels):
|
| 27 |
box = [int(i) for i in box.tolist()]
|
| 28 |
|
| 29 |
if score >= score_threshold:
|
| 30 |
-
|
| 31 |
-
|
| 32 |
-
|
| 33 |
-
|
| 34 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 35 |
return img
|
| 36 |
|
| 37 |
|
|
@@ -45,7 +51,7 @@ To use it, simply upload an image and enter comma separated text descriptions of
|
|
| 45 |
"""
|
| 46 |
demo = gr.Interface(
|
| 47 |
query_image,
|
| 48 |
-
inputs=[gr.Image(shape=(768, 768)
|
| 49 |
outputs="image",
|
| 50 |
title="Zero-Shot Object Detection with OWL-ViT",
|
| 51 |
description=description,
|
|
|
|
| 1 |
import torch
|
| 2 |
+
import cv2
|
| 3 |
import gradio as gr
|
| 4 |
import numpy as np
|
| 5 |
from PIL import Image, ImageDraw, ImageFont
|
|
|
|
| 20 |
results = processor.post_process(outputs=outputs, target_sizes=target_sizes)
|
| 21 |
boxes, scores, labels = results[0]["boxes"], results[0]["scores"], results[0]["labels"]
|
| 22 |
|
| 23 |
+
img = cv2.resize(img, (768, 768), interpolation = cv2.INTER_AREA)
|
| 24 |
+
score_threshold = 0.11
|
| 25 |
+
|
| 26 |
+
font = cv2.FONT_HERSHEY_SIMPLEX
|
| 27 |
|
|
|
|
| 28 |
for box, score, label in zip(boxes, scores, labels):
|
| 29 |
box = [int(i) for i in box.tolist()]
|
| 30 |
|
| 31 |
if score >= score_threshold:
|
| 32 |
+
img = cv2.rectangle(img, box[:2], box[2:], (255,0,0), 5)
|
| 33 |
+
if box[3] + 25 > 768:
|
| 34 |
+
y = box[3] - 10
|
| 35 |
+
else:
|
| 36 |
+
y = box[3] + 25
|
| 37 |
+
|
| 38 |
+
img = cv2.putText(
|
| 39 |
+
img, text_queries[label], (box[0], y), font, 1, (255,0,0), 2, cv2.LINE_AA
|
| 40 |
+
)
|
| 41 |
return img
|
| 42 |
|
| 43 |
|
|
|
|
| 51 |
"""
|
| 52 |
demo = gr.Interface(
|
| 53 |
query_image,
|
| 54 |
+
inputs=[gr.Image(shape=(768, 768)), "text"],
|
| 55 |
outputs="image",
|
| 56 |
title="Zero-Shot Object Detection with OWL-ViT",
|
| 57 |
description=description,
|
requirements.txt
CHANGED
|
@@ -4,4 +4,5 @@ numpy>=1.18.5
|
|
| 4 |
torch>=1.7.0
|
| 5 |
torchvision>=0.8.1
|
| 6 |
Pillow
|
| 7 |
-
transformers
|
|
|
|
|
|
| 4 |
torch>=1.7.0
|
| 5 |
torchvision>=0.8.1
|
| 6 |
Pillow
|
| 7 |
+
transformers
|
| 8 |
+
opencv-python
|