Spaces:

imageomics
/

bioclip-2-demo

Running

App Files Community

egrace479 committed 20 days ago

Commit

fd1374f

verified ·

1 Parent(s): d4ca384

Update examples (#2)

Browse files

- Add images to LFS tracking (cee3f42e99d0067d36da79488a5b9e04a49f3fc2)
- Update examples for v2 (d1367b488a431acf5d3210b05e8b535aef890379)
- fix filter (affa08952db57e0154aa7de63366972abd49f69e)
- Add embeddings LFS tracking (cd0baf2af5c4c2564966619a43174d3511faea93)
- revert back to local inference code (1e724771249af95e9a7d9e3494291828eb225966)

Files changed (20) hide show

.gitattributes +4 -0
app.py +62 -34
components/query.py +1 -1
components/templates.py +82 -0
components/txt_emb_species.json +3 -0
examples/{Phoca-vitulina.png → Asparagales-Orchidaceae.jpg} +2 -2
examples/{Sarcoscypha-coccinea.jpeg → Bovidae-Oryx.jpg} +2 -2
examples/{Felis-catus.jpeg → Carcharhinus-melanopterus.jpg} +2 -2
examples/{Onoclea-sensibilis.jpg → Cebidae-Cebus.jpg} +2 -2
examples/Cortinarius-austroalbidus.jpg +3 -0
examples/Onoclea-hintonii.jpg +0 -0
examples/{Actinostola-abyssorum.png → Solanales-Petunia.png} +2 -2
examples/cheetah.jpg +3 -0
examples/coral-snake.jpeg +0 -0
examples/{Amanita-muscaria.jpeg → house-finch.jpeg} +2 -2
examples/jaguar.jpg +3 -0
examples/leopard.jpg +3 -0
examples/milk-snake.png +0 -3
examples/monarch.jpg +3 -0
examples/viceroy.jpg +3 -0

.gitattributes CHANGED Viewed

@@ -42,3 +42,7 @@ examples/Onoclea-sensibilis.jpg filter=lfs diff=lfs merge=lfs -text
 examples/Phoca-vitulina.png filter=lfs diff=lfs merge=lfs -text
 examples/Sarcoscypha-coccinea.jpeg filter=lfs diff=lfs merge=lfs -text
 examples/Ursus-arctos.jpeg filter=lfs diff=lfs merge=lfs -text

 examples/Phoca-vitulina.png filter=lfs diff=lfs merge=lfs -text
 examples/Sarcoscypha-coccinea.jpeg filter=lfs diff=lfs merge=lfs -text
 examples/Ursus-arctos.jpeg filter=lfs diff=lfs merge=lfs -text
+*.jpg filter=lfs diff=lfs merge=lfs -text
+*.jpeg filter=lfs diff=lfs merge=lfs -text
+*.png filter=lfs diff=lfs merge=lfs -text
+components/txt_emb_species.json filter=lfs diff=lfs merge=lfs -text

app.py CHANGED Viewed

@@ -11,9 +11,10 @@ import torch
 import torch.nn.functional as F
 from open_clip import create_model, get_tokenizer
 from torchvision import transforms
 from components.query import  get_sample
-from bioclip import CustomLabelsClassifier
 log_format = "[%(asctime)s] [%(levelname)s] [%(name)s] %(message)s"
 logging.basicConfig(level=logging.INFO, format=log_format)
@@ -27,16 +28,16 @@ METADATA_PATH = "components/metadata.parquet"
 metadata_df = pl.read_parquet(METADATA_PATH, low_memory = False)
 metadata_df = metadata_df.with_columns(pl.col(["eol_page_id", "gbif_id"]).cast(pl.Int64))
-MODEL_STR = "hf-hub:imageomics/bioclip-2"
-TOKENIZER_STR = "ViT-L-14"
-txt_emb_npy = "https://huggingface.co/datasets/imageomics/TreeOfLife-200M/resolve/main/embeddings/txt_emb_species.npy"
-txt_names_json = "embeddings/txt_emb_species.json"
 min_prob = 1e-9
 k = 5
-device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
 preprocess_img = transforms.Compose(
     [
@@ -52,41 +53,45 @@ preprocess_img = transforms.Compose(
 ranks = ("Kingdom", "Phylum", "Class", "Order", "Family", "Genus", "Species")
 open_domain_examples = [
-    ["examples/Ursus-arctos.jpeg", "Species"],
-    ["examples/Phoca-vitulina.png", "Species"],
-    ["examples/Felis-catus.jpeg", "Genus"],
-    ["examples/Sarcoscypha-coccinea.jpeg", "Order"],
 ]
 zero_shot_examples = [
     [
-        "examples/Ursus-arctos.jpeg",
-        "brown bear\nblack bear\npolar bear\nkoala bear\ngrizzly bear",
     ],
-    ["examples/milk-snake.png", "coral snake\nmilk snake"],
-    ["examples/coral-snake.jpeg", "coral snake\nmilk snake"],
     [
-        "examples/Carnegiea-gigantea.png",
-        "Carnegiea gigantea\nSchlumbergera opuntioides\nMammillaria albicoma",
     ],
     [
-        "examples/Amanita-muscaria.jpeg",
-        "Amanita fulva\nAmanita vaginata (grisette)\nAmanita calyptrata (coccoli)\nAmanita crocea\nAmanita rubescens (blusher)\nAmanita caesarea (Caesar's mushroom)\nAmanita jacksonii (American Caesar's mushroom)\nAmanita muscaria (fly agaric)\nAmanita pantherina (panther cap)",
     ],
     [
-        "examples/Actinostola-abyssorum.png",
-        "Animalia Cnidaria Hexacorallia Actiniaria Actinostolidae Actinostola abyssorum\nAnimalia Cnidaria Hexacorallia Actiniaria Actinostolidae Actinostola bulbosa\nAnimalia Cnidaria Hexacorallia Actiniaria Actinostolidae Actinostola callosa\nAnimalia Cnidaria Hexacorallia Actiniaria Actinostolidae Actinostola capensis\nAnimalia Cnidaria Hexacorallia Actiniaria Actinostolidae Actinostola carlgreni",
     ],
     [
-        "examples/Sarcoscypha-coccinea.jpeg",
-        "scarlet elf cup (coccinea)\nscharlachroter kelchbecherling (austriaca)\ncrimson cup (dudleyi)\nstalked scarlet cup (occidentalis)",
     ],
     [
-        "examples/Onoclea-hintonii.jpg",
-        "Onoclea attenuata\nOnoclea boryana\nOnoclea hintonii\nOnoclea intermedia\nOnoclea sensibilis",
     ],
     [
-        "examples/Onoclea-sensibilis.jpg",
-        "Onoclea attenuata\nOnoclea boryana\nOnoclea hintonii\nOnoclea intermedia\nOnoclea sensibilis",
     ],
 ]
@@ -95,13 +100,32 @@ def indexed(lst, indices):
     return [lst[i] for i in indices]
 def zero_shot_classification(img, cls_str: str) -> dict[str, float]:
     classes = [cls.strip() for cls in cls_str.split("\n") if cls.strip()]
-    classifier = CustomLabelsClassifier(
-        cls_ary = classes,
-        model_str = MODEL_STR,  # remove this line once pybioclip uses BioCLIP 2
-    )
-    return classifier.predict(img)
 def format_name(taxon, common):
@@ -165,16 +189,20 @@ def change_output(choice):
 if __name__ == "__main__":
     logger.info("Starting.")
-    model = create_model(MODEL_STR, output_dict=True, require_pretrained=True)
     model = model.to(device)
     logger.info("Created model.")
     model = torch.compile(model)
     logger.info("Compiled model.")
-    tokenizer = get_tokenizer(TOKENIZER_STR)
-    txt_emb = torch.from_numpy(np.load(txt_emb_npy, mmap_mode="r")).to(device)
     with open(txt_names_json) as fd:
         txt_names = json.load(fd)

 import torch.nn.functional as F
 from open_clip import create_model, get_tokenizer
 from torchvision import transforms
+from huggingface_hub import hf_hub_download
+from components.templates import openai_imagenet_template
 from components.query import  get_sample
 log_format = "[%(asctime)s] [%(levelname)s] [%(name)s] %(message)s"
 logging.basicConfig(level=logging.INFO, format=log_format)
 metadata_df = pl.read_parquet(METADATA_PATH, low_memory = False)
 metadata_df = metadata_df.with_columns(pl.col(["eol_page_id", "gbif_id"]).cast(pl.Int64))
+model_str = "hf-hub:imageomics/bioclip-2"
+tokenizer_str = "ViT-L-14"
+HF_DATA_STR = "imageomics/TreeOfLife-200M"
+txt_names_json = "components/txt_emb_species.json"
 min_prob = 1e-9
 k = 5
+device = torch.device("cpu")
 preprocess_img = transforms.Compose(
     [
 ranks = ("Kingdom", "Phylum", "Class", "Order", "Family", "Genus", "Species")
 open_domain_examples = [
+    ["examples/Carcharhinus-melanopterus.jpg", "Species"],
+    ["examples/house-finch.jpeg", "Species"],
+    ["examples/Bovidae-Oryx.jpg", "Genus"],
+    ["examples/Cebidae-Cebus.jpg", "Genus"],
+    ["examples/Solanales-Petunia.png", "Genus"],
+    ["examples/Asparagales-Orchidaceae.jpg", "Family"],
 ]
 zero_shot_examples = [
     [
+        "examples/Cortinarius-austroalbidus.jpg",
+        "Cortinarius austroalbidus\nCortinarius armillatus\nCortinarius caperatus"
     ],
     [
+        "examples/leopard.jpg",
+        "Jaguar\nLeopard\nCheetah",
+    ],
+    [
+        "examples/jaguar.jpg",
+        "Jaguar\nLeopard\nCheetah",
     ],
     [
+        "examples/cheetah.jpg",
+        "Jaguar\nLeopard\nCheetah",
     ],
     [
+        "examples/monarch.jpg",
+        "Danaus plexippus — Monarch\nLimenitis archippus — Viceroy",
     ],
     [
+        "examples/viceroy.jpg",
+        "Danaus plexippus — Monarch\nLimenitis archippus — Viceroy",
     ],
     [
+        "examples/Ursus-arctos.jpeg",
+        "brown bear\nblack bear\npolar bear\nkoala bear\ngrizzly bear",
     ],
     [
+        "examples/Carnegiea-gigantea.png",
+        "Carnegiea gigantea\nSchlumbergera opuntioides\nMammillaria albicoma",
     ],
 ]
     return [lst[i] for i in indices]
+@torch.no_grad()
+def get_txt_features(classnames, templates):
+    all_features = []
+    for classname in classnames:
+        txts = [template(classname) for template in templates]
+        txts = tokenizer(txts).to(device)
+        txt_features = model.encode_text(txts)
+        txt_features = F.normalize(txt_features, dim=-1).mean(dim=0)
+        txt_features /= txt_features.norm()
+        all_features.append(txt_features)
+    all_features = torch.stack(all_features, dim=1)
+    return all_features
+@torch.no_grad()
 def zero_shot_classification(img, cls_str: str) -> dict[str, float]:
     classes = [cls.strip() for cls in cls_str.split("\n") if cls.strip()]
+    txt_features = get_txt_features(classes, openai_imagenet_template)
+    img = preprocess_img(img).to(device)
+    img_features = model.encode_image(img.unsqueeze(0))
+    img_features = F.normalize(img_features, dim=-1)
+    logits = (model.logit_scale.exp() * img_features @ txt_features).squeeze()
+    probs = F.softmax(logits, dim=0).to("cpu").tolist()
+    return {cls: prob for cls, prob in zip(classes, probs)}
 def format_name(taxon, common):
 if __name__ == "__main__":
     logger.info("Starting.")
+    model = create_model(model_str, output_dict=True, require_pretrained=True)
     model = model.to(device)
     logger.info("Created model.")
     model = torch.compile(model)
     logger.info("Compiled model.")
+    tokenizer = get_tokenizer(tokenizer_str)
+    txt_emb = torch.from_numpy(np.load(hf_hub_download(
+        repo_id=HF_DATA_STR,
+        filename="embeddings/txt_emb_species.npy",
+        repo_type="dataset",
+    )))
     with open(txt_names_json) as fd:
         txt_names = json.load(fd)

components/query.py CHANGED Viewed

@@ -118,7 +118,7 @@ def get_sample_data(df, pred_taxon, rank):
         return None, np.nan, "", False
     # First, try to find entries with empty lower ranks
-    exact_df = df.copy()
     for lower_rank in RANKS[rank + 1:]:
         exact_df = exact_df.filter((pl.col(lower_rank).is_null()) | (pl.col(lower_rank) == ""))

         return None, np.nan, "", False
     # First, try to find entries with empty lower ranks
+    exact_df = df
     for lower_rank in RANKS[rank + 1:]:
         exact_df = exact_df.filter((pl.col(lower_rank).is_null()) | (pl.col(lower_rank) == ""))

components/templates.py ADDED Viewed

	@@ -0,0 +1,82 @@

+openai_imagenet_template = [
+    lambda c: f"a bad photo of a {c}.",
+    lambda c: f"a photo of many {c}.",
+    lambda c: f"a sculpture of a {c}.",
+    lambda c: f"a photo of the hard to see {c}.",
+    lambda c: f"a low resolution photo of the {c}.",
+    lambda c: f"a rendering of a {c}.",
+    lambda c: f"graffiti of a {c}.",
+    lambda c: f"a bad photo of the {c}.",
+    lambda c: f"a cropped photo of the {c}.",
+    lambda c: f"a tattoo of a {c}.",
+    lambda c: f"the embroidered {c}.",
+    lambda c: f"a photo of a hard to see {c}.",
+    lambda c: f"a bright photo of a {c}.",
+    lambda c: f"a photo of a clean {c}.",
+    lambda c: f"a photo of a dirty {c}.",
+    lambda c: f"a dark photo of the {c}.",
+    lambda c: f"a drawing of a {c}.",
+    lambda c: f"a photo of my {c}.",
+    lambda c: f"the plastic {c}.",
+    lambda c: f"a photo of the cool {c}.",
+    lambda c: f"a close-up photo of a {c}.",
+    lambda c: f"a black and white photo of the {c}.",
+    lambda c: f"a painting of the {c}.",
+    lambda c: f"a painting of a {c}.",
+    lambda c: f"a pixelated photo of the {c}.",
+    lambda c: f"a sculpture of the {c}.",
+    lambda c: f"a bright photo of the {c}.",
+    lambda c: f"a cropped photo of a {c}.",
+    lambda c: f"a plastic {c}.",
+    lambda c: f"a photo of the dirty {c}.",
+    lambda c: f"a jpeg corrupted photo of a {c}.",
+    lambda c: f"a blurry photo of the {c}.",
+    lambda c: f"a photo of the {c}.",
+    lambda c: f"a good photo of the {c}.",
+    lambda c: f"a rendering of the {c}.",
+    lambda c: f"a {c} in a video game.",
+    lambda c: f"a photo of one {c}.",
+    lambda c: f"a doodle of a {c}.",
+    lambda c: f"a close-up photo of the {c}.",
+    lambda c: f"a photo of a {c}.",
+    lambda c: f"the origami {c}.",
+    lambda c: f"the {c} in a video game.",
+    lambda c: f"a sketch of a {c}.",
+    lambda c: f"a doodle of the {c}.",
+    lambda c: f"a origami {c}.",
+    lambda c: f"a low resolution photo of a {c}.",
+    lambda c: f"the toy {c}.",
+    lambda c: f"a rendition of the {c}.",
+    lambda c: f"a photo of the clean {c}.",
+    lambda c: f"a photo of a large {c}.",
+    lambda c: f"a rendition of a {c}.",
+    lambda c: f"a photo of a nice {c}.",
+    lambda c: f"a photo of a weird {c}.",
+    lambda c: f"a blurry photo of a {c}.",
+    lambda c: f"a cartoon {c}.",
+    lambda c: f"art of a {c}.",
+    lambda c: f"a sketch of the {c}.",
+    lambda c: f"a embroidered {c}.",
+    lambda c: f"a pixelated photo of a {c}.",
+    lambda c: f"itap of the {c}.",
+    lambda c: f"a jpeg corrupted photo of the {c}.",
+    lambda c: f"a good photo of a {c}.",
+    lambda c: f"a plushie {c}.",
+    lambda c: f"a photo of the nice {c}.",
+    lambda c: f"a photo of the small {c}.",
+    lambda c: f"a photo of the weird {c}.",
+    lambda c: f"the cartoon {c}.",
+    lambda c: f"art of the {c}.",
+    lambda c: f"a drawing of the {c}.",
+    lambda c: f"a photo of the large {c}.",
+    lambda c: f"a black and white photo of a {c}.",
+    lambda c: f"the plushie {c}.",
+    lambda c: f"a dark photo of a {c}.",
+    lambda c: f"itap of a {c}.",
+    lambda c: f"graffiti of the {c}.",
+    lambda c: f"a toy {c}.",
+    lambda c: f"itap of my {c}.",
+    lambda c: f"a photo of a cool {c}.",
+    lambda c: f"a photo of a small {c}.",
+    lambda c: f"a tattoo of the {c}.",
+]

components/txt_emb_species.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4a81b2931330d7e0e5cf1e9a96982d7eed4ac187b08ad99533c9dad523f5b4f4
+size 110609010

examples/{Phoca-vitulina.png → Asparagales-Orchidaceae.jpg} RENAMED Viewed

File without changes

examples/{Sarcoscypha-coccinea.jpeg → Bovidae-Oryx.jpg} RENAMED Viewed

File without changes

examples/{Felis-catus.jpeg → Carcharhinus-melanopterus.jpg} RENAMED Viewed

File without changes

examples/{Onoclea-sensibilis.jpg → Cebidae-Cebus.jpg} RENAMED Viewed

File without changes

examples/Cortinarius-austroalbidus.jpg ADDED Viewed

Git LFS Details

SHA256: b31dcec447348ed6e9643bd3250bfa38c6bbd3b9d6c26eddaf584f2f6da9375b
Pointer size: 131 Bytes
Size of remote file: 691 kB

examples/Onoclea-hintonii.jpg DELETED Viewed

Binary file (88.1 kB)

examples/{Actinostola-abyssorum.png → Solanales-Petunia.png} RENAMED Viewed

File without changes

examples/cheetah.jpg ADDED Viewed

Git LFS Details

SHA256: 585c460f96a8ed44774bdc1009f3148ec232e60d9e7676681f781eeb55216100
Pointer size: 130 Bytes
Size of remote file: 41.9 kB

examples/coral-snake.jpeg DELETED Viewed

Binary file (51.8 kB)

examples/{Amanita-muscaria.jpeg → house-finch.jpeg} RENAMED Viewed

File without changes

examples/jaguar.jpg ADDED Viewed

Git LFS Details

SHA256: 6b6f3145366c10c57e9dba2225d061d7f8575fdf713393ebd90cd45f71c92db7
Pointer size: 131 Bytes
Size of remote file: 141 kB

examples/leopard.jpg ADDED Viewed

Git LFS Details

SHA256: 41a0815d6a774b9b2a1a28c0168c9ab94a38ada1e7d83fbaacbc199c36e46bba
Pointer size: 132 Bytes
Size of remote file: 3.88 MB

examples/milk-snake.png DELETED Viewed

Git LFS Details

SHA256: 4c5820dfcdaa056903767cc7a3dade6e9e9d24c686fab9d457889879e80fa3ab
Pointer size: 131 Bytes
Size of remote file: 411 kB

examples/monarch.jpg ADDED Viewed

Git LFS Details

SHA256: 9440186ed9edb88d7b5969f0ea08b375bb4f01b572406f698a247ba6ddd7c45c
Pointer size: 131 Bytes
Size of remote file: 416 kB

examples/viceroy.jpg ADDED Viewed

Git LFS Details

SHA256: 87a6d9646716cbda2c988511f4ae22fc1eed52d87b5656037943e2a0f429edef
Pointer size: 132 Bytes
Size of remote file: 1.23 MB