Spaces:

imageomics
/

bioclip-demo

Running

App Files Files Community

query-neighbors

#10

by smenon8 - opened Mar 23

base: refs/heads/main

←

from: refs/pr/10

Discussion Files changed

+85

-2

Files changed (3) hide show

.gitignore +1 -0
app.py +9 -2
components/query_neighbor.py +75 -0

.gitignore CHANGED Viewed

@@ -1,2 +1,3 @@
 .venv/
 __pycache__/

 .venv/
 __pycache__/
+.gradio/

app.py CHANGED Viewed

@@ -14,6 +14,7 @@ from torchvision import transforms
 from templates import openai_imagenet_template
 from components.query import  get_sample
 log_format = "[%(asctime)s] [%(levelname)s] [%(name)s] %(message)s"
 logging.basicConfig(level=logging.INFO, format=log_format)
@@ -90,6 +91,8 @@ zero_shot_examples = [
     ],
 ]
 def indexed(lst, indices):
     return [lst[i] for i in indices]
@@ -146,6 +149,10 @@ def open_domain_classification(img, rank: int, return_all=False):
     logits = (model.logit_scale.exp() * img_features @ txt_emb).squeeze()
     probs = F.softmax(logits, dim=0)
     if rank + 1 == len(ranks):
         topk = probs.topk(k)
         prediction_dict = {
@@ -154,9 +161,9 @@ def open_domain_classification(img, rank: int, return_all=False):
         logger.info(f"Top K predictions: {prediction_dict}")
         top_prediction_name = format_name(*txt_names[topk.indices[0]]).split("(")[0]
         logger.info(f"Top prediction name: {top_prediction_name}")
-        sample_img, taxon_url = get_sample(metadata_df, top_prediction_name, rank)
         if return_all:
-            return prediction_dict, sample_img, taxon_url
         return prediction_dict
     output = collections.defaultdict(float)

 from templates import openai_imagenet_template
 from components.query import  get_sample
+from components.query_neighbor import QueryNeighbor
 log_format = "[%(asctime)s] [%(levelname)s] [%(name)s] %(message)s"
 logging.basicConfig(level=logging.INFO, format=log_format)
     ],
 ]
+query_neighbor = QueryNeighbor(dataset_name = "BIRD")
 def indexed(lst, indices):
     return [lst[i] for i in indices]
     logits = (model.logit_scale.exp() * img_features @ txt_emb).squeeze()
     probs = F.softmax(logits, dim=0)
+    neighbor = str(query_neighbor.get_nearest_neighbor(img_features))
+    neighbor_image = query_neighbor.get_image(neighbor)
+    logger.info(f"Nearest neighbor: {neighbor}")
     if rank + 1 == len(ranks):
         topk = probs.topk(k)
         prediction_dict = {
         logger.info(f"Top K predictions: {prediction_dict}")
         top_prediction_name = format_name(*txt_names[topk.indices[0]]).split("(")[0]
         logger.info(f"Top prediction name: {top_prediction_name}")
+        _, taxon_url = get_sample(metadata_df, top_prediction_name, rank)
         if return_all:
+            return prediction_dict, neighbor_image, taxon_url
         return prediction_dict
     output = collections.defaultdict(float)

components/query_neighbor.py ADDED Viewed

	@@ -0,0 +1,75 @@

+import io
+import os
+import chromadb
+import boto3
+import requests
+import logging
+from PIL import Image
+from huggingface_hub import snapshot_download
+from dataclasses import dataclass
+log_format = "[%(asctime)s] [%(levelname)s] [%(name)s] %(message)s"
+logging.basicConfig(level=logging.INFO, format=log_format)
+logger = logging.getLogger()
+S3_BUCKET = "tol-bird-dataset-test"
+@dataclass
+class VectorDataset:
+    dataset_name: str
+    hf_dataset_path: str
+    relative_vector_db_path: str
+_SUPPORTED_DATASETS = {
+    "BIRD": VectorDataset(
+        dataset_name="BIRD",
+        hf_dataset_path="imageomics/bird-dataset-vector",
+        relative_vector_db_path="bird_vector_db"
+    ),
+}
+class QueryNeighbor:
+    """
+    Class to query the nearest neighbor for a given image feature vector.
+    It uses a vector database to find the nearest neighbor and retrieves the image from S3.
+    The class is initialized with the vector database path and the dataset name.
+    The vector database is downloaded from Hugging Face Hub and stored in a local cache.
+    The class uses the chromadb library to interact with the vector database and boto3 to interact with S3.
+    """
+    def __init__(self, dataset_name: str):
+        logger.info("Initializing QueryNeighbor")
+        vector_dataset = _SUPPORTED_DATASETS.get(dataset_name)
+        if vector_dataset is None:
+            raise ValueError(f"Unsupported dataset: {dataset_name}")
+        vector_db_path = snapshot_download(
+            repo_id=vector_dataset.hf_dataset_path,
+            repo_type="dataset"
+        )
+        logger.info(f"Vector DB cache: {vector_db_path}")
+        self._client = chromadb.PersistentClient(
+            path=os.path.join(vector_db_path,
+                              vector_dataset.relative_vector_db_path))
+        self._collection = self._client.get_collection(
+            name=dataset_name
+        )
+        self._s3_client = boto3.client("s3")
+    def get_nearest_neighbor(self, img_features) -> int:
+        ''' Returns the nearest neighbors for the given image features. '''
+        neighbors = self._collection.query(query_embeddings=[img_features[0].tolist()],
+                     n_results = 2)
+        return neighbors["ids"][0][0]
+    def get_image(self, image_key: str):
+        ''' Returns the image for the given key. '''
+        img_src = self._s3_client.generate_presigned_url('get_object',
+                                                   Params={'Bucket': S3_BUCKET,
+                                                           'Key': image_key}
+                                                   )
+        img_resp = requests.get(img_src)
+        img = Image.open(io.BytesIO(img_resp.content))
+        return img