Commit 6917a0d
Parent(s): 0f1766c
added code files
README.md
CHANGED
@@ -1,13 +1,10 @@
 ---
-title: CLIPPhotoSearchEngine
-emoji: 🦀
-colorFrom: red
-colorTo: purple
-sdk: gradio
-sdk_version: 3.46.1
-app_file: app.py
-pinned: false
 license: mit
+title: YoloV3
+sdk: gradio
+colorFrom: yellow
+colorTo: green
+pinned: true
 ---
-
-
+# yolov3
+S13 ERA V1
app.py
ADDED
@@ -0,0 +1,149 @@
+import os
+from pathlib import Path
+
+import numpy as np
+import pandas as pd
+import clip
+import gradio as gr
+from PIL import Image
+
+from utils import *
+
+# Load the open CLIP model
+model, preprocess = clip.load("ViT-B/32", device=device)
+
+# Download the precomputed Unsplash index from GitHub Releases
+if not Path('unsplash-dataset/photo_ids.csv').exists():
+    os.system('wget https://github.com/haltakov/natural-language-image-search/releases/download/1.0.0/photo_ids.csv -O unsplash-dataset/photo_ids.csv')
+
+if not Path('unsplash-dataset/features.npy').exists():
+    os.system('wget https://github.com/haltakov/natural-language-image-search/releases/download/1.0.0/features.npy -O unsplash-dataset/features.npy')
+
+# Load the photo IDs
+photo_ids = pd.read_csv("unsplash-dataset/photo_ids.csv")
+photo_ids = list(photo_ids['photo_id'])
+
+# Load the feature vectors
+photo_features = np.load("unsplash-dataset/features.npy")
+
+# Convert features to tensors: float32 on CPU and float16 on GPU
+if device == "cpu":
+    photo_features = torch.from_numpy(photo_features).float().to(device)
+else:
+    photo_features = torch.from_numpy(photo_features).to(device)
+
+# Print some statistics
+print(f"Photos loaded: {len(photo_ids)}")
+
+
+def search_by_text_and_photo(query_text, query_img, query_photo_id=None, photo_weight=0.5):
+    # Nothing to search with
+    if not query_text and query_img is None and not query_photo_id:
+        return []
+
+    # Encode the text query
+    text_features = encode_search_query(model, query_text)
+
+    if query_photo_id:
+        # Find the feature vector for the specified photo ID
+        query_photo_index = photo_ids.index(query_photo_id)
+        query_photo_features = photo_features[query_photo_index]
+
+        # Combine the text and photo queries and normalize again
+        search_features = text_features + query_photo_features * photo_weight
+        search_features /= search_features.norm(dim=-1, keepdim=True)
+
+        # Find the best matches
+        best_photo_ids = find_best_matches(search_features, photo_features, photo_ids, 10)
+
+    elif query_img is not None:
+        # Preprocess the uploaded image and encode it with CLIP
+        query_img = preprocess(Image.fromarray(query_img)).unsqueeze(0).to(device)
+        with torch.no_grad():
+            query_photo_features = model.encode_image(query_img)
+        query_photo_features = query_photo_features / query_photo_features.norm(dim=-1, keepdim=True)
+
+        # Combine the text and photo queries and normalize again
+        search_features = text_features + query_photo_features * photo_weight
+        search_features /= search_features.norm(dim=-1, keepdim=True)
+
+        # Find the best matches
+        best_photo_ids = find_best_matches(search_features, photo_features, photo_ids, 10)
+    else:
+        # Text-only search
+        best_photo_ids = search_unslash(model, query_text, photo_features, photo_ids, 10)
+
+    return best_photo_ids
+
+
+with gr.Blocks() as app:
+    with gr.Row():
+        gr.Markdown(
+            """
+            # CLIP Image Search Engine!
+            ### Enter a search query and/or an input image to find similar images in the database
+            """)
+
+    with gr.Row(visible=True):
+        with gr.Column():
+            with gr.Row():
+                search_text = gr.Textbox(value='', placeholder='Search..', label='Enter Your Query')
+
+            with gr.Row():
+                submit_btn = gr.Button("Submit", variant='primary')
+                clear_btn = gr.ClearButton()
+
+        with gr.Column():
+            search_image = gr.Image(label='Upload Image or Select from results')
+
+    with gr.Row(visible=True):
+        output_images = gr.Gallery(allow_preview=False, label='Results.. ',
+                                   value=[], columns=5, rows=2)
+
+    output_image_ids = gr.State([])
+
+
+    def clear_data():
+        return {
+            search_image: None,
+            output_images: None,
+            search_text: None
+        }
+
+
+    clear_btn.click(clear_data, None, [search_image, output_images, search_text])
+
+
+    def on_select(evt: gr.SelectData, output_image_ids):
+        return {
+            search_image: f"https://unsplash.com/photos/{output_image_ids[evt.index]}/download?w=100"
+        }
+
+
+    output_images.select(on_select, output_image_ids, search_image)
+
+
+    def func_search(query, img):
+        best_photo_ids = search_by_text_and_photo(query, img)
+        img_urls = []
+        for p_id in best_photo_ids:
+            url = f"https://unsplash.com/photos/{p_id}/download?w=100"
+            img_urls.append(url)
+
+        # Keep only the URLs that actually resolve
+        valid_images = filter_invalid_urls(img_urls, best_photo_ids)
+
+        return {
+            output_image_ids: valid_images['image_ids'],
+            output_images: valid_images['image_urls']
+        }
+
+
+    submit_btn.click(
+        func_search,
+        [search_text, search_image],
+        [output_images, output_image_ids]
+    )
+
+# Launch the app
+app.launch()
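Note: the weighted text-plus-image query in search_by_text_and_photo is just a vector sum followed by renormalization, so its behavior can be sanity-checked without loading the model. A minimal sketch (not part of the commit; random unit vectors stand in for real CLIP embeddings, and photo_weight mirrors the default above):

import torch

torch.manual_seed(0)

# Fake index of 1000 unit-normalized 512-d "photo" embeddings
photo_features = torch.randn(1000, 512)
photo_features /= photo_features.norm(dim=-1, keepdim=True)

# Fake text and image query embeddings, also unit-normalized
text_features = torch.randn(1, 512)
text_features /= text_features.norm(dim=-1, keepdim=True)
image_features = torch.randn(1, 512)
image_features /= image_features.norm(dim=-1, keepdim=True)

# Weighted sum of the two queries, renormalized to unit length
photo_weight = 0.5
search_features = text_features + image_features * photo_weight
search_features /= search_features.norm(dim=-1, keepdim=True)

# On unit vectors, cosine similarity reduces to a dot product
similarities = (photo_features @ search_features.T).squeeze(1)
print((-similarities).argsort()[:10])  # indices of the 10 best matches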
requirements.txt
ADDED
@@ -0,0 +1,8 @@
+torch
+torchvision
+pillow
+gradio
+numpy
+pandas
+grequests
+git+https://github.com/openai/CLIP.git
utils.py
ADDED
@@ -0,0 +1,65 @@
+from gevent import monkey
+
+# grequests monkey-patches the standard library via gevent, which can break
+# the running server's event loop; stub out the patch before importing it.
+def stub(*args, **kwargs):  # pylint: disable=unused-argument
+    pass
+monkey.patch_all = stub
+import grequests
+import requests
+
+import torch
+import clip
+
+device = "cuda" if torch.cuda.is_available() else "cpu"
+
+
+def encode_search_query(model, search_query):
+    with torch.no_grad():
+        tokenized_query = clip.tokenize(search_query)
+
+        # Encode and normalize the search query using CLIP
+        text_encoded = model.encode_text(tokenized_query.to(device))
+        text_encoded /= text_encoded.norm(dim=-1, keepdim=True)
+
+    # Return the feature vector
+    return text_encoded
+
+
+def find_best_matches(text_features, photo_features, photo_ids, results_count=5):
+    # Compute the similarity between the search query and each photo (cosine similarity)
+    similarities = (photo_features @ text_features.T).squeeze(1)
+
+    # Sort the photos by their similarity score
+    best_photo_idx = (-similarities).argsort()
+
+    # Return the photo IDs of the best matches
+    return [photo_ids[i] for i in best_photo_idx[:results_count]]
+
+
+def search_unslash(model, search_query, photo_features, photo_ids, results_count=10):
+    # Encode the search query
+    text_features = encode_search_query(model, search_query)
+
+    # Find the best matches
+    best_photo_ids = find_best_matches(text_features, photo_features, photo_ids, results_count)
+
+    return best_photo_ids
+
+
+def filter_invalid_urls(urls, photo_ids):
+    # Request all candidate URLs concurrently
+    rs = (grequests.get(u) for u in urls)
+    results = grequests.map(rs)
+
+    valid_image_ids = []
+    valid_image_urls = []
+    for i, res in enumerate(results):
+        if res and res.status_code == 200:
+            valid_image_urls.append(urls[i])
+            valid_image_ids.append(photo_ids[i])
+
+    return dict(
+        image_ids=valid_image_ids,
+        image_urls=valid_image_urls
+    )
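A quick, illustrative smoke test for the utils.py helpers (not part of the commit; it uses a tiny random index in place of the real Unsplash features, so the returned IDs are meaningless placeholders):

import torch
import clip

from utils import device, encode_search_query, find_best_matches

model, _ = clip.load("ViT-B/32", device=device)

# Fake index: 100 unit-normalized 512-d "photo" vectors with made-up IDs
feats = torch.randn(100, 512).float().to(device)
feats /= feats.norm(dim=-1, keepdim=True)
ids = [f"photo-{i}" for i in range(100)]

query = encode_search_query(model, "two dogs playing in the snow")
print(find_best_matches(query.float(), feats, ids, results_count=5))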