Spaces:

sohojoe
/

soho-clip-embeddings-explorer

Running

App Files Files Community

sohojoe committed on May 9, 2023

Commit

cdfc363

1 Parent(s): 99ea77b

refactor clip_app_client into an api class and clip_app_performance_test

Browse files

Files changed (2) hide show

experimental/clip_app_client.py +94 -140
experimental/clip_app_performance_test.py +168 -0

experimental/clip_app_client.py CHANGED Viewed

@@ -1,146 +1,100 @@
-# File name: graph_client.py
-from concurrent.futures import ThreadPoolExecutor
-import json
 import os
 import numpy as np
 import requests
 from concurrent.futures import ThreadPoolExecutor, as_completed
-import time
 import torch
-# hack for debugging, set HTTP_ADDRESS to "http://127.0.0.1:8000/"
-# os.environ["HTTP_ADDRESS"] = "http://192.168.7.79:8000"
-test_image_url = "https://static.wixstatic.com/media/4d6b49_42b9435ce1104008b1b5f7a3c9bfcd69~mv2.jpg/v1/fill/w_454,h_333,fp_0.50_0.50,q_90/4d6b49_42b9435ce1104008b1b5f7a3c9bfcd69~mv2.jpg"
-english_text = (
-    "It was the best of times, it was the worst of times, it was the age "
-    "of wisdom, it was the age of foolishness, it was the epoch of belief"
-)
-clip_model="ViT-L/14"
-clip_model_id ="laion5B-L-14"
-device = "cuda:0" if torch.cuda.is_available() else "cpu"
-print ("using device", device)
-from clip_retrieval.load_clip import load_clip, get_tokenizer
-# from clip_retrieval.clip_client import ClipClient, Modality
-model, preprocess = load_clip(clip_model, use_jit=True, device=device)
-tokenizer = get_tokenizer(clip_model)
-def preprocess_image(image_url):
-    # download image from url
-    import requests
-    from PIL import Image
-    from io import BytesIO
-    response = requests.get(test_image_url)
-    input_image = Image.open(BytesIO(response.content))
-    input_image = input_image.convert('RGB')
-    # convert image to numpy array
-    input_image = np.array(input_image)
-    input_im = Image.fromarray(input_image)
-    prepro = preprocess(input_im).unsqueeze(0).cpu()
-    return prepro
-preprocessed_image = preprocess_image(test_image_url)
-def text_to_embedding(text):
-    payload = {
-        "text": ('str', text, 'application/octet-stream'),
-    }
-    url = os.environ.get("HTTP_ADDRESS", "http://127.0.0.1:8000/")
-    response = requests.post(url, files=payload)
-    embeddings = response.text
-    return embeddings
-def image_url_to_embedding(image_url):
-    payload = {
-        "image_url": ('str', test_image_url, 'application/octet-stream'),
-    }
-    url = os.environ.get("HTTP_ADDRESS", "http://127.0.0.1:8000/")
-    response = requests.post(url, files=payload)
-    embeddings = response.text
-    return embeddings
-def preprocessed_image_to_embedding(image):
-    key = "preprocessed_image"
-    data_bytes = image.numpy().tobytes()
-    shape_bytes = np.array(image.shape).tobytes()
-    dtype_bytes = str(image.dtype).encode()
-    payload = {
-        key: ('tensor', data_bytes, 'application/octet-stream'),
-        'shape': ('shape', shape_bytes, 'application/octet-stream'),
-        'dtype': ('dtype', dtype_bytes, 'application/octet-stream'),
-    }
-    url = os.environ.get("HTTP_ADDRESS", "http://127.0.0.1:8000/")
-    response = requests.post(url, files=payload)
-    embeddings = response.text
-    return embeddings
-def _send_text_request(number):
-    embeddings = text_to_embedding(english_text)
-    return number, embeddings
-def _send_image_url_request(number):
-    embeddings = image_url_to_embedding(test_image_url)
-    return number, embeddings
-def _send_preprocessed_image_request(number):
-    embeddings = preprocessed_image_to_embedding(preprocessed_image)
-    return number, embeddings
-def process(numbers, send_func, max_workers=10):
-    with ThreadPoolExecutor(max_workers=max_workers) as executor:
-        futures = [executor.submit(send_func, number) for number in numbers]
-        for future in as_completed(futures):
-            n_result, result = future.result()
-            result = json.loads(result)
-            print (f"{n_result} : {len(result[0])}")
-# def process_text(numbers, max_workers=10):
-#     for n in numbers:
-#         n_result, result = send_text_request(n)
-#         result = json.loads(result)
-#         print (f"{n_result} : {len(result[0])}")
-if __name__ == "__main__":
-    n_calls = 300
-    # test text
-    # n_calls = 1
-    numbers = list(range(n_calls))
-    start_time = time.monotonic()
-    process(numbers, _send_text_request)
-    end_time = time.monotonic()
-    total_time = end_time - start_time
-    avg_time_ms = total_time / n_calls * 1000
-    calls_per_sec = n_calls / total_time
-    print(f"Text...")
-    print(f" Average time taken: {avg_time_ms:.2f} ms")
-    print(f" Number of calls per second: {calls_per_sec:.2f}")
-    # test image url
-    # n_calls = 1
-    numbers = list(range(n_calls))
-    start_time = time.monotonic()
-    process(numbers, _send_image_url_request)
-    end_time = time.monotonic()
-    total_time = end_time - start_time
-    avg_time_ms = total_time / n_calls * 1000
-    calls_per_sec = n_calls / total_time
-    print(f"Image passing url...")
-    print(f" Average time taken: {avg_time_ms:.2f} ms")
-    print(f" Number of calls per second: {calls_per_sec:.2f}")
-    # test image as vector
-    # n_calls = 1
-    numbers = list(range(n_calls))
-    start_time = time.monotonic()
-    process(numbers, _send_preprocessed_image_request)
-    end_time = time.monotonic()
-    total_time = end_time - start_time
-    avg_time_ms = total_time / n_calls * 1000
-    calls_per_sec = n_calls / total_time
-    print(f"Preprocessed image...")
-    print(f" Average time taken: {avg_time_ms:.2f} ms")
-    print(f" Number of calls per second: {calls_per_sec:.2f}")

 import os
 import numpy as np
 import requests
 from concurrent.futures import ThreadPoolExecutor, as_completed
+from PIL import Image
+from io import BytesIO
 import torch
+from clip_retrieval.load_clip import load_clip, get_tokenizer
+class ClipAppClient:
+    """
+    Client for a CLIP embedding service reached over HTTP.
+
+    The constructor loads a CLIP model locally (via ``load_clip``) so images
+    can be preprocessed on the client. The embeddings themselves are requested
+    from the server whose address is read from the ``HTTP_ADDRESS`` environment
+    variable (default ``http://127.0.0.1:8000/``).
+
+    Example::
+
+        app_client = ClipAppClient()
+        test_image_url = "https://example.com/image.jpg"
+        preprocessed_image = app_client.preprocess_image(test_image_url)
+        text = "A beautiful landscape"
+        text_embeddings = app_client.text_to_embedding(text)
+        image_embeddings = app_client.image_url_to_embedding(test_image_url)
+        preprocessed_image_embeddings = app_client.preprocessed_image_to_embedding(preprocessed_image)
+    """
+
+    def __init__(self, clip_model="ViT-L/14", device=None):
+        """
+        Load the CLIP model, its preprocessing transform and its tokenizer.
+        :param clip_model: str, model name passed to ``load_clip`` and ``get_tokenizer``
+        :param device: str or None, device to load the model on; when falsy,
+            "cuda:0" is used if CUDA is available, otherwise "cpu"
+        """
+        self.clip_model = clip_model
+        self.device = device or ("cuda:0" if torch.cuda.is_available() else "cpu")
+        print("using device", self.device)
+        self.model, self.preprocess = load_clip(clip_model, use_jit=True, device=self.device)
+        self.tokenizer = get_tokenizer(clip_model)
+
+    @staticmethod
+    def _post_files(payload):
+        """
+        POST a multipart payload to the embedding server.
+        The server address is read from ``HTTP_ADDRESS`` on every call, so
+        changing the environment variable takes effect for later requests.
+        The HTTP status is not checked; the body is returned as-is.
+        :param payload: dict, mapping accepted by the ``files`` argument of ``requests.post``
+        :return: str, response body text
+        """
+        url = os.environ.get("HTTP_ADDRESS", "http://127.0.0.1:8000/")
+        response = requests.post(url, files=payload)
+        return response.text
+
+    def preprocess_image(self, image_url):
+        """
+        Download an image and run it through the model's preprocessing transform.
+        :param image_url: str, URL of the image to preprocess
+        :return: torch.Tensor, preprocessed image with a leading batch dimension, on the CPU
+        :raises requests.HTTPError: if the download returns an error status
+        """
+        response = requests.get(image_url)
+        # Fail here on an HTTP error instead of letting PIL choke on an error page.
+        response.raise_for_status()
+        input_im = Image.open(BytesIO(response.content)).convert('RGB')
+        return self.preprocess(input_im).unsqueeze(0).cpu()
+
+    def text_to_embedding(self, text):
+        """
+        Ask the server for the embedding of a text.
+        :param text: str, text to convert to an embedding
+        :return: str, response body text (the performance test in this commit parses it as JSON)
+        """
+        payload = {
+            "text": ('str', text, 'application/octet-stream'),
+        }
+        return self._post_files(payload)
+
+    def image_url_to_embedding(self, image_url):
+        """
+        Ask the server for the embedding of the image at a URL.
+        Only the URL is sent; this client does not download the image here.
+        :param image_url: str, URL of the image to convert to an embedding
+        :return: str, response body text (the performance test in this commit parses it as JSON)
+        """
+        payload = {
+            "image_url": ('str', image_url, 'application/octet-stream'),
+        }
+        return self._post_files(payload)
+
+    def preprocessed_image_to_embedding(self, image):
+        """
+        Ask the server for the embedding of an already preprocessed image.
+        The tensor is sent as three parts: raw data bytes, shape and dtype name.
+        :param image: torch.Tensor, preprocessed image
+        :return: str, response body text (the performance test in this commit parses it as JSON)
+        """
+        # detach()/cpu() make this work for tensors that track gradients or live
+        # on a GPU; the CPU tensor returned by preprocess_image is sent unchanged.
+        data_bytes = image.detach().cpu().numpy().tobytes()
+        # The shape goes out as raw bytes of NumPy's default integer dtype.
+        # NOTE(review): confirm the server decodes it with the same integer width.
+        shape_bytes = np.array(image.shape).tobytes()
+        dtype_bytes = str(image.dtype).encode()
+        payload = {
+            "preprocessed_image": ('tensor', data_bytes, 'application/octet-stream'),
+            'shape': ('shape', shape_bytes, 'application/octet-stream'),
+            'dtype': ('dtype', dtype_bytes, 'application/octet-stream'),
+        }
+        return self._post_files(payload)

experimental/clip_app_performance_test.py ADDED Viewed

	@@ -0,0 +1,168 @@

+from concurrent.futures import ThreadPoolExecutor, as_completed
+import json
+import os
+import time
+import numpy as np
+import requests
+import torch
+from clip_app_client import ClipAppClient
+# Sample inputs shared by every request in the benchmark.
+test_image_url = (
+    "https://static.wixstatic.com/media/"
+    "4d6b49_42b9435ce1104008b1b5f7a3c9bfcd69~mv2.jpg"
+    "/v1/fill/w_454,h_333,fp_0.50_0.50,q_90/"
+    "4d6b49_42b9435ce1104008b1b5f7a3c9bfcd69~mv2.jpg"
+)
+english_text = (
+    "It was the best of times, it was the worst of times, "
+    "it was the age of wisdom, it was the age of foolishness, "
+    "it was the epoch of belief"
+)
+# Built at import time: constructing the client loads the CLIP model, and the
+# sample image is downloaded and preprocessed once so the requests can reuse it.
+app_client = ClipAppClient()
+preprocessed_image = app_client.preprocess_image(test_image_url)
+def _send_text_request(number):
+    """Request the embedding of the sample text; return ``(number, response_text)``."""
+    return number, app_client.text_to_embedding(english_text)
+def _send_image_url_request(number):
+    """Request the embedding of the sample image by URL; return ``(number, response_text)``."""
+    return number, app_client.image_url_to_embedding(test_image_url)
+def _send_preprocessed_image_request(number):
+    """Request the embedding of the preprocessed sample image; return ``(number, response_text)``."""
+    return number, app_client.preprocessed_image_to_embedding(preprocessed_image)
+def process(numbers, send_func, max_workers=10):
+    """
+    Run ``send_func`` once per entry of ``numbers`` on a thread pool and report each reply.
+    Replies are handled in completion order, not submission order. Each reply
+    is parsed as JSON and the length of its first element is printed.
+    :param numbers: iterable, one argument per call to ``send_func``
+    :param send_func: callable, takes a number and returns ``(number, json_text)``
+    :param max_workers: int, size of the thread pool
+    """
+    pool = ThreadPoolExecutor(max_workers=max_workers)
+    with pool:
+        pending = []
+        for number in numbers:
+            pending.append(pool.submit(send_func, number))
+        for done in as_completed(pending):
+            index, body = done.result()
+            vectors = json.loads(body)
+            first_len = len(vectors[0])
+            print (f"{index} : {first_len}")
+def _run_benchmark(label, send_func, n_calls):
+    """
+    Time ``n_calls`` requests issued through ``process`` and print a summary.
+    :param label: str, heading printed above the timing results
+    :param send_func: callable, request function handed to ``process``
+    :param n_calls: int, number of requests to issue
+    """
+    numbers = list(range(n_calls))
+    start_time = time.monotonic()
+    process(numbers, send_func)
+    total_time = time.monotonic() - start_time
+    # Wall-clock time divided by the number of calls: requests overlap on the
+    # thread pool, so this is a throughput figure, not per-request latency.
+    avg_time_ms = total_time / n_calls * 1000
+    calls_per_sec = n_calls / total_time
+    print(label)
+    print(f" Average time taken: {avg_time_ms:.2f} ms")
+    print(f" Number of calls per second: {calls_per_sec:.2f}")
+
+
+if __name__ == "__main__":
+    n_calls = 300
+    # test text
+    _run_benchmark("Text...", _send_text_request, n_calls)
+    # test image url
+    _run_benchmark("Image passing url...", _send_image_url_request, n_calls)
+    # test image as vector
+    _run_benchmark("Preprocessed image...", _send_preprocessed_image_request, n_calls)
+# from concurrent.futures import ThreadPoolExecutor
+# import json
+# import os
+# import numpy as np
+# import requests
+# from concurrent.futures import ThreadPoolExecutor, as_completed
+# import time
+# import torch
+# # hack for debugging, set HTTP_ADDRESS to "http://127.0.0.1:8000/"
+# # os.environ["HTTP_ADDRESS"] = "http://192.168.7.79:8000"
+# test_image_url = "https://static.wixstatic.com/media/4d6b49_42b9435ce1104008b1b5f7a3c9bfcd69~mv2.jpg/v1/fill/w_454,h_333,fp_0.50_0.50,q_90/4d6b49_42b9435ce1104008b1b5f7a3c9bfcd69~mv2.jpg"
+# english_text = (
+#     "It was the best of times, it was the worst of times, it was the age "
+#     "of wisdom, it was the age of foolishness, it was the epoch of belief"
+# )
+# preprocessed_image = preprocess_image(test_image_url)
+# def _send_text_request(number):
+#     embeddings = text_to_embedding(english_text)
+#     return number, embeddings
+# def _send_image_url_request(number):
+#     embeddings = image_url_to_embedding(test_image_url)
+#     return number, embeddings
+# def _send_preprocessed_image_request(number):
+#     embeddings = preprocessed_image_to_embedding(preprocessed_image)
+#     return number, embeddings
+# def process(numbers, send_func, max_workers=10):
+#     with ThreadPoolExecutor(max_workers=max_workers) as executor:
+#         futures = [executor.submit(send_func, number) for number in numbers]
+#         for future in as_completed(futures):
+#             n_result, result = future.result()
+#             result = json.loads(result)
+#             print (f"{n_result} : {len(result[0])}")
+# # def process_text(numbers, max_workers=10):
+# #     for n in numbers:
+# #         n_result, result = send_text_request(n)
+# #         result = json.loads(result)
+# #         print (f"{n_result} : {len(result[0])}")
+# if __name__ == "__main__":
+#     n_calls = 300
+#     # test text
+#     # n_calls = 1
+#     numbers = list(range(n_calls))
+#     start_time = time.monotonic()
+#     process(numbers, _send_text_request)
+#     end_time = time.monotonic()
+#     total_time = end_time - start_time
+#     avg_time_ms = total_time / n_calls * 1000
+#     calls_per_sec = n_calls / total_time
+#     print(f"Text...")
+#     print(f" Average time taken: {avg_time_ms:.2f} ms")
+#     print(f" Number of calls per second: {calls_per_sec:.2f}")
+#     # test image url
+#     # n_calls = 1
+#     numbers = list(range(n_calls))
+#     start_time = time.monotonic()
+#     process(numbers, _send_image_url_request)
+#     end_time = time.monotonic()
+#     total_time = end_time - start_time
+#     avg_time_ms = total_time / n_calls * 1000
+#     calls_per_sec = n_calls / total_time
+#     print(f"Image passing url...")
+#     print(f" Average time taken: {avg_time_ms:.2f} ms")
+#     print(f" Number of calls per second: {calls_per_sec:.2f}")
+#     # test image as vector
+#     # n_calls = 1
+#     numbers = list(range(n_calls))
+#     start_time = time.monotonic()
+#     process(numbers, _send_preprocessed_image_request)
+#     end_time = time.monotonic()
+#     total_time = end_time - start_time
+#     avg_time_ms = total_time / n_calls * 1000
+#     calls_per_sec = n_calls / total_time
+#     print(f"Preprocessed image...")
+#     print(f" Average time taken: {avg_time_ms:.2f} ms")
+#     print(f" Number of calls per second: {calls_per_sec:.2f}")