codeShare
/

JupyterNotebooks

Model card Files Files and versions

xet

Community

codeShare commited on Sep 6, 2024

Commit

1028385

verified ·

1 Parent(s): 8ad9fee

Upload sd_token_similarity_calculator.ipynb

Browse files

Files changed (1) hide show

sd_token_similarity_calculator.ipynb +116 -19

sd_token_similarity_calculator.ipynb CHANGED Viewed

@@ -14,6 +14,15 @@
     }
   },
   "cells": [
     {
       "cell_type": "code",
       "source": [
@@ -23,7 +32,42 @@
         "from torch import linalg as LA\n",
         "device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')\n",
         "%cd /content/sd_tokens\n",
-        "token = torch.load('sd15_tensors.pt', map_location=device, weights_only=True)"
       ],
       "metadata": {
         "id": "Ch9puvwKH1s3"
@@ -34,7 +78,8 @@
     {
       "cell_type": "code",
       "source": [
-        "print(token[100].shape)  #dimension of the tokens"
       ],
       "metadata": {
         "id": "S_Yh9gH_OUA1"
@@ -42,36 +87,88 @@
       "execution_count": null,
       "outputs": []
     },
     {
       "cell_type": "code",
       "source": [
-        "def absolute_value(x):\n",
-        "    return max(x, -x)\n",
         "\n",
-        "def similarity(id_A , id_B):\n",
-        "  #Tensors\n",
-        "  A = token[id_A]\n",
-        "  B = token[id_B]\n",
         "\n",
-        "  #Tensor vector length (2nd order, i.e (a^2 + b^2 + ....)^(1/2)\n",
-        "  _A = LA.vector_norm(A, ord=2)\n",
-        "  _B = LA.vector_norm(B, ord=2)\n",
         "\n",
         "  result = torch.dot(A,B)/(_A*_B)\n",
-        "  similarity_pcnt = absolute_value(result.item()*100)\n",
-        "\n",
-        "  similarity_pcnt_aprox = round(similarity_pcnt, 3)\n",
         "\n",
-        "  result = f'{similarity_pcnt_aprox} %'\n",
-        "\n",
-        "  return result"
       ],
       "metadata": {
-        "id": "fxquCxFaUxAZ"
       },
-      "execution_count": 16,
       "outputs": []
     },
     {
       "cell_type": "markdown",
       "source": [

     }
   },
   "cells": [
+    {
+      "cell_type": "markdown",
+      "source": [
+        "This notebook is a Stable Diffusion tool that lets you find similar tokens in the SD 1.5 vocab.json, which you can then use for text-to-image generation"
+      ],
+      "metadata": {
+        "id": "L7JTcbOdBPfh"
+      }
+    },
     {
       "cell_type": "code",
       "source": [
         "from torch import linalg as LA\n",
         "device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')\n",
         "%cd /content/sd_tokens\n",
+        "token = torch.load('sd15_tensors.pt', map_location=device, weights_only=True)\n",
+        "#-----#\n",
+        "\n",
+        "#Import the vocab.json\n",
+        "import json\n",
+        "import pandas as pd\n",
+        "# vocab.json maps each token string to its integer ID.\n",
+        "# Read it as UTF-8 explicitly so decoding does not depend on the platform default encoding.\n",
+        "with open('vocab.json', 'r', encoding='utf-8') as f:\n",
+        "    data = json.load(f)\n",
+        "\n",
+        "_df = pd.DataFrame({'count': data})['count']\n",
+        "\n",
+        "# Invert the mapping so that vocab[ID] gives back the token string.\n",
+        "vocab = {\n",
+        "    value: key for key, value in _df.items()\n",
+        "}\n",
+        "#-----#\n",
+        "\n",
+        "# Define functions/constants\n",
+        "NUM_TOKENS = 49407\n",
+        "\n",
+        "def absolute_value(x):\n",
+        "    '''Return the magnitude of x.'''\n",
+        "    return abs(x)\n",
+        "\n",
+        "def similarity(id_A , id_B):\n",
+        "  '''Absolute cosine similarity between token[id_A] and token[id_B], formatted as a percentage string rounded to 3 decimals.'''\n",
+        "  #Tensors\n",
+        "  A = token[id_A]\n",
+        "  B = token[id_B]\n",
+        "  #Tensor vector length (2nd order, i.e (a^2 + b^2 + ....)^(1/2)\n",
+        "  _A = LA.vector_norm(A, ord=2)\n",
+        "  _B = LA.vector_norm(B, ord=2)\n",
+        "  #Cosine of the angle between A and B; the sign is dropped so opposite directions also score high\n",
+        "  cosine = torch.dot(A,B)/(_A*_B)\n",
+        "  similarity_pcnt = absolute_value(cosine.item()*100)\n",
+        "  similarity_pcnt_aprox = round(similarity_pcnt, 3)\n",
+        "  return f'{similarity_pcnt_aprox} %'\n",
+        "#----#"
       ],
       "metadata": {
         "id": "Ch9puvwKH1s3"
     {
       "cell_type": "code",
       "source": [
+        "print(vocab[12432]) #the vocab item for ID 12432\n",
+        "print(token[12432].shape)  #dimension of the token"
       ],
       "metadata": {
         "id": "S_Yh9gH_OUA1"
       "execution_count": null,
       "outputs": []
     },
+    {
+      "cell_type": "markdown",
+      "source": [
+        "Get the IDs from a prompt text.\n",
+        "\n",
+        "The tokenizer wraps the prompt in the `<|startoftext|>` and `<|endoftext|>` tokens, so the first prompt token is at position 1 of the ID list"
+      ],
+      "metadata": {
+        "id": "f1-jS7YJApiO"
+      }
+    },
     {
       "cell_type": "code",
       "source": [
         "\n",
+        "from transformers import AutoTokenizer\n",
+        "tokenizer = AutoTokenizer.from_pretrained(\"openai/clip-vit-large-patch14\", clean_up_tokenization_spaces = False)\n",
+        "prompt= \"blah\" # @param {type:'string'}\n",
+        "tokenizer_output = tokenizer(text = prompt)\n",
+        "input_ids = tokenizer_output['input_ids']\n",
+        "print(input_ids)"
+      ],
+      "metadata": {
+        "id": "RPdkYzT2_X85"
+      },
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "source": [
+        "#Produce a list of IDs that are most similar to the prompt ID at position 1\n",
+        "#Requires the setup cell (token, LA, NUM_TOKENS, absolute_value) and the tokenizer cell (input_ids) to have been run first\n",
         "\n",
+        "id_A = input_ids[1]\n",
+        "A = token[id_A]\n",
+        "_A = LA.vector_norm(A, ord=2)\n",
+        "#dots[i] will hold the absolute cosine similarity between ID i and id_A\n",
+        "dots = torch.zeros(NUM_TOKENS)\n",
         "\n",
+        "#NOTE(review): the loop bound is the hard-coded NUM_TOKENS - confirm it matches the number of entries in token\n",
+        "for index in range(NUM_TOKENS):\n",
+        "  id_B = index\n",
+        "  B = token[id_B]\n",
+        "  _B = LA.vector_norm(B, ord=2)\n",
         "  result = torch.dot(A,B)/(_A*_B)\n",
+        "  result = absolute_value(result.item())\n",
+        "  dots[index] = result\n",
         "\n",
+        "#Highest similarity first; indices[k] is the ID whose similarity is sorted[k]\n",
+        "#NOTE(review): the name 'sorted' shadows the Python builtin from here on; the display cell below reads sorted and indices\n",
+        "sorted, indices = torch.sort(dots,dim=0 , descending=True)\n",
+        "#----#\n",
+        "print(f'Calculated all cosine-similarities between ID = {id_A} the rest of the IDs as a 1x{sorted.shape[0]} tensor')\n",
+        "print(f'Calculated indices as a 1x{indices.shape[0]} tensor')"
       ],
       "metadata": {
+        "id": "juxsvco9B0iV"
       },
+      "execution_count": null,
       "outputs": []
     },
+    {
+      "cell_type": "code",
+      "source": [
+        "#Print the list_size best matches computed by the previous cell (reads vocab, indices and sorted)\n",
+        "list_size = 10 # @param {type:'number'}\n",
+        "for index in range(list_size):\n",
+        "  #.item() turns the 0-dim tensor into a plain int: tensors hash by identity, so a tensor key never matches a vocab ID\n",
+        "  print(f'{vocab[indices[index].item()]}') # vocab item\n",
+        "  print(f'ID = {indices[index].item()}') # IDs\n",
+        "  print(f'similiarity = {round(sorted[index].item()*100,2)} %') # % value\n",
+        "  print('--------')\n"
+      ],
+      "metadata": {
+        "id": "YIEmLAzbHeuo"
+      },
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "source": [
+        "Find the most similar tokens for a given input"
+      ],
+      "metadata": {
+        "id": "qqZ5DvfLBJnw"
+      }
+    },
     {
       "cell_type": "markdown",
       "source": [