milvus-io
diff --git a/localization/v2.4.x/site/fr/menuStructure/fr.json b/localization/v2.4.x/site/fr/menuStructure/fr.json
Lines changed: 3 additions & 3 deletions
diff --git a/localization/v2.4.x/site/it/menuStructure/it.json b/localization/v2.4.x/site/it/menuStructure/it.json
Lines changed: 2 additions & 2 deletions
diff --git a/localization/v2.4.x/site/pt/menuStructure/pt.json b/localization/v2.4.x/site/pt/menuStructure/pt.json
Lines changed: 2 additions & 2 deletions
diff --git a/localization/v2.4.x/site/zh/menuStructure/zh.json b/localization/v2.4.x/site/zh/menuStructure/zh.json
Lines changed: 1 addition & 1 deletion
diff --git a/localization/v2.5.x/site/de/about/limitations.md b/localization/v2.5.x/site/de/about/limitations.md
Lines changed: 1 addition & 1 deletion
diff --git a/localization/v2.5.x/site/de/adminGuide/limit_collection_counts.md b/localization/v2.5.x/site/de/adminGuide/limit_collection_counts.md
Lines changed: 2 additions & 2 deletions
diff --git a/localization/v2.5.x/site/de/integrations/integrate_with_pytorch.json b/localization/v2.5.x/site/de/integrations/integrate_with_pytorch.json
Lines changed: 1 addition & 1 deletion
diff --git a/localization/v2.5.x/site/de/integrations/integrate_with_pytorch.md b/localization/v2.5.x/site/de/integrations/integrate_with_pytorch.md
Lines changed: 7 additions & 5 deletions
@@ -74,7 +74,7 @@
             "children": []
           },
           {
-            "label": "Exécuter Milvus en mode autonome",
+            "label": "Exécuter Milvus en mode autonome",
             "id": "run_milvus_docker",
             "order": 2,
             "isMenu": true,
@@ -1451,7 +1451,7 @@
             "children": []
           },
           {
-            "label": "PrivateGPT",
+            "label": "PrivateGPT",
             "id": "use_milvus_in_private_gpt.md",
             "order": 10,
             "children": []
@@ -1781,7 +1781,7 @@
         "children": []
       },
       {
-        "label": "FAQ opérationnelles",
+        "label": "FAQ opérationnelle",
         "id": "operational_faq.md",
         "order": 2,
         "children": []
 
@@ -493,7 +493,7 @@
             "children": []
           },
           {
-            "label": "Compattazione dei cluster",
+            "label": "Compattazione del clustering",
             "id": "clustering-compaction.md",
             "order": 8,
             "children": []
@@ -1729,7 +1729,7 @@
             "children": []
           },
           {
-            "label": "Ricerca di somiglianza audio",
+            "label": "Ricerca della somiglianza audio",
             "id": "audio_similarity_search.md",
             "order": 8,
             "children": []
 
@@ -803,7 +803,7 @@
                     "children": []
                   },
                   {
-                    "label": "Azure",
+                    "label": "Azure",
                     "id": "abs.md",
                     "order": 3,
                     "children": []
@@ -1763,7 +1763,7 @@
     ]
   },
   {
-    "label": "FAQs",
+    "label": "Perguntas frequentes",
     "id": "faq",
     "isMenu": true,
     "order": 9,
 
@@ -677,7 +677,7 @@
         "children": []
       },
       {
-        "label": "From Milvus 2.3.x",
+        "label": "来自 Milvus 2.3.x",
         "id": "from-m2x.md",
         "order": 5,
         "children": []
 
@@ -106,7 +106,7 @@ summary: Informieren Sie sich über die Grenzen bei der Verwendung von Milvus.
 <tr><th>Ressource</th><th>Grenze</th></tr>
 </thead>
 <tbody>
-<tr><td>Partition</td><td>4,096</td></tr>
+<tr><td>Partition</td><td>1,024</td></tr>
 <tr><td>Shard</td><td>16</td></tr>
 <tr><td>Feld</td><td>64</td></tr>
 <tr><td>Index</td><td>1</td></tr>
 
@@ -63,10 +63,10 @@ title: Begrenzung der Erfassungsanzahl festlegen
         ></path>
       </svg>
     </button></h2><p>In einer Sammlung können Sie mehrere Shards und Partitionen einrichten. Shards sind logische Einheiten, die verwendet werden, um Datenschreiboperationen auf mehrere Datenknoten zu verteilen. Partitionen sind logische Einheiten, die dazu dienen, die Effizienz der Datenabfrage zu verbessern, indem nur eine Teilmenge der Sammlungsdaten geladen wird. Wenn Sie die Anzahl der Sammlungen in der aktuellen Milvus-Instanz berechnen, müssen Sie auch die Shards und Partitionen zählen.</p>
-<p>Nehmen wir zum Beispiel an, Sie haben bereits <strong>100</strong> Sammlungen angelegt, von denen <strong>60</strong> <strong>mit 2</strong> Shards und <strong>4</strong> Partitionen und die restlichen <strong>40</strong> mit <strong>1</strong> Shard und <strong>12</strong> Partitionen ausgestattet sind. Die aktuelle Anzahl der Sammlungen kann wie folgt berechnet werden:</p>
+<p>Nehmen wir zum Beispiel an, dass Sie bereits <strong>100</strong> Sammlungen erstellt haben, von denen <strong>60</strong> <strong>2</strong> Shards und <strong>4</strong> Partitionen und die restlichen <strong>40</strong> Sammlungen <strong>1</strong> Shard und <strong>12</strong> Partitionen enthalten. Die Gesamtzahl der Sammeleinheiten (berechnet als <code translate="no">shards × partitions</code>) kann wie folgt ermittelt werden:</p>
 <pre><code translate="no">60 (collections) x 2 (shards) x 4 (partitions) + 40 (collections) x 1 (shard) x 12 (partitions) = 960
 <button class="copy-code-btn"></button></code></pre>
-<p>Im obigen Beispiel haben Sie bereits <strong>960</strong> der Standardgrenzen genutzt. Wenn Sie nun eine neue Sammlung mit <strong>4</strong> Shards und <strong>20</strong> Partitionen erstellen möchten, erhalten Sie folgende Fehlermeldung, da die Gesamtzahl der Sammlungen die maximale Kapazität überschreitet:</p>
+<p>In diesem Beispiel entspricht die berechnete Gesamtzahl von 960 Sammeleinheiten der aktuellen Nutzung. Der Parameter <code translate="no">maxGeneralCapacity</code> legt die maximale Anzahl von Sammeleinheiten fest, die eine Instanz unterstützen kann; er ist standardmäßig auf <code translate="no">65536</code> eingestellt. Das bedeutet, dass die Instanz bis zu 65.536 Sammeleinheiten aufnehmen kann. Wenn die Gesamtzahl diese Grenze überschreitet, zeigt das System die folgende Fehlermeldung an:</p>
 <pre><code translate="no" class="language-shell">failed checking constraint: sum_collections(parition*shard) exceeding the <span class="hljs-built_in">max</span> general capacity:
 <button class="copy-code-btn"></button></code></pre>
 <p>Um diesen Fehler zu vermeiden, können Sie entweder die Anzahl der Shards oder Partitionen in bestehenden oder neuen Sammlungen reduzieren, einige Sammlungen löschen oder den Wert <code translate="no">maxGeneralCapacity</code> erhöhen.</p>
@@ -1 +1 @@
-{"codeList":["pip install pymilvus torch gdown torchvision tqdm\n","import gdown\nimport zipfile\n\nurl = 'https://drive.google.com/uc?id=1OYDHLEy992qu5C4C8HV5uDIkOWRTAR1_'\noutput = './paintings.zip'\ngdown.download(url, output)\n\nwith zipfile.ZipFile(\"./paintings.zip\",\"r\") as zip_ref:\n    zip_ref.extractall(\"./paintings\")\n","# Milvus Setup Arguments\nCOLLECTION_NAME = 'image_search'  # Collection name\nDIMENSION = 2048  # Embedding vector size in this example\nMILVUS_HOST = \"localhost\"\nMILVUS_PORT = \"19530\"\n\n# Inference Arguments\nBATCH_SIZE = 128\nTOP_K = 3\n","from pymilvus import connections\n\n# Connect to the instance\nconnections.connect(host=MILVUS_HOST, port=MILVUS_PORT)\n","from pymilvus import utility\n\n# Remove any previous collections with the same name\nif utility.has_collection(COLLECTION_NAME):\n    utility.drop_collection(COLLECTION_NAME)\n","from pymilvus import FieldSchema, CollectionSchema, DataType, Collection\n\n# Create collection which includes the id, filepath of the image, and image embedding\nfields = [\n    FieldSchema(name='id', dtype=DataType.INT64, is_primary=True, auto_id=True),\n    FieldSchema(name='filepath', dtype=DataType.VARCHAR, max_length=200),  # VARCHARS need a maximum length, so for this example they are set to 200 characters\n    FieldSchema(name='image_embedding', dtype=DataType.FLOAT_VECTOR, dim=DIMENSION)\n]\nschema = CollectionSchema(fields=fields)\ncollection = Collection(name=COLLECTION_NAME, schema=schema)\n","# Create an AutoIndex index for collection\nindex_params = {\n'metric_type':'L2',\n'index_type':\"IVF_FLAT\",\n'params':{'nlist': 16384}\n}\ncollection.create_index(field_name=\"image_embedding\", index_params=index_params)\ncollection.load()\n","import glob\n\n# Get the filepaths of the images\npaths = glob.glob('./paintings/paintings/**/*.jpg', recursive=True)\nlen(paths)\n","import torch\n\n# Load the embedding model with the last layer removed\nmodel = 
torch.hub.load('pytorch/vision:v0.10.0', 'resnet50', pretrained=True)\nmodel = torch.nn.Sequential(*(list(model.children())[:-1]))\nmodel.eval()\n","from torchvision import transforms\n\n# Preprocessing for images\npreprocess = transforms.Compose([\n    transforms.Resize(256),\n    transforms.CenterCrop(224),\n    transforms.ToTensor(),\n    transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),\n])\n","from PIL import Image\nfrom tqdm import tqdm\n\n# Embed function that embeds the batch and inserts it\ndef embed(data):\n    with torch.no_grad():\n        output = model(torch.stack(data[0])).squeeze()\n        collection.insert([data[1], output.tolist()])\n\ndata_batch = [[],[]]\n\n# Read the images into batches for embedding and insertion\nfor path in tqdm(paths):\n    im = Image.open(path).convert('RGB')\n    data_batch[0].append(preprocess(im))\n    data_batch[1].append(path)\n    if len(data_batch[0]) % BATCH_SIZE == 0:\n        embed(data_batch)\n        data_batch = [[],[]]\n\n# Embed and insert the remainder\nif len(data_batch[0]) != 0:\n    embed(data_batch)\n\n# Call a flush to index any unsealed segments.\ncollection.flush()\n","import glob\n\n# Get the filepaths of the search images\nsearch_paths = glob.glob('./paintings/test_paintings/**/*.jpg', recursive=True)\nlen(search_paths)\n","import time\nfrom matplotlib import pyplot as plt\n\n# Embed the search images\ndef embed(data):\n    with torch.no_grad():\n        ret = model(torch.stack(data))\n        # If more than one image, use squeeze\n        if len(ret) > 1:\n            return ret.squeeze().tolist()\n        # Squeeze would remove batch for single image, so using flatten\n        else:\n            return torch.flatten(ret, start_dim=1).tolist()\n\ndata_batch = [[],[]]\n\nfor path in search_paths:\n    im = Image.open(path).convert('RGB')\n    data_batch[0].append(preprocess(im))\n    data_batch[1].append(path)\n\nembeds = embed(data_batch[0])\nstart = time.time()\nres = 
collection.search(embeds, anns_field='image_embedding', param={'nprobe': 128}, limit=TOP_K, output_fields=['filepath'])\nfinish = time.time()\n","# Show the image results\nf, axarr = plt.subplots(len(data_batch[1]), TOP_K + 1, figsize=(20, 10), squeeze=False)\n\nfor hits_i, hits in enumerate(res):\n    axarr[hits_i][0].imshow(Image.open(data_batch[1][hits_i]))\n    axarr[hits_i][0].set_axis_off()\n    axarr[hits_i][0].set_title('Search Time: ' + str(finish - start))\n    for hit_i, hit in enumerate(hits):\n        axarr[hits_i][hit_i + 1].imshow(Image.open(hit.entity.get('filepath')))\n        axarr[hits_i][hit_i + 1].set_axis_off()\n        axarr[hits_i][hit_i + 1].set_title('Distance: ' + str(hit.distance))\n\n# Save the search result in a separate image file alongside your script.\nplt.savefig('search_result.png')\n"],"headingContent":"Image Search with Milvus","anchorList":[{"label":"Bildsuche mit Milvus","href":"Image-Search-with-Milvus","type":1,"isActive":false},{"label":"Installieren der Voraussetzungen","href":"Installing-the-requirements","type":2,"isActive":false},{"label":"Erfassen der Daten","href":"Grabbing-the-data","type":2,"isActive":false},{"label":"Globale Argumente","href":"Global-Arguments","type":2,"isActive":false},{"label":"Einrichten von Milvus","href":"Setting-up-Milvus","type":2,"isActive":false},{"label":"Einfügen der Daten","href":"Inserting-the-data","type":2,"isActive":false},{"label":"Durchführen der Suche","href":"Performing-the-search","type":2,"isActive":false}]}
+{"codeList":["pip install pymilvus torch gdown torchvision tqdm\n","import gdown\nimport zipfile\n\nurl = 'https://drive.google.com/uc?id=1OYDHLEy992qu5C4C8HV5uDIkOWRTAR1_'\noutput = './paintings.zip'\ngdown.download(url, output)\n\nwith zipfile.ZipFile(\"./paintings.zip\",\"r\") as zip_ref:\n    zip_ref.extractall(\"./paintings\")\n","# Milvus Setup Arguments\nCOLLECTION_NAME = 'image_search'  # Collection name\nDIMENSION = 2048  # Embedding vector size in this example\nMILVUS_HOST = \"localhost\"\nMILVUS_PORT = \"19530\"\n\n# Inference Arguments\nBATCH_SIZE = 128\nTOP_K = 3\n","from pymilvus import connections\n\n# Connect to the instance\nconnections.connect(host=MILVUS_HOST, port=MILVUS_PORT)\n","from pymilvus import utility\n\n# Remove any previous collections with the same name\nif utility.has_collection(COLLECTION_NAME):\n    utility.drop_collection(COLLECTION_NAME)\n","from pymilvus import FieldSchema, CollectionSchema, DataType, Collection\n\n# Create collection which includes the id, filepath of the image, and image embedding\nfields = [\n    FieldSchema(name='id', dtype=DataType.INT64, is_primary=True, auto_id=True),\n    FieldSchema(name='filepath', dtype=DataType.VARCHAR, max_length=200),  # VARCHARS need a maximum length, so for this example they are set to 200 characters\n    FieldSchema(name='image_embedding', dtype=DataType.FLOAT_VECTOR, dim=DIMENSION)\n]\nschema = CollectionSchema(fields=fields)\ncollection = Collection(name=COLLECTION_NAME, schema=schema)\n","# Create an AutoIndex index for collection\nindex_params = {\n'metric_type':'L2',\n'index_type':\"IVF_FLAT\",\n'params':{'nlist': 16384}\n}\ncollection.create_index(field_name=\"image_embedding\", index_params=index_params)\ncollection.load()\n","import glob\n\n# Get the filepaths of the images\npaths = glob.glob('./paintings/paintings/**/*.jpg', recursive=True)\nlen(paths)\n","import torch\n\n# Load the embedding model with the last layer removed\nmodel = 
torch.hub.load('pytorch/vision:v0.10.0', 'resnet50', pretrained=True)\nmodel = torch.nn.Sequential(*(list(model.children())[:-1]))\nmodel.eval()\n","from torchvision import transforms\n\n# Preprocessing for images\npreprocess = transforms.Compose([\n    transforms.Resize(256),\n    transforms.CenterCrop(224),\n    transforms.ToTensor(),\n    transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),\n])\n","from PIL import Image\nfrom tqdm import tqdm\n\n# Embed function that embeds the batch and inserts it\ndef embed(data):\n    with torch.no_grad():\n        output = model(torch.stack(data[0])).squeeze()\n        collection.insert([data[1], output.tolist()])\n\ndata_batch = [[],[]]\n\n# Read the images into batches for embedding and insertion\nfor path in tqdm(paths):\n    im = Image.open(path).convert('RGB')\n    data_batch[0].append(preprocess(im))\n    data_batch[1].append(path)\n    if len(data_batch[0]) % BATCH_SIZE == 0:\n        embed(data_batch)\n        data_batch = [[],[]]\n\n# Embed and insert the remainder\nif len(data_batch[0]) != 0:\n    embed(data_batch)\n\n# Call a flush to index any unsealed segments.\ncollection.flush()\n","import glob\n\n# Get the filepaths of the search images\nsearch_paths = glob.glob('./paintings/test_paintings/**/*.jpg', recursive=True)\nlen(search_paths)\n","import time\nfrom matplotlib import pyplot as plt\n\n# Embed the search images\ndef embed(data):\n    with torch.no_grad():\n        ret = model(torch.stack(data))\n        # If more than one image, use squeeze\n        if len(ret) > 1:\n            return ret.squeeze().tolist()\n        # Squeeze would remove batch for single image, so using flatten\n        else:\n            return torch.flatten(ret, start_dim=1).tolist()\n\ndata_batch = [[],[]]\n\nfor path in search_paths:\n    im = Image.open(path).convert('RGB')\n    data_batch[0].append(preprocess(im))\n    data_batch[1].append(path)\n\nembeds = embed(data_batch[0])\nstart = time.time()\nres = 
collection.search(embeds, anns_field='image_embedding', param={'nprobe': 128}, limit=TOP_K, output_fields=['filepath'])\nfinish = time.time()\n","# Show the image results\nf, axarr = plt.subplots(len(data_batch[1]), TOP_K + 1, figsize=(20, 10), squeeze=False)\n\nfor hits_i, hits in enumerate(res):\n    axarr[hits_i][0].imshow(Image.open(data_batch[1][hits_i]))\n    axarr[hits_i][0].set_axis_off()\n    axarr[hits_i][0].set_title('Search Time: ' + str(finish - start))\n    for hit_i, hit in enumerate(hits):\n        axarr[hits_i][hit_i + 1].imshow(Image.open(hit.entity.get('filepath')))\n        axarr[hits_i][hit_i + 1].set_axis_off()\n        axarr[hits_i][hit_i + 1].set_title('Distance: ' + str(hit.distance))\n\n# Save the search result in a separate image file alongside your script.\nplt.savefig('search_result.png')\n"],"headingContent":"Image Search with PyTorch and Milvus","anchorList":[{"label":"Bildsuche mit PyTorch und Milvus","href":"Image-Search-with-PyTorch-and-Milvus","type":1,"isActive":false},{"label":"Installieren der Voraussetzungen","href":"Installing-the-requirements","type":2,"isActive":false},{"label":"Erfassen der Daten","href":"Grabbing-the-data","type":2,"isActive":false},{"label":"Globale Argumente","href":"Global-Arguments","type":2,"isActive":false},{"label":"Einrichten von Milvus","href":"Setting-up-Milvus","type":2,"isActive":false},{"label":"Einfügen der Daten","href":"Inserting-the-data","type":2,"isActive":false},{"label":"Durchführen der Suche","href":"Performing-the-search","type":2,"isActive":false}]}
@@ -1,9 +1,11 @@
 ---
 id: integrate_with_pytorch.md
-summary: Diese Seite behandelt die Bildsuche mit Milvus
-title: Bildsuche mit Milvus - Integration
+summary: >-
+  Diese Seite demonstriert, wie man eine Bildsuche mit PyTorch und Milvus
+  erstellt
+title: Bildsuche mit PyTorch und Milvus
 ---
-<h1 id="Image-Search-with-Milvus" class="common-anchor-header">Bildsuche mit Milvus<button data-href="#Image-Search-with-Milvus" class="anchor-icon" translate="no">
+<h1 id="Image-Search-with-PyTorch-and-Milvus" class="common-anchor-header">Bildsuche mit PyTorch und Milvus<button data-href="#Image-Search-with-PyTorch-and-Milvus" class="anchor-icon" translate="no">
       <svg translate="no"
         aria-hidden="true"
         focusable="false"
@@ -18,8 +20,8 @@ title: Bildsuche mit Milvus - Integration
           d="M4 9h1v1H4c-1.5 0-3-1.69-3-3.5S2.55 3 4 3h4c1.45 0 3 1.69 3 3.5 0 1.41-.91 2.72-2 3.25V8.59c.58-.45 1-1.27 1-2.09C10 5.22 8.98 4 8 4H4c-.98 0-2 1.22-2 2.5S3 9 4 9zm9-3h-1v1h1c1 0 2 1.22 2 2.5S13.98 12 13 12H9c-.98 0-2-1.22-2-2.5 0-.83.42-1.64 1-2.09V6.25c-1.09.53-2 1.84-2 3.25C6 11.31 7.55 13 9 13h4c1.45 0 3-1.69 3-3.5S14.5 6 13 6z"
         ></path>
       </svg>
-    </button></h1><p>Auf dieser Seite werden wir ein einfaches Beispiel für eine Bildsuche mit Milvus durchgehen. Der Datensatz, den wir durchsuchen, ist der Impressionist-Classifier-Datensatz, der auf <a href="https://www.kaggle.com/datasets/delayedkarma/impressionist-classifier-data">Kaggle</a> zu finden ist. Für dieses Beispiel haben wir die Daten in einem öffentlichen Google Drive gehostet.</p>
-<p>Für dieses Beispiel verwenden wir nur das von Torchvision trainierte Resnet50-Modell für Einbettungen. Los geht's!</p>
+    </button></h1><p>In dieser Anleitung wird ein Beispiel für die Integration von PyTorch und Milvus vorgestellt, um eine Bildsuche mit Einbettungen durchzuführen. PyTorch ist ein leistungsfähiges Open-Source-Framework für Deep Learning, das häufig für die Erstellung und den Einsatz von Machine-Learning-Modellen verwendet wird. In diesem Beispiel nutzen wir die Torchvision-Bibliothek und ein vorab trainiertes ResNet50-Modell, um Merkmalsvektoren (Einbettungen) zu erzeugen, die Bildinhalte darstellen. Diese Einbettungen werden in Milvus, einer leistungsstarken Vektordatenbank, gespeichert, um eine effiziente Ähnlichkeitssuche zu ermöglichen. Der verwendete Datensatz ist der Impressionist-Classifier-Datensatz von <a href="https://www.kaggle.com/datasets/delayedkarma/impressionist-classifier-data">Kaggle</a>. Durch die Kombination der Deep-Learning-Fähigkeiten von PyTorch mit den skalierbaren Suchfunktionen von Milvus zeigt dieses Beispiel, wie man ein robustes und effizientes Bildabfragesystem aufbauen kann.</p>
+<p>Los geht's!</p>
 <h2 id="Installing-the-requirements" class="common-anchor-header">Installieren der Voraussetzungen<button data-href="#Installing-the-requirements" class="anchor-icon" translate="no">
       <svg translate="no"
         aria-hidden="true"
Original file line number	Diff line number	Diff line change
`@@ -803,7 +803,7 @@`
`803`	`803`	`"children": []`
`804`	`804`	`},`
`805`	`805`	`{`
`806`		`- "label": "Azure",`
	`806`	`+ "label": "Azure",`
`807`	`807`	`"id": "abs.md",`
`808`	`808`	`"order": 3,`
`809`	`809`	`"children": []`
`@@ -1763,7 +1763,7 @@`
`1763`	`1763`	`]`
`1764`	`1764`	`},`
`1765`	`1765`	`{`
`1766`		`- "label": "FAQs",`
	`1766`	`+ "label": "Perguntas frequentes",`
`1767`	`1767`	`"id": "faq",`
`1768`	`1768`	`"isMenu": true,`
`1769`	`1769`	`"order": 9,`
Original file line number	Diff line number	Diff line change
`@@ -677,7 +677,7 @@`
`677`	`677`	`"children": []`
`678`	`678`	`},`
`679`	`679`	`{`
`680`		`- "label": "From Milvus 2.3.x",`
	`680`	`+ "label": "来自 Milvus 2.3.x",`
`681`	`681`	`"id": "from-m2x.md",`
`682`	`682`	`"order": 5,`
`683`	`683`	`"children": []`
Original file line number	Diff line number	Diff line change
`@@ -1 +1 @@`
`1`		-{"codeList":["pip install pymilvus torch gdown torchvision tqdm\n","import gdown\nimport zipfile\n\nurl = 'https://drive.google.com/uc?id=1OYDHLEy992qu5C4C8HV5uDIkOWRTAR1_'\noutput = './paintings.zip'\ngdown.download(url, output)\n\nwith zipfile.ZipFile(\"./paintings.zip\",\"r\") as zip_ref:\n    zip_ref.extractall(\"./paintings\")\n","# Milvus Setup Arguments\nCOLLECTION_NAME = 'image_search'  # Collection name\nDIMENSION = 2048  # Embedding vector size in this example\nMILVUS_HOST = \"localhost\"\nMILVUS_PORT = \"19530\"\n\n# Inference Arguments\nBATCH_SIZE = 128\nTOP_K = 3\n","from pymilvus import connections\n\n# Connect to the instance\nconnections.connect(host=MILVUS_HOST, port=MILVUS_PORT)\n","from pymilvus import utility\n\n# Remove any previous collections with the same name\nif utility.has_collection(COLLECTION_NAME):\n    utility.drop_collection(COLLECTION_NAME)\n","from pymilvus import FieldSchema, CollectionSchema, DataType, Collection\n\n# Create collection which includes the id, filepath of the image, and image embedding\nfields = [\n    FieldSchema(name='id', dtype=DataType.INT64, is_primary=True, auto_id=True),\n    FieldSchema(name='filepath', dtype=DataType.VARCHAR, max_length=200),  # VARCHARS need a maximum length, so for this example they are set to 200 characters\n    FieldSchema(name='image_embedding', dtype=DataType.FLOAT_VECTOR, dim=DIMENSION)\n]\nschema = CollectionSchema(fields=fields)\ncollection = Collection(name=COLLECTION_NAME, schema=schema)\n","# Create an AutoIndex index for collection\nindex_params = {\n'metric_type':'L2',\n'index_type':\"IVF_FLAT\",\n'params':{'nlist': 16384}\n}\ncollection.create_index(field_name=\"image_embedding\", index_params=index_params)\ncollection.load()\n","import glob\n\n# Get the filepaths of the images\npaths = glob.glob('./paintings/paintings/**/*.jpg', recursive=True)\nlen(paths)\n","import torch\n\n# Load the embedding model with the last layer removed\nmodel = 
torch.hub.load('pytorch/vision:v0.10.0', 'resnet50', pretrained=True)\nmodel = torch.nn.Sequential(*(list(model.children())[:-1]))\nmodel.eval()\n","from torchvision import transforms\n\n# Preprocessing for images\npreprocess = transforms.Compose([\n    transforms.Resize(256),\n    transforms.CenterCrop(224),\n    transforms.ToTensor(),\n    transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),\n])\n","from PIL import Image\nfrom tqdm import tqdm\n\n# Embed function that embeds the batch and inserts it\ndef embed(data):\n    with torch.no_grad():\n        output = model(torch.stack(data[0])).squeeze()\n        collection.insert([data[1], output.tolist()])\n\ndata_batch = [[],[]]\n\n# Read the images into batches for embedding and insertion\nfor path in tqdm(paths):\n    im = Image.open(path).convert('RGB')\n    data_batch[0].append(preprocess(im))\n    data_batch[1].append(path)\n    if len(data_batch[0]) % BATCH_SIZE == 0:\n        embed(data_batch)\n        data_batch = [[],[]]\n\n# Embed and insert the remainder\nif len(data_batch[0]) != 0:\n    embed(data_batch)\n\n# Call a flush to index any unsealed segments.\ncollection.flush()\n","import glob\n\n# Get the filepaths of the search images\nsearch_paths = glob.glob('./paintings/test_paintings/**/*.jpg', recursive=True)\nlen(search_paths)\n","import time\nfrom matplotlib import pyplot as plt\n\n# Embed the search images\ndef embed(data):\n    with torch.no_grad():\n        ret = model(torch.stack(data))\n        # If more than one image, use squeeze\n        if len(ret) > 1:\n            return ret.squeeze().tolist()\n        # Squeeze would remove batch for single image, so using flatten\n        else:\n            return torch.flatten(ret, start_dim=1).tolist()\n\ndata_batch = [[],[]]\n\nfor path in search_paths:\n    im = Image.open(path).convert('RGB')\n    data_batch[0].append(preprocess(im))\n    data_batch[1].append(path)\n\nembeds = embed(data_batch[0])\nstart = time.time()\nres = 
collection.search(embeds, anns_field='image_embedding', param={'nprobe': 128}, limit=TOP_K, output_fields=['filepath'])\nfinish = time.time()\n","# Show the image results\nf, axarr = plt.subplots(len(data_batch[1]), TOP_K + 1, figsize=(20, 10), squeeze=False)\n\nfor hits_i, hits in enumerate(res):\n    axarr[hits_i][0].imshow(Image.open(data_batch[1][hits_i]))\n    axarr[hits_i][0].set_axis_off()\n    axarr[hits_i][0].set_title('Search Time: ' + str(finish - start))\n    for hit_i, hit in enumerate(hits):\n        axarr[hits_i][hit_i + 1].imshow(Image.open(hit.entity.get('filepath')))\n        axarr[hits_i][hit_i + 1].set_axis_off()\n        axarr[hits_i][hit_i + 1].set_title('Distance: ' + str(hit.distance))\n\n# Save the search result in a separate image file alongside your script.\nplt.savefig('search_result.png')\n"],"headingContent":"Image Search with Milvus","anchorList":[{"label":"Bildsuche mit Milvus","href":"Image-Search-with-Milvus","type":1,"isActive":false},{"label":"Installieren der Voraussetzungen","href":"Installing-the-requirements","type":2,"isActive":false},{"label":"Erfassen der Daten","href":"Grabbing-the-data","type":2,"isActive":false},{"label":"Globale Argumente","href":"Global-Arguments","type":2,"isActive":false},{"label":"Einrichten von Milvus","href":"Setting-up-Milvus","type":2,"isActive":false},{"label":"Einfügen der Daten","href":"Inserting-the-data","type":2,"isActive":false},{"label":"Durchführen der Suche","href":"Performing-the-search","type":2,"isActive":false}]}
	`1`	+{"codeList":["pip install pymilvus torch gdown torchvision tqdm\n","import gdown\nimport zipfile\n\nurl = 'https://drive.google.com/uc?id=1OYDHLEy992qu5C4C8HV5uDIkOWRTAR1_'\noutput = './paintings.zip'\ngdown.download(url, output)\n\nwith zipfile.ZipFile(\"./paintings.zip\",\"r\") as zip_ref:\n    zip_ref.extractall(\"./paintings\")\n","# Milvus Setup Arguments\nCOLLECTION_NAME = 'image_search'  # Collection name\nDIMENSION = 2048  # Embedding vector size in this example\nMILVUS_HOST = \"localhost\"\nMILVUS_PORT = \"19530\"\n\n# Inference Arguments\nBATCH_SIZE = 128\nTOP_K = 3\n","from pymilvus import connections\n\n# Connect to the instance\nconnections.connect(host=MILVUS_HOST, port=MILVUS_PORT)\n","from pymilvus import utility\n\n# Remove any previous collections with the same name\nif utility.has_collection(COLLECTION_NAME):\n    utility.drop_collection(COLLECTION_NAME)\n","from pymilvus import FieldSchema, CollectionSchema, DataType, Collection\n\n# Create collection which includes the id, filepath of the image, and image embedding\nfields = [\n    FieldSchema(name='id', dtype=DataType.INT64, is_primary=True, auto_id=True),\n    FieldSchema(name='filepath', dtype=DataType.VARCHAR, max_length=200),  # VARCHARS need a maximum length, so for this example they are set to 200 characters\n    FieldSchema(name='image_embedding', dtype=DataType.FLOAT_VECTOR, dim=DIMENSION)\n]\nschema = CollectionSchema(fields=fields)\ncollection = Collection(name=COLLECTION_NAME, schema=schema)\n","# Create an AutoIndex index for collection\nindex_params = {\n'metric_type':'L2',\n'index_type':\"IVF_FLAT\",\n'params':{'nlist': 16384}\n}\ncollection.create_index(field_name=\"image_embedding\", index_params=index_params)\ncollection.load()\n","import glob\n\n# Get the filepaths of the images\npaths = glob.glob('./paintings/paintings/**/*.jpg', recursive=True)\nlen(paths)\n","import torch\n\n# Load the embedding model with the last layer removed\nmodel = 
torch.hub.load('pytorch/vision:v0.10.0', 'resnet50', pretrained=True)\nmodel = torch.nn.Sequential(*(list(model.children())[:-1]))\nmodel.eval()\n","from torchvision import transforms\n\n# Preprocessing for images\npreprocess = transforms.Compose([\n    transforms.Resize(256),\n    transforms.CenterCrop(224),\n    transforms.ToTensor(),\n    transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),\n])\n","from PIL import Image\nfrom tqdm import tqdm\n\n# Embed function that embeds the batch and inserts it\ndef embed(data):\n    with torch.no_grad():\n        output = model(torch.stack(data[0])).squeeze()\n        collection.insert([data[1], output.tolist()])\n\ndata_batch = [[],[]]\n\n# Read the images into batches for embedding and insertion\nfor path in tqdm(paths):\n    im = Image.open(path).convert('RGB')\n    data_batch[0].append(preprocess(im))\n    data_batch[1].append(path)\n    if len(data_batch[0]) % BATCH_SIZE == 0:\n        embed(data_batch)\n        data_batch = [[],[]]\n\n# Embed and insert the remainder\nif len(data_batch[0]) != 0:\n    embed(data_batch)\n\n# Call a flush to index any unsealed segments.\ncollection.flush()\n","import glob\n\n# Get the filepaths of the search images\nsearch_paths = glob.glob('./paintings/test_paintings/**/*.jpg', recursive=True)\nlen(search_paths)\n","import time\nfrom matplotlib import pyplot as plt\n\n# Embed the search images\ndef embed(data):\n    with torch.no_grad():\n        ret = model(torch.stack(data))\n        # If more than one image, use squeeze\n        if len(ret) > 1:\n            return ret.squeeze().tolist()\n        # Squeeze would remove batch for single image, so using flatten\n        else:\n            return torch.flatten(ret, start_dim=1).tolist()\n\ndata_batch = [[],[]]\n\nfor path in search_paths:\n    im = Image.open(path).convert('RGB')\n    data_batch[0].append(preprocess(im))\n    data_batch[1].append(path)\n\nembeds = embed(data_batch[0])\nstart = time.time()\nres = 
collection.search(embeds, anns_field='image_embedding', param={'nprobe': 128}, limit=TOP_K, output_fields=['filepath'])\nfinish = time.time()\n","# Show the image results\nf, axarr = plt.subplots(len(data_batch[1]), TOP_K + 1, figsize=(20, 10), squeeze=False)\n\nfor hits_i, hits in enumerate(res):\n    axarr[hits_i][0].imshow(Image.open(data_batch[1][hits_i]))\n    axarr[hits_i][0].set_axis_off()\n    axarr[hits_i][0].set_title('Search Time: ' + str(finish - start))\n    for hit_i, hit in enumerate(hits):\n        axarr[hits_i][hit_i + 1].imshow(Image.open(hit.entity.get('filepath')))\n        axarr[hits_i][hit_i + 1].set_axis_off()\n        axarr[hits_i][hit_i + 1].set_title('Distance: ' + str(hit.distance))\n\n# Save the search result in a separate image file alongside your script.\nplt.savefig('search_result.png')\n"],"headingContent":"Image Search with PyTorch and Milvus","anchorList":[{"label":"Bildsuche mit PyTorch und Milvus","href":"Image-Search-with-PyTorch-and-Milvus","type":1,"isActive":false},{"label":"Installieren der Voraussetzungen","href":"Installing-the-requirements","type":2,"isActive":false},{"label":"Erfassen der Daten","href":"Grabbing-the-data","type":2,"isActive":false},{"label":"Globale Argumente","href":"Global-Arguments","type":2,"isActive":false},{"label":"Einrichten von Milvus","href":"Setting-up-Milvus","type":2,"isActive":false},{"label":"Einfügen der Daten","href":"Inserting-the-data","type":2,"isActive":false},{"label":"Durchführen der Suche","href":"Performing-the-search","type":2,"isActive":false}]}