
Commit

Merge branch 'master' into thomasht86/wip-version-arg-to-deploy
thomasht86 authored Nov 21, 2024
2 parents 5301a65 + b38751d commit 80aa44a
Showing 5 changed files with 69 additions and 53 deletions.
7 changes: 4 additions & 3 deletions .github/workflows/release-vespacli.yml
@@ -37,7 +37,6 @@ jobs:
# Set the output variable
echo "version=$version" >> $GITHUB_OUTPUT
check-and-update:
runs-on: ubuntu-latest
# Only run if we have a new version
@@ -74,7 +73,6 @@ jobs:
name: binaries
path: vespacli/vespacli/go-binaries


test:
runs-on: ${{ matrix.os }}
# Only run if we have a new version
@@ -86,7 +84,8 @@
VERSION: ${{ needs.prepare.outputs.version }}
strategy:
matrix:
os: [ubuntu-24.04, ubuntu-latest, windows-latest, macos-13, macos-latest]
os:
[ubuntu-24.04, ubuntu-latest, windows-latest, macos-13, macos-latest]
python-version: ["3.10", "3.11", "3.12"]
steps:
- uses: actions/checkout@v4
@@ -114,6 +113,7 @@ jobs:
- name: Update latest version
run: |
python utils/update_version.py --version "${VERSION}"
shell: bash

- name: Install dependencies
run: |
@@ -178,3 +178,4 @@ jobs:
uses: pypa/gh-action-pypi-publish@release/v1
with:
print-hash: true
packages-dir: vespacli/dist/
@@ -1265,14 +1265,13 @@
},
{
"cell_type": "code",
"execution_count": 41,
"execution_count": null,
"id": "5b7acbb6",
"metadata": {
"id": "5b7acbb6"
},
"outputs": [],
"source": [
"# Define the Vespa schema\n",
"colpali_schema = Schema(\n",
" name=VESPA_SCHEMA_NAME,\n",
" document=Document(\n",
@@ -1293,9 +1292,7 @@
" index=\"enable-bm25\",\n",
" ),\n",
" Field(name=\"page_number\", type=\"int\", indexing=[\"summary\", \"attribute\"]),\n",
" Field(\n",
" name=\"blur_image\", type=\"raw\", indexing=[\"summary\"]\n",
" ), # We store the images as base64-encoded strings\n",
" Field(name=\"blur_image\", type=\"raw\", indexing=[\"summary\"]),\n",
" Field(name=\"full_image\", type=\"raw\", indexing=[\"summary\"]),\n",
" Field(\n",
" name=\"text\",\n",
@@ -1305,31 +1302,29 @@
" index=\"enable-bm25\",\n",
" ),\n",
" Field(\n",
" name=\"embedding\", # The page image embeddings are stored as binary tensors (represented by signed 8-bit integers)\n",
" name=\"embedding\",\n",
" type=\"tensor<int8>(patch{}, v[16])\",\n",
" indexing=[\n",
" \"attribute\",\n",
" \"index\",\n",
" ],\n",
" ann=HNSW( # Since we are using binary embeddings, we use the HNSW algorithm with Hamming distance as the metric, which is highly efficient in Vespa, see https://blog.vespa.ai/scaling-colpali-to-billions/\n",
" ann=HNSW(\n",
" distance_metric=\"hamming\",\n",
" max_links_per_node=32,\n",
" neighbors_to_explore_at_insert=400,\n",
" ),\n",
" ),\n",
" Field(\n",
" name=\"questions\", # We store the generated questions and queries as arrays of strings for each document\n",
" name=\"questions\",\n",
" type=\"array<string>\",\n",
" indexing=[\"summary\", \"index\", \"attribute\"],\n",
" index=\"enable-bm25\",\n",
" stemming=\"best\",\n",
" indexing=[\"summary\", \"attribute\"],\n",
" summary=Summary(fields=[\"matched-elements-only\"]),\n",
" ),\n",
" Field(\n",
" name=\"queries\",\n",
" type=\"array<string>\",\n",
" indexing=[\"summary\", \"index\", \"attribute\"],\n",
" index=\"enable-bm25\",\n",
" stemming=\"best\",\n",
" indexing=[\"summary\", \"attribute\"],\n",
" summary=Summary(fields=[\"matched-elements-only\"]),\n",
" ),\n",
" ]\n",
" ),\n",
@@ -1389,7 +1384,7 @@
"]\n",
"\n",
"# Define the 'bm25' rank profile\n",
"colpali_bm25_profile = RankProfile(\n",
"bm25 = RankProfile(\n",
" name=\"bm25\",\n",
" inputs=[(\"query(qt)\", \"tensor<float>(querytoken{}, v[128])\")],\n",
" first_phase=\"bm25(title) + bm25(text)\",\n",
@@ -1407,14 +1402,27 @@
" )\n",
"\n",
"\n",
"colpali_schema.add_rank_profile(colpali_bm25_profile)\n",
"colpali_schema.add_rank_profile(with_quantized_similarity(colpali_bm25_profile))\n",
"colpali_schema.add_rank_profile(bm25)\n",
"colpali_schema.add_rank_profile(with_quantized_similarity(bm25))\n",
"\n",
"# Update the 'default' rank profile\n",
"colpali_profile = RankProfile(\n",
" name=\"default\",\n",
" inputs=[(\"query(qt)\", \"tensor<float>(querytoken{}, v[128])\")],\n",
" first_phase=\"bm25_score\",\n",
"\n",
"# Update the 'colpali' rank profile\n",
"input_query_tensors = []\n",
"MAX_QUERY_TERMS = 64\n",
"for i in range(MAX_QUERY_TERMS):\n",
" input_query_tensors.append((f\"query(rq{i})\", \"tensor<int8>(v[16])\"))\n",
"\n",
"input_query_tensors.extend(\n",
" [\n",
" (\"query(qt)\", \"tensor<float>(querytoken{}, v[128])\"),\n",
" (\"query(qtb)\", \"tensor<int8>(querytoken{}, v[16])\"),\n",
" ]\n",
")\n",
"\n",
"colpali = RankProfile(\n",
" name=\"colpali\",\n",
" inputs=input_query_tensors,\n",
" first_phase=\"max_sim_binary\",\n",
" second_phase=SecondPhaseRanking(expression=\"max_sim\", rerank_count=10),\n",
" functions=mapfunctions\n",
" + [\n",
@@ -1432,30 +1440,33 @@
" )\n",
" \"\"\",\n",
" ),\n",
" Function(name=\"bm25_score\", expression=\"bm25(title) + bm25(text)\"),\n",
" Function(\n",
" name=\"max_sim_binary\",\n",
" expression=\"\"\"\n",
" sum(\n",
" reduce(\n",
" 1 / (1 + sum(\n",
" hamming(query(qtb), attribute(embedding)), v)\n",
" ),\n",
" max, patch\n",
" ),\n",
" querytoken\n",
" )\n",
" \"\"\",\n",
" ),\n",
" ],\n",
")\n",
"colpali_schema.add_rank_profile(colpali_profile)\n",
"colpali_schema.add_rank_profile(with_quantized_similarity(colpali_profile))\n",
"\n",
"# Update the 'retrieval-and-rerank' rank profile\n",
"input_query_tensors = []\n",
"MAX_QUERY_TERMS = 64\n",
"for i in range(MAX_QUERY_TERMS):\n",
" input_query_tensors.append((f\"query(rq{i})\", \"tensor<int8>(v[16])\"))\n",
"\n",
"input_query_tensors.extend(\n",
" [\n",
" (\"query(qt)\", \"tensor<float>(querytoken{}, v[128])\"),\n",
" (\"query(qtb)\", \"tensor<int8>(querytoken{}, v[16])\"),\n",
" ]\n",
")\n",
"colpali_schema.add_rank_profile(colpali)\n",
"colpali_schema.add_rank_profile(with_quantized_similarity(colpali))\n",
"\n",
"colpali_retrieval_profile = RankProfile(\n",
" name=\"retrieval-and-rerank\",\n",
"# Update the 'hybrid' rank profile\n",
"hybrid = RankProfile(\n",
" name=\"hybrid\",\n",
" inputs=input_query_tensors,\n",
" first_phase=\"max_sim_binary\",\n",
" second_phase=SecondPhaseRanking(expression=\"max_sim\", rerank_count=10),\n",
" second_phase=SecondPhaseRanking(\n",
" expression=\"max_sim + 2 * (bm25(text) + bm25(title))\", rerank_count=10\n",
" ),\n",
" functions=mapfunctions\n",
" + [\n",
" Function(\n",
@@ -1488,8 +1499,8 @@
" ),\n",
" ],\n",
")\n",
"colpali_schema.add_rank_profile(colpali_retrieval_profile)\n",
"colpali_schema.add_rank_profile(with_quantized_similarity(colpali_retrieval_profile))"
"colpali_schema.add_rank_profile(hybrid)\n",
"colpali_schema.add_rank_profile(with_quantized_similarity(hybrid))"
]
},
{
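For context on the notebook changes above — the rank profiles are renamed to bm25, colpali, and hybrid, the former retrieval-and-rerank profile becomes hybrid with a bm25-boosted second phase, and the nearestNeighbor query tensors now precede the colpali profile — a query against the new hybrid profile would look roughly like the sketch below. This is not part of the commit: app, VESPA_SCHEMA_NAME, the token count, and the randomly generated embeddings are placeholders standing in for a connected pyvespa application and real ColPali query embeddings.

# Minimal sketch (not part of this commit): querying the "hybrid" rank profile.
# `app` is assumed to be a connected vespa.application.Vespa instance; the
# embeddings below are random placeholders for ColPali query vectors.
import numpy as np

VESPA_SCHEMA_NAME = "pdf_page"  # placeholder schema name
num_tokens = 4                  # real queries have one vector per query token

float_embeddings = {str(i): np.random.rand(128).tolist() for i in range(num_tokens)}
binary_embeddings = {
    str(i): np.random.randint(-128, 128, size=16).tolist() for i in range(num_tokens)
}

# One nearestNeighbor operator per binary query-token tensor (query(rq0), query(rq1), ...)
nn = " OR ".join(
    f"({{targetHits:20}}nearestNeighbor(embedding, rq{i}))" for i in range(num_tokens)
)

body = {
    "yql": f"select * from {VESPA_SCHEMA_NAME} where {nn}",
    "ranking": "hybrid",
    "hits": 5,
    "input.query(qt)": float_embeddings,
    "input.query(qtb)": binary_embeddings,
}
for i in range(num_tokens):
    body[f"input.query(rq{i})"] = binary_embeddings[str(i)]

response = app.query(body=body)

The nearestNeighbor operators retrieve candidates by Hamming distance over the binary patch embeddings, first-phase max_sim_binary scores them, and the second phase reranks with max_sim + 2 * (bm25(text) + bm25(title)), as defined in the diff.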
7 changes: 6 additions & 1 deletion vespacli/utils/update_version.py
@@ -1,12 +1,12 @@
# This script should modify top level pyproject.toml to update the version of vespacli
# And modify vespacli/_version_generated.py to update the version of vespacli

import toml
import sys
from pathlib import Path
import argparse

PYPROJECT_TOML_PATH = Path(__file__).parent.parent / "pyproject.toml"
VERSION_FILE_PATH = Path(__file__).parent.parent / "vespacli" / "_version_generated.py"


def update_version(new_version: str):
@@ -17,6 +17,11 @@ def update_version(new_version: str):
with open("pyproject.toml", "w") as f:
toml.dump(data, f)

# Also update version in vespacli/_version_generated.py
with open(VERSION_FILE_PATH, "w") as f:
# Write comment about auto-generation
f.write("# This file is auto-generated by utils/update_version.py\n")
f.write(f'__version__ = "{new_version}"\n')
print(f"Updated version to {new_version}")


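Putting the hunks above together, utils/update_version.py now writes the version to both pyproject.toml and vespacli/_version_generated.py. The sketch below assembles the visible fragments; the TOML read and key path (assumed to be project.version) and the argparse entry point are not shown in the diff and are assumptions inferred from the workflow's `python utils/update_version.py --version "${VERSION}"` step.

# Sketch (not part of the commit) of utils/update_version.py assembled from the
# hunks above; the TOML key path and the argparse entry point are assumptions.
import argparse
from pathlib import Path

import toml

PYPROJECT_TOML_PATH = Path(__file__).parent.parent / "pyproject.toml"
VERSION_FILE_PATH = Path(__file__).parent.parent / "vespacli" / "_version_generated.py"


def update_version(new_version: str):
    # Update the version field in pyproject.toml (key path assumed)
    with open("pyproject.toml") as f:
        data = toml.load(f)
    data["project"]["version"] = new_version
    with open("pyproject.toml", "w") as f:
        toml.dump(data, f)

    # Also update version in vespacli/_version_generated.py
    with open(VERSION_FILE_PATH, "w") as f:
        # Write comment about auto-generation
        f.write("# This file is auto-generated by utils/update_version.py\n")
        f.write(f'__version__ = "{new_version}"\n')
    print(f"Updated version to {new_version}")


if __name__ == "__main__":
    parser = argparse.ArgumentParser()
    parser.add_argument("--version", required=True)
    args = parser.parse_args()
    update_version(args.version)

The release workflow runs this step with shell: bash (added in this commit), so the same invocation also works on the Windows runners in the test matrix.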
9 changes: 3 additions & 6 deletions vespacli/vespacli/__init__.py
@@ -1,9 +1,10 @@
import os
import sys
import platform
import subprocess
import sys
from ._version_generated import __version__

from vespacli._version_generated import vespa_version
vespa_version = __version__


def get_binary_path():
@@ -26,7 +27,6 @@ def get_binary_path():
binary_dir_name = f"vespa-cli_{vespa_version}_{os_name}_{arch}"
binary_path = os.path.join(go_binaries_path, binary_dir_name, "bin")

# Assuming the executable name is consistent and known
executable_name = "vespa" if os_name != "windows" else "vespa.exe"
full_executable_path = os.path.join(binary_path, executable_name)

@@ -42,6 +42,3 @@ def run_vespa_cli():
full_cmd = [binary_path, *args]
_result = subprocess.run(full_cmd)
return


__version__ = vespa_version
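
The __init__.py diff replaces the old vespa_version import with the auto-generated __version__ and drops the trailing re-export. Filling in the parts the hunks elide, binary resolution works roughly as in the sketch below; the OS/architecture mapping, the go-binaries directory lookup, and the error handling are illustrative assumptions, while the lines that appear in the diff are kept as shown.

# Sketch (not part of the commit) of how vespacli/__init__.py resolves the
# bundled Go binary; the platform/arch mapping and error handling are assumed.
import os
import platform
import subprocess
import sys

from ._version_generated import __version__

vespa_version = __version__


def get_binary_path():
    # Binaries are unpacked under vespacli/go-binaries by the release workflow (assumed)
    go_binaries_path = os.path.join(os.path.dirname(__file__), "go-binaries")
    os_name = platform.system().lower()  # e.g. "linux", "darwin", "windows"
    arch = {"x86_64": "amd64", "amd64": "amd64", "arm64": "arm64", "aarch64": "arm64"}.get(
        platform.machine().lower(), platform.machine().lower()
    )

    binary_dir_name = f"vespa-cli_{vespa_version}_{os_name}_{arch}"
    binary_path = os.path.join(go_binaries_path, binary_dir_name, "bin")

    executable_name = "vespa" if os_name != "windows" else "vespa.exe"
    full_executable_path = os.path.join(binary_path, executable_name)
    if not os.path.exists(full_executable_path):
        raise FileNotFoundError(f"Vespa CLI binary not found at {full_executable_path}")
    return full_executable_path


def run_vespa_cli():
    binary_path = get_binary_path()
    args = sys.argv[1:]
    full_cmd = [binary_path, *args]
    _result = subprocess.run(full_cmd)
    return

run_vespa_cli simply forwards the process arguments to the bundled platform-specific vespa binary.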
2 changes: 2 additions & 0 deletions vespacli/vespacli/_version_generated.py
@@ -0,0 +1,2 @@
# This file is auto-generated by utils/update_version.py
__version__ = "8.dev"
