add predict proxy virtual service (#1628)

* Add predict proxy virtual service
* Add e2e test for predict proxy endpoint
* Simpler check
nuclia · Nov 30, 2023 · 3c0130a · 3c0130a · github-actions · Nov 30, 2023
1 parent 84cebd9
commit 3c0130a
Show file tree

Hide file tree

Showing 2 changed files with 81 additions and 5 deletions.
diff --git a/charts/nucliadb_search/templates/search.vs.yaml b/charts/nucliadb_search/templates/search.vs.yaml
@@ -34,6 +34,10 @@ spec:
             regex: '^/api/v\d+/kb/[^/]+/summarize$'
           method:
             regex: "POST|OPTIONS"
+        - uri:
+            regex: '^/api/v\d+/kb/[^/]+/predict/.*'
+          method:
+            regex: "GET|POST|OPTIONS"            
         - uri:
             regex: '^/api/v\d+/kb/[^/]+/resource/[^/]+/(chat|find|search|ask)$'
           method:

diff --git a/e2e/test_e2e.py b/e2e/test_e2e.py
@@ -1,11 +1,12 @@
-import pytest
-import requests
+import base64
+import io
+import json
 import os
 import random
 import time
-import io
-import json
-import base64
+
+import pytest
+import requests
 
 BASE_URL = os.environ.get("NUCLIADB_URL", "http://localhost:8080")
 
@@ -149,3 +150,74 @@ def test_search(kbid: str, resource_id: str):
 
     assert "Not enough data to answer this" not in chat_response
     assert len(search_results["resources"]) == 1
+
+
+def test_predict_proxy(kbid: str):
+    """Exercise the predict proxy endpoints of one knowledge box.
+
+    Runs the chat, tokens and rephrase checks, in that order, against the
+    knowledge box identified by ``kbid``. The first failing check aborts
+    the test.
+    """
+    checks = (
+        _test_predict_proxy_chat,
+        _test_predict_proxy_tokens,
+        _test_predict_proxy_rephrase,
+    )
+    for check in checks:
+        check(kbid)
+
+
+def _test_predict_proxy_chat(kbid: str):
+    """Check that the predict proxy ``chat`` endpoint answers from the context.
+
+    Posts a question together with one context paragraph to
+    ``/api/v1/kb/{kbid}/predict/chat`` and asserts that the returned text
+    mentions "Messi".
+
+    Args:
+        kbid: Knowledge box identifier interpolated into the request URL.
+
+    Raises:
+        requests.HTTPError: If the endpoint replies with a 4xx/5xx status.
+        requests.Timeout: If the service stops responding for too long.
+        AssertionError: If the answer does not contain "Messi".
+    """
+    # Build the URL with string formatting: os.path.join is a filesystem
+    # helper and would insert backslashes on Windows. Stripping a trailing
+    # slash keeps the result identical whether or not BASE_URL ends in "/".
+    url = f"{BASE_URL.rstrip('/')}/api/v1/kb/{kbid}/predict/chat"
+    resp = requests.post(
+        url,
+        headers={
+            "content-type": "application/json",
+            "X-NUCLIADB-ROLES": "READER",
+            "x-ndb-client": "web",
+        },
+        json={
+            "question": "Who is the best one?",
+            "query_context": [
+                "Many football players have existed. Cristiano Ronaldo and Messi among them, but Messi is by far the greatest."
+            ],
+            "user_id": "[email protected]",
+        },
+        # Without a timeout requests waits forever on a stalled service.
+        timeout=60,
+    )
+    resp.raise_for_status()
+    # The body is read as raw bytes and decoded explicitly as UTF-8.
+    answer = resp.content.decode("utf-8")
+    assert "Messi" in answer
+
+
+def _test_predict_proxy_tokens(kbid: str):
+    """Check that the predict proxy ``tokens`` endpoint tokenizes a text.
+
+    Sends ``text=Barcelona`` as a query parameter to
+    ``/api/v1/kb/{kbid}/predict/tokens`` and asserts that the first entry of
+    the ``tokens`` list in the JSON response has the text "Barcelona".
+
+    Args:
+        kbid: Knowledge box identifier interpolated into the request URL.
+
+    Raises:
+        requests.HTTPError: If the endpoint replies with a 4xx/5xx status.
+        requests.Timeout: If the service stops responding for too long.
+        AssertionError: If the first token is not "Barcelona".
+    """
+    # Build the URL with string formatting: os.path.join is a filesystem
+    # helper and would insert backslashes on Windows. Stripping a trailing
+    # slash keeps the result identical whether or not BASE_URL ends in "/".
+    url = f"{BASE_URL.rstrip('/')}/api/v1/kb/{kbid}/predict/tokens"
+    resp = requests.get(
+        url,
+        headers={
+            "content-type": "application/json",
+            "X-NUCLIADB-ROLES": "READER",
+            "x-ndb-client": "web",
+        },
+        params={
+            "text": "Barcelona",
+        },
+        # Without a timeout requests waits forever on a stalled service.
+        timeout=60,
+    )
+    resp.raise_for_status()
+    data = resp.json()
+    assert data["tokens"][0]["text"] == "Barcelona"
+
+
+def _test_predict_proxy_rephrase(kbid: str):
+    """Check that the predict proxy ``rephrase`` endpoint succeeds.
+
+    Posts a question plus a two-message conversation context to
+    ``/api/v1/kb/{kbid}/predict/rephrase`` and asserts that the JSON-decoded
+    response ends with the character "0".
+
+    Args:
+        kbid: Knowledge box identifier interpolated into the request URL.
+
+    Raises:
+        requests.HTTPError: If the endpoint replies with a 4xx/5xx status.
+        requests.Timeout: If the service stops responding for too long.
+        AssertionError: If the response does not end with "0".
+    """
+    # Build the URL with string formatting: os.path.join is a filesystem
+    # helper and would insert backslashes on Windows. Stripping a trailing
+    # slash keeps the result identical whether or not BASE_URL ends in "/".
+    url = f"{BASE_URL.rstrip('/')}/api/v1/kb/{kbid}/predict/rephrase"
+    resp = requests.post(
+        url,
+        headers={
+            "content-type": "application/json",
+            "X-NUCLIADB-ROLES": "READER",
+            "x-ndb-client": "web",
+        },
+        json={
+            "question": "Who is the best one?",
+            "context": [
+                {
+                    "author": "NUCLIA",
+                    "text": "Many football players have existed. Cristiano Ronaldo and Messi among them.",
+                },
+                {"author": "USER", "text": "Tell me some football players"},
+            ],
+            "user_id": "[email protected]",
+        },
+        # Without a timeout requests waits forever on a stalled service.
+        timeout=60,
+    )
+    resp.raise_for_status()
+    # The endpoint is expected to return a JSON string here.
+    rephrased_query = resp.json()
+    # Status code 0 means success...
+    assert rephrased_query.endswith("0")