ReflexioAI · yilu331 · Apr 23, 2026 · Apr 23, 2026 · Apr 23, 2026 · Apr 23, 2026
diff --git a/README.md b/README.md
@@ -249,7 +249,7 @@ client.publish_interaction(
 )
 
 # Search profiles
-profiles = client.search_profiles(
+profiles = client.search_user_profiles(
     reflexio.SearchUserProfileRequest(query="deployment region preference")
 )
 

diff --git a/client_dist/README.md b/client_dist/README.md
@@ -98,7 +98,7 @@ print(response.success, response.message)
 
 ```python
 # Semantic search for profiles
-results = client.search_profiles(user_id="user-123", query="password preferences")
+results = client.search_user_profiles(user_id="user-123", query="password preferences")
 for profile in results.profiles:
     print(profile.profile_name, profile.profile_content)
 
@@ -313,7 +313,7 @@ In async contexts (e.g., FastAPI), fire-and-forget uses the existing event loop.
 
 | Method | Description |
 |--------|-------------|
-| `search_profiles()` | Semantic search for profiles |
+| `search_user_profiles()` | Semantic search for profiles |
 | `get_profiles()` | Get profiles for a user |
 | `get_all_profiles()` | Get all profiles across users |
 | `delete_profile()` | Delete profiles by ID or search query |

diff --git a/pyproject.toml b/pyproject.toml
@@ -41,6 +41,10 @@ dependencies = [
     "typer>=0.15.0",
     "rich>=13.0.0",
     "chromadb>=1.5.8",
+    # Cross-encoder reranker + local embedding providers — chromadb may pull
+    # ``sentence-transformers`` transitively, but we depend on it directly
+    # so the CrossEncoder/SentenceTransformer surface is guaranteed.
+    "sentence-transformers>=3.0",
 ]
 
 [project.optional-dependencies]
@@ -79,6 +83,7 @@ dev = [
     "python-semantic-release>=10.0.0",
     "build>=1.0.0",
     "twine>=6.0.0",
+    "polars>=1.40.1",
 ]
 docs = [
     "mkdocs>=1.5.3",
@@ -217,6 +222,18 @@ max-complexity = 20
 quote-style = "double"
 indent-style = "space"
 
+[tool.pyright]
+include = ["reflexio", "tests"]
+exclude = [
+    "reflexio/integrations/langchain",
+    "tests/test_scripts",
+    "**/__pycache__",
+    "**/.venv",
+    "benchmark",
+    "notebooks",
+]
+reportMissingImports = "warning"
+
 [tool.mutmut]
 paths_to_mutate = [
     "reflexio/server/services/service_utils.py",

diff --git a/pyrightconfig.json b/pyrightconfig.json
@@ -1,14 +1,19 @@
 {
-    "include": ["reflexio"],
+    "include": ["reflexio", "tests"],
     "exclude": [
         "reflexio/website", "reflexio/tests", "reflexio/data",
         "reflexio/public_docs", "**/__pycache__",
         "reflexio/reflexio_commons/tests",
         "reflexio/reflexio_client/tests",
-        "reflexio/scripts", "notebooks", "demo"
+        "reflexio/scripts", "notebooks", "demo",
+        "reflexio/integrations/langchain",
+        "tests/test_scripts",
+        "**/.venv",
+        "benchmark"
     ],
     "extraPaths": ["."],
     "pythonVersion": "3.14",
     "typeCheckingMode": "basic",
-    "reportMissingTypeStubs": false
+    "reportMissingTypeStubs": false,
+    "reportMissingImports": "warning"
 }
diff --git a/reflexio/benchmarks/retrieval_latency/backends.py b/reflexio/benchmarks/retrieval_latency/backends.py
@@ -45,7 +45,7 @@ class BackendHandle:
 
     Attributes:
         name (str): Short backend identifier, e.g. ``"sqlite"``.
-        reflexio (Reflexio): Service-layer facade — call ``search_profiles``
+        reflexio (Reflexio): Service-layer facade — call ``search_user_profiles``
             etc. directly on this for the service layer benchmark.
         storage (BaseStorage): Underlying storage instance, needed for
             swapping ``_get_embedding`` during seeding and the timed loop.

diff --git a/reflexio/benchmarks/retrieval_latency/bench.py b/reflexio/benchmarks/retrieval_latency/bench.py
@@ -177,7 +177,7 @@ def _service_call(
     """
     match retrieval:
         case "profile":
-            reflexio.search_profiles(_build_profile_request(query_idx))
+            reflexio.search_user_profiles(_build_profile_request(query_idx))
         case "user_playbook":
             reflexio.search_user_playbooks(_build_user_playbook_request(query_idx))
         case "agent_playbook":
@@ -188,7 +188,7 @@ def _service_call(
 
 # Map retrieval type to (HTTP path, request builder) for the http layer.
 _HTTP_ROUTES: dict[RetrievalType, tuple[str, Callable[[int], Any]]] = {
-    "profile": ("/api/search_profiles", _build_profile_request),
+    "profile": ("/api/search_user_profiles", _build_profile_request),
     "user_playbook": ("/api/search_user_playbooks", _build_user_playbook_request),
     "agent_playbook": ("/api/search_agent_playbooks", _build_agent_playbook_request),
     "unified": ("/api/search", _build_unified_request),