From 658f2f24fe23ecf1a5bc3dbb70380f919756ab83 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Mihai=20Capot=C4=83?= Date: Thu, 26 Jun 2025 15:56:40 -0700 Subject: [PATCH] Print more stats; print WS_SEARCH as ef --- engine/base_client/client.py | 10 ++++++++++ 1 file changed, 10 insertions(+) diff --git a/engine/base_client/client.py b/engine/base_client/client.py index 4f097bfc..6ccde526 100644 --- a/engine/base_client/client.py +++ b/engine/base_client/client.py @@ -121,6 +121,12 @@ def run_experiment( upload_stats = self.uploader.upload( distance=dataset.config.distance, records=reader.read_data(upload_start_idx,upload_end_idx) ) + memory_usage = upload_stats["memory_usage"] + if (used_memory := memory_usage.get("used_memory")) is not None: + print(f"{used_memory=}") + if (index_info := memory_usage.get("index_info")) is not None: + if (vector_index_sz_mb := index_info.get("vector_index_sz_mb")) is not None: + print(f"{vector_index_sz_mb=}") if not DETAILED_RESULTS: # Remove verbose stats from upload results @@ -157,6 +163,8 @@ def run_experiment( ef = "default" if "search_params" in search_params: ef = search_params["search_params"].get("ef", "default") + if ef == "default": + ef = search_params["search_params"].get("WS_SEARCH", "default") client_count = search_params.get("parallel", 1) # Filter by client count if parallels is specified @@ -186,6 +194,7 @@ def run_experiment( f"Calibrated {top=} {precision=} {calibration_value=} {calibration_precision=!s}" ) searcher.search_params["search_params"][calibration_param] = calibration_value + ef = calibration_value for repetition in range(1, REPETITIONS + 1): print( @@ -195,6 +204,7 @@ def run_experiment( search_stats = searcher.search_all( dataset.config.distance, reader.read_queries(), num_queries ) + print(f"{search_stats['mean_precisions']=!s}, {search_stats['rps']=}") # ensure we specify the client count in the results search_params["parallel"] = client_count if not DETAILED_RESULTS: