From d7bdeb3ff25f248736d912bc66cbe085d1e07172 Mon Sep 17 00:00:00 2001
From: Martin Aumueller
Date: Thu, 26 Oct 2023 14:58:30 +0200
Subject: [PATCH] Use -1 as default value for build time, indicating that
 index has been loaded from file.

---
 benchmark/plotting/metrics.py | 12 ++++++------
 benchmark/runner.py           |  5 +++--
 data_export.py                |  5 +++--
 3 files changed, 12 insertions(+), 10 deletions(-)

diff --git a/benchmark/plotting/metrics.py b/benchmark/plotting/metrics.py
index 043cb638..697113b1 100644
--- a/benchmark/plotting/metrics.py
+++ b/benchmark/plotting/metrics.py
@@ -95,7 +95,7 @@ def index_size(attrs):
 
 
 def build_time(attrs):
-    return attrs.get("build_time", 1e6)
+    return attrs.get("build_time", -1)
 
 
 def dist_computations(nq, attrs):
@@ -144,11 +144,11 @@ def mean_latency(attrs):
         "function": lambda true_nn, run_nn, metrics, run_attrs: index_size(run_attrs), # noqa
         "worst": float("inf")
     },
-    "queriessize": {
-        "description": "Index size (kB)/Queries per second (s)",
-        "function": lambda true_nn, run_nn, metrics, run_attrs: index_size(run_attrs) / queries_per_second(len(true_nn[0]), run_attrs), # noqa
-        "worst": float("inf")
-    },
+    # "queriessize": {
+    #     "description": "Index size (kB)/Queries per second (s)",
+    #     "function": lambda true_nn, run_nn, metrics, run_attrs: index_size(run_attrs) / queries_per_second(len(true_nn[0]), run_attrs), # noqa
+    #     "worst": float("inf")
+    # },
     "wspq": {
         "description": "Watt seconds per query (watt*s/query)",
         "function": lambda true_nn, run_nn, metrics, run_attrs: watt_seconds_per_query(true_nn, run_attrs),
diff --git a/benchmark/runner.py b/benchmark/runner.py
index 073f1ddb..6cc9a66a 100644
--- a/benchmark/runner.py
+++ b/benchmark/runner.py
@@ -44,6 +44,7 @@ def run(definition, dataset, count, run_count, rebuild,
     distance = ds.distance()
     search_type = ds.search_type()
 
+    build_time = -1 # default value used to indicate that the index was loaded from file
     print(f"Running {definition.algorithm} on {dataset}")
     custom_runner = RUNNERS.get(neurips23track, BaseRunner)
 
@@ -104,8 +105,8 @@ def run(definition, dataset, count, run_count, rebuild,
         else:
             descriptor, results = custom_runner.run_task(
                 algo, ds, distance, count, run_count, search_type, private_query)
-        # A bit unclear how to set this correctly if we usually load from file
-        #descriptor["build_time"] = build_time
+
+        descriptor["build_time"] = build_time
         descriptor["index_size"] = index_size
         descriptor["algo"] = definition.algorithm
         descriptor["dataset"] = dataset
diff --git a/data_export.py b/data_export.py
index 47669eae..39ee6f6a 100644
--- a/data_export.py
+++ b/data_export.py
@@ -103,12 +103,13 @@ def cleaned_run_metric(run_metrics):
             run_metrics = compute_metrics_all_runs(dataset, dataset_name, results, args.recompute, \
                 args.sensors, args.search_times, args.private_query, \
                 neurips23track=track, runbook_path=runbook_path)
-            dfs.append(pd.DataFrame(cleaned_run_metric(run_metrics)))
         else:
             results = load_all_results(dataset_name, neurips23track=track)
             run_metrics = compute_metrics_all_runs(dataset, dataset_name, results, args.recompute, \
                 args.sensors, args.search_times, args.private_query, neurips23track=track)
-            dfs.append(pd.DataFrame(cleaned_run_metric(run_metrics)))
+        results = cleaned_run_metric(run_metrics)
+        if len(results) > 0:
+            dfs.append(pd.DataFrame(results))
     dfs = [e for e in dfs if len(e) > 0]
     if len(dfs) > 0:
         data = pd.concat(dfs)