Skip to content

Commit

Permalink
add helper functions and tests
Browse files Browse the repository at this point in the history
Signed-off-by: Bangtian Liu <[email protected]>
  • Loading branch information
bangtianliu committed Jan 9, 2025
1 parent 4b2165c commit 9593df8
Show file tree
Hide file tree
Showing 2 changed files with 84 additions and 2 deletions.
46 changes: 46 additions & 0 deletions tuner/tuner/libtuner.py
Original file line number Diff line number Diff line change
Expand Up @@ -216,6 +216,52 @@ def validate_devices(user_devices: list[str]) -> None:
)


def validate_benchmark_results(
benchmark_results: list[BenchmarkResult],
) -> list[BenchmarkResult]:
filtered_benchmark_results = [r for r in benchmark_results if math.isfinite(r.time)]
if len(filtered_benchmark_results) == 0:
logging.error("No successful candidate benchmarks.")

return filtered_benchmark_results


def map_baseline_by_device(baseline_results: list[BenchmarkResult]) -> dict[str, float]:
return {r.device_id: r.time for r in baseline_results}


def validate_baselines_device_ids_match(
first_baseline_by_device: dict[str, float],
second_baseline_by_device: dict[str, float],
) -> bool:
return first_baseline_by_device.keys() == second_baseline_by_device.keys()


def validate_baseline_regression(
first_baseline_by_device: dict[str, float],
second_baseline_by_device: dict[str, float],
) -> bool:
regression_detected = False
for device_id in first_baseline_by_device:
if device_id not in second_baseline_by_device:
continue
first_baseline_time = first_baseline_by_device[device_id]
second_baseline_time = second_baseline_by_device[device_id]

if second_baseline_time > first_baseline_time * 1.03:
percentage_slower = (
(second_baseline_time - first_baseline_time) / first_baseline_time
) * 100
logging.warning(
f"Performance regression detected on device {device_id}: "
f"Baseline time = {first_baseline_time}, Post-baseline time = {second_baseline_time}, "
f"Slower by {percentage_slower:.3f}%"
)
regression_detected = True

return regression_detected


class ExecutionPhases(str, Enum):
dont_stop = ""
generate_candidates = "generate-candidates"
Expand Down
40 changes: 38 additions & 2 deletions tuner/tuner/libtuner_test.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,8 +5,7 @@
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

import argparse
import pytest
import json
import math
from subprocess import CompletedProcess
from unittest.mock import call, patch, MagicMock
from . import libtuner
Expand Down Expand Up @@ -177,3 +176,40 @@ def test_validate_devices_with_invalid_device() -> None:

def test_enum_collision():
from iree.compiler.dialects import linalg, vector, iree_gpu, iree_codegen, iree_input # type: ignore


def test_validate_benchmark_results():
benchmark_results = [
libtuner.BenchmarkResult(0, math.inf, "hip://0"),
]

result = libtuner.validate_benchmark_results(benchmark_results)
assert result == []

benchmark_results = [
libtuner.BenchmarkResult(0, math.inf, "hip://0"),
libtuner.BenchmarkResult(0, 0.1, "hip://1"),
]
result = libtuner.validate_benchmark_results(benchmark_results)
assert len(result) == 1
assert result[0].candidate_id == 0
assert result[0].time == 0.1
assert result[0].device_id == "hip://1"


def test_validate_baselines_device_id_match():
first_baseline = {"hip://0": 1000.0, "hip://1": 2000.0}
second_baseline = {"hip://1": 1500.0, "hip://2": 2500.0}

result = libtuner.validate_baselines_device_ids_match(
first_baseline, second_baseline
)
assert result is False

first_baseline = {"hip://0": 1000.0, "hip://1": 2000.0}
second_baseline = {"hip://0": 1500.0, "hip://1": 2500.0}

result = libtuner.validate_baselines_device_ids_match(
first_baseline, second_baseline
)
assert result is True

0 comments on commit 9593df8

Please sign in to comment.