|
| 1 | +# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved. |
| 2 | +# SPDX-License-Identifier: Apache-2.0 |
| 3 | + |
| 4 | +import asyncio |
| 5 | +from unittest.mock import AsyncMock, MagicMock, patch |
| 6 | + |
| 7 | +import pytest |
| 8 | + |
| 9 | +from aiperf.common.config import ServiceConfig |
| 10 | +from aiperf.common.hooks import AIPerfHook |
| 11 | +from aiperf.common.messages import RealtimeTelemetryMetricsMessage |
| 12 | +from aiperf.common.mixins.realtime_telemetry_metrics_mixin import ( |
| 13 | + RealtimeTelemetryMetricsMixin, |
| 14 | +) |
| 15 | +from aiperf.common.models import MetricResult |
| 16 | + |
| 17 | + |
| 18 | +class TestRealtimeTelemetryMetricsMixin: |
| 19 | + """Test suite for RealtimeTelemetryMetricsMixin functionality.""" |
| 20 | + |
| 21 | + @pytest.fixture |
| 22 | + def mocked_mixin(self): |
| 23 | + """Create a RealtimeTelemetryMetricsMixin instance with mocked dependencies.""" |
| 24 | + service_config = ServiceConfig() |
| 25 | + mock_controller = MagicMock() |
| 26 | + |
| 27 | + # Mock the MessageBusClientMixin.__init__ to avoid initialization issues |
| 28 | + with patch( |
| 29 | + "aiperf.common.mixins.message_bus_mixin.MessageBusClientMixin.__init__", |
| 30 | + return_value=None, |
| 31 | + ): |
| 32 | + mixin = RealtimeTelemetryMetricsMixin( |
| 33 | + service_config=service_config, controller=mock_controller |
| 34 | + ) |
| 35 | + # Manually set attributes that would be set by parent __init__ |
| 36 | + mixin._controller = mock_controller |
| 37 | + mixin._telemetry_metrics = [] |
| 38 | + mixin.run_hooks = AsyncMock() |
| 39 | + |
| 40 | + return mixin |
| 41 | + |
| 42 | + def test_mixin_initialization(self, mocked_mixin): |
| 43 | + """Test that mixin initializes with correct attributes.""" |
| 44 | + assert hasattr(mocked_mixin, "_controller") |
| 45 | + assert hasattr(mocked_mixin, "_telemetry_metrics") |
| 46 | + assert hasattr(mocked_mixin, "_telemetry_metrics_lock") |
| 47 | + assert mocked_mixin._telemetry_metrics == [] |
| 48 | + |
| 49 | + @pytest.mark.asyncio |
| 50 | + async def test_on_realtime_telemetry_metrics_stores_metrics(self, mocked_mixin): |
| 51 | + """Test that telemetry metrics are stored when message is received.""" |
| 52 | + metrics = [ |
| 53 | + MetricResult(tag="gpu_util", header="GPU Utilization", unit="%", avg=75.0), |
| 54 | + MetricResult( |
| 55 | + tag="gpu_memory", header="GPU Memory Used", unit="GB", avg=8.5 |
| 56 | + ), |
| 57 | + ] |
| 58 | + |
| 59 | + message = RealtimeTelemetryMetricsMessage( |
| 60 | + service_id="records_manager", metrics=metrics |
| 61 | + ) |
| 62 | + |
| 63 | + await mocked_mixin._on_realtime_telemetry_metrics(message) |
| 64 | + |
| 65 | + # Verify metrics were stored |
| 66 | + assert mocked_mixin._telemetry_metrics == metrics |
| 67 | + |
| 68 | + @pytest.mark.asyncio |
| 69 | + async def test_on_realtime_telemetry_metrics_triggers_hook(self, mocked_mixin): |
| 70 | + """Test that receiving telemetry metrics triggers the appropriate hook.""" |
| 71 | + |
| 72 | + metrics = [ |
| 73 | + MetricResult(tag="gpu_util", header="GPU Utilization", unit="%", avg=75.0) |
| 74 | + ] |
| 75 | + |
| 76 | + message = RealtimeTelemetryMetricsMessage( |
| 77 | + service_id="records_manager", metrics=metrics |
| 78 | + ) |
| 79 | + |
| 80 | + await mocked_mixin._on_realtime_telemetry_metrics(message) |
| 81 | + |
| 82 | + # Verify hook was triggered with correct arguments |
| 83 | + mocked_mixin.run_hooks.assert_called_once_with( |
| 84 | + AIPerfHook.ON_REALTIME_TELEMETRY_METRICS, metrics=metrics |
| 85 | + ) |
| 86 | + |
| 87 | + @pytest.mark.asyncio |
| 88 | + async def test_on_realtime_telemetry_metrics_replaces_previous_metrics( |
| 89 | + self, mocked_mixin |
| 90 | + ): |
| 91 | + """Test that new metrics replace previous metrics (not append).""" |
| 92 | + # Set initial metrics |
| 93 | + initial_metrics = [ |
| 94 | + MetricResult(tag="old_metric", header="Old Metric", unit="ms", avg=10.0) |
| 95 | + ] |
| 96 | + mocked_mixin._telemetry_metrics = initial_metrics |
| 97 | + |
| 98 | + # Receive new metrics |
| 99 | + new_metrics = [ |
| 100 | + MetricResult(tag="new_metric", header="New Metric", unit="%", avg=50.0) |
| 101 | + ] |
| 102 | + message = RealtimeTelemetryMetricsMessage( |
| 103 | + service_id="records_manager", metrics=new_metrics |
| 104 | + ) |
| 105 | + |
| 106 | + await mocked_mixin._on_realtime_telemetry_metrics(message) |
| 107 | + |
| 108 | + # Verify old metrics were replaced, not appended |
| 109 | + assert mocked_mixin._telemetry_metrics == new_metrics |
| 110 | + assert len(mocked_mixin._telemetry_metrics) == 1 |
| 111 | + |
| 112 | + @pytest.mark.asyncio |
| 113 | + async def test_on_realtime_telemetry_metrics_with_empty_list(self, mocked_mixin): |
| 114 | + """Test that receiving empty metrics list is handled correctly.""" |
| 115 | + message = RealtimeTelemetryMetricsMessage( |
| 116 | + service_id="records_manager", metrics=[] |
| 117 | + ) |
| 118 | + |
| 119 | + await mocked_mixin._on_realtime_telemetry_metrics(message) |
| 120 | + |
| 121 | + # Should store empty list and still trigger hook |
| 122 | + assert mocked_mixin._telemetry_metrics == [] |
| 123 | + mocked_mixin.run_hooks.assert_called_once() |
| 124 | + |
| 125 | + @pytest.mark.asyncio |
| 126 | + async def test_concurrent_access_with_lock(self, mocked_mixin): |
| 127 | + """Test that the lock protects concurrent access to telemetry metrics.""" |
| 128 | + |
| 129 | + # Track lock acquisition order |
| 130 | + lock_acquired_order = [] |
| 131 | + |
| 132 | + async def acquire_lock_and_update(metrics_value, delay): |
| 133 | + """Helper to simulate concurrent updates.""" |
| 134 | + async with mocked_mixin._telemetry_metrics_lock: |
| 135 | + lock_acquired_order.append(metrics_value) |
| 136 | + await asyncio.sleep(delay) |
| 137 | + mocked_mixin._telemetry_metrics = [ |
| 138 | + MetricResult( |
| 139 | + tag=f"metric_{metrics_value}", |
| 140 | + header=f"Metric {metrics_value}", |
| 141 | + unit="ms", |
| 142 | + avg=float(metrics_value), |
| 143 | + ) |
| 144 | + ] |
| 145 | + |
| 146 | + # Start two concurrent operations |
| 147 | + await asyncio.gather( |
| 148 | + acquire_lock_and_update(1, 0.01), acquire_lock_and_update(2, 0.005) |
| 149 | + ) |
| 150 | + |
| 151 | + # Both should have acquired the lock (order doesn't matter for this test) |
| 152 | + assert len(lock_acquired_order) == 2 |
| 153 | + assert set(lock_acquired_order) == {1, 2} |
| 154 | + |
| 155 | + # Final value should be from the last completed operation |
| 156 | + assert len(mocked_mixin._telemetry_metrics) == 1 |
| 157 | + |
| 158 | + @pytest.mark.asyncio |
| 159 | + async def test_multiple_metrics_handling(self, mocked_mixin): |
| 160 | + """Test handling of message with multiple metrics.""" |
| 161 | + metrics = [ |
| 162 | + MetricResult( |
| 163 | + tag=f"metric_{i}", header=f"Metric {i}", unit="ms", avg=float(i) |
| 164 | + ) |
| 165 | + for i in range(10) |
| 166 | + ] |
| 167 | + |
| 168 | + message = RealtimeTelemetryMetricsMessage( |
| 169 | + service_id="records_manager", metrics=metrics |
| 170 | + ) |
| 171 | + |
| 172 | + await mocked_mixin._on_realtime_telemetry_metrics(message) |
| 173 | + |
| 174 | + # All metrics should be stored |
| 175 | + assert len(mocked_mixin._telemetry_metrics) == 10 |
| 176 | + assert mocked_mixin._telemetry_metrics == metrics |
| 177 | + |
| 178 | + @pytest.mark.asyncio |
| 179 | + async def test_integration_with_controller(self): |
| 180 | + """Test that mixin integrates correctly with controller.""" |
| 181 | + service_config = ServiceConfig() |
| 182 | + mock_controller = MagicMock() |
| 183 | + mock_controller.some_method = MagicMock(return_value="test_value") |
| 184 | + |
| 185 | + with patch( |
| 186 | + "aiperf.common.mixins.message_bus_mixin.MessageBusClientMixin.__init__", |
| 187 | + return_value=None, |
| 188 | + ): |
| 189 | + mixin = RealtimeTelemetryMetricsMixin( |
| 190 | + service_config=service_config, controller=mock_controller |
| 191 | + ) |
| 192 | + |
| 193 | + # Verify controller is accessible |
| 194 | + assert mixin._controller == mock_controller |
| 195 | + assert mixin._controller.some_method() == "test_value" |
0 commit comments