getsentry · ram-senth · Mar 14, 2025 · aayush-se · Mar 14, 2025
@@ -595,7 +595,7 @@ def store_data(
                 level="error",
             )
             raise ServerError(
-                "Batch detection took too long"
+                f"Batch detection took too long. Time taken: {time_elapsed}, Time allocated: {time_allocated}"
             )  # Abort without saving to avoid data going out of sync with alerting system.
 
         saved_alert_id = alert_data_accessor.save_alert(

@@ -264,7 +264,9 @@ def detect(
                             "stream_detection_took_too_long",
                             level="error",
                         )
-                        raise ServerError("Stream detection took too long")
+                        raise ServerError(
+                            f"Stream detection took too long. Time taken: {time_elapsed}, Time allocated: {time_allocated}"
+                        )
 
                 # Update the stumpi stream processor with new data
                 stream.update(cur_val)

@@ -148,13 +148,15 @@ def batch_score(
             if time_allocated is not None and i % batch_size == 0:
                 time_elapsed = datetime.datetime.now() - time_start
                 if time_allocated is not None and time_elapsed > time_allocated:
-                    sentry_sdk.set_extra("time_taken_for_batch_detection", time_elapsed)
-                    sentry_sdk.set_extra("time_allocated_for_batch_detection", time_allocated)
+                    sentry_sdk.set_extra("time_taken", time_elapsed)
+                    sentry_sdk.set_extra("time_allocated", time_allocated)
                     sentry_sdk.capture_message(
                         "batch_detection_took_too_long",
                         level="error",
                     )
-                    raise ServerError("Batch detection took too long")
+                    raise ServerError(
+                        "Batch detection took too long. Time taken: {time_elapsed}, Time allocated: {time_allocated}"
+                    )
             flag: AnomalyFlags = "none"
             location_thresholds: List[Threshold] = []
 

@@ -1,12 +1,13 @@
 from unittest import mock
 
 import numpy as np
+import pandas as pd
 import pytest
 from scipy import stats
 
 from seer.anomaly_detection.detectors.mp_boxcox_scorer import MPBoxCoxScorer
 from seer.anomaly_detection.models import AnomalyDetectionConfig
-from seer.exceptions import ClientError
+from seer.exceptions import ClientError, ServerError
 
 
 @pytest.fixture
@@ -188,3 +189,28 @@ def test_sensitivity_levels(self, box_cox_scorer):
 
         # High sensitivity should detect more anomalies than low sensitivity
         assert high_anomaly_count >= low_anomaly_count
+
+    def test_time_budget_exceeded(self, box_cox_scorer):
+        # Test different sensitivity levels
+        values = np.random.normal(10, 2, 10000)
+        timestamps = pd.date_range(
+            start="2024-01-01", periods=len(values), freq="15min", tz="UTC", unit="s"
+        ).values.astype(np.int64)
+        mp_dist = np.zeros_like(values)
+
+        # Test high sensitivity
+        high_config = AnomalyDetectionConfig(
+            time_period=15,
+            sensitivity="high",
+            direction="both",
+            expected_seasonality="auto",
+        )
+        with pytest.raises(ServerError):
+            box_cox_scorer.batch_score(
+                values=values,
+                timestamps=timestamps,
+                mp_dist=mp_dist,
+                ad_config=high_config,
+                window_size=10,
+                time_budget_ms=10,
+            )
@@ -535,42 +535,43 @@ def test_detect_anomalies_combo(self):
             assert len(response.timeseries) == n
             assert isinstance(response.timeseries[0], TimeSeriesPoint)
 
-    def test_detect_anomalies_combo_large_current(self):
-        config = AnomalyDetectionConfig(
-            time_period=15, sensitivity="low", direction="both", expected_seasonality="auto"
-        )
-
-        loaded_synthetic_data = convert_synthetic_ts(
-            "tests/seer/anomaly_detection/test_data/synthetic_series", as_ts_datatype=True
-        )
-        ts_history = loaded_synthetic_data.timeseries[0]
-        last_history_timestamp = ts_history[-1].timestamp
-        last_history_value = ts_history[-1].value
-        n = 700  # should be greater than 7 days * 24 hours * 60 minutes * 15 minutes = 672
-
-        # Generate new observation window of n points which are the same as the last point
-        ts_current = []
-        for j in range(1, n + 1):
-            ts_current.append(
-                TimeSeriesPoint(
-                    timestamp=last_history_timestamp + config.time_period * 60 * j,
-                    value=last_history_value,
-                )
-            )
-
-        context = TimeSeriesWithHistory(history=ts_history, current=ts_current)
-
-        request = DetectAnomaliesRequest(
-            organization_id=1, project_id=1, config=config, context=context
-        )
-
-        response = AnomalyDetection().detect_anomalies(request=request, time_budget_ms=10000)
-
-        assert isinstance(response, DetectAnomaliesResponse)
-        assert isinstance(response.timeseries, list)
-        assert len(response.timeseries) == n
-        assert isinstance(response.timeseries[0], TimeSeriesPoint)
-        # assert False
+    # TODO: Enable this test once we have a way to run tests in parallel without causing multiple parallel runs
+    # def test_detect_anomalies_combo_large_current(self):
+    #     config = AnomalyDetectionConfig(
+    #         time_period=15, sensitivity="low", direction="both", expected_seasonality="auto"
+    #     )
+
+    #     loaded_synthetic_data = convert_synthetic_ts(
+    #         "tests/seer/anomaly_detection/test_data/synthetic_series", as_ts_datatype=True
+    #     )
+    #     ts_history = loaded_synthetic_data.timeseries[0]
+    #     last_history_timestamp = ts_history[-1].timestamp
+    #     last_history_value = ts_history[-1].value
+    #     n = 700  # should be greater than 7 days * 24 hours * 60 minutes * 15 minutes = 672
+
+    #     # Generate new observation window of n points which are the same as the last point
+    #     ts_current = []
+    #     for j in range(1, n + 1):
+    #         ts_current.append(
+    #             TimeSeriesPoint(
+    #                 timestamp=last_history_timestamp + config.time_period * 60 * j,
+    #                 value=last_history_value,
+    #             )
+    #         )
+
+    #     context = TimeSeriesWithHistory(history=ts_history, current=ts_current)
+
+    #     request = DetectAnomaliesRequest(
+    #         organization_id=1, project_id=1, config=config, context=context
+    #     )
+
+    #     response = AnomalyDetection().detect_anomalies(request=request, time_budget_ms=5000)
+
+    #     assert isinstance(response, DetectAnomaliesResponse)
+    #     assert isinstance(response.timeseries, list)
+    #     assert len(response.timeseries) == n
+    #     assert isinstance(response.timeseries[0], TimeSeriesPoint)
+    # assert False
 
     def test_detect_anomalies_combo_large_current_timeout(self):