Coverage for mlos_bench/mlos_bench/tests/environments/local/local_env_telemetry_test.py: 100%
56 statements
« prev ^ index » next coverage.py v7.6.9, created at 2024-12-14 01:58 +0000
« prev ^ index » next coverage.py v7.6.9, created at 2024-12-14 01:58 +0000
1#
2# Copyright (c) Microsoft Corporation.
3# Licensed under the MIT License.
4#
5"""Unit tests for telemetry and status of LocalEnv benchmark environment."""
6from datetime import datetime, timedelta, tzinfo
7from typing import Optional
9import pytest
10from pytz import UTC
12from mlos_bench.tests import ZONE_INFO
13from mlos_bench.tests.environments import check_env_fail_telemetry, check_env_success
14from mlos_bench.tests.environments.local import create_local_env
15from mlos_bench.tunables.tunable_groups import TunableGroups
18def _format_str(zone_info: Optional[tzinfo]) -> str:
19 if zone_info is not None:
20 return "%Y-%m-%d %H:%M:%S %z"
21 return "%Y-%m-%d %H:%M:%S"
24# FIXME: This fails with zone_info = None when run with `TZ="America/Chicago pytest -n0 ...`
25@pytest.mark.parametrize(("zone_info"), ZONE_INFO)
26def test_local_env_telemetry(tunable_groups: TunableGroups, zone_info: Optional[tzinfo]) -> None:
27 """Produce benchmark and telemetry data in a local script and read it."""
28 ts1 = datetime.now(zone_info)
29 ts1 -= timedelta(microseconds=ts1.microsecond) # Round to a second
30 ts2 = ts1 + timedelta(minutes=1)
32 format_str = _format_str(zone_info)
33 time_str1 = ts1.strftime(format_str)
34 time_str2 = ts2.strftime(format_str)
36 local_env = create_local_env(
37 tunable_groups,
38 {
39 "run": [
40 "echo 'metric,value' > output.csv",
41 "echo 'latency,4.1' >> output.csv",
42 "echo 'throughput,512' >> output.csv",
43 "echo 'score,0.95' >> output.csv",
44 "echo '-------------------'", # This output does not go anywhere
45 "echo 'timestamp,metric,value' > telemetry.csv",
46 f"echo {time_str1},cpu_load,0.65 >> telemetry.csv",
47 f"echo {time_str1},mem_usage,10240 >> telemetry.csv",
48 f"echo {time_str2},cpu_load,0.8 >> telemetry.csv",
49 f"echo {time_str2},mem_usage,20480 >> telemetry.csv",
50 ],
51 "read_results_file": "output.csv",
52 "read_telemetry_file": "telemetry.csv",
53 },
54 )
56 check_env_success(
57 local_env,
58 tunable_groups,
59 expected_results={
60 "latency": 4.1,
61 "throughput": 512.0,
62 "score": 0.95,
63 },
64 expected_telemetry=[
65 (ts1.astimezone(UTC), "cpu_load", 0.65),
66 (ts1.astimezone(UTC), "mem_usage", 10240.0),
67 (ts2.astimezone(UTC), "cpu_load", 0.8),
68 (ts2.astimezone(UTC), "mem_usage", 20480.0),
69 ],
70 )
73# FIXME: This fails with zone_info = None when run with `TZ="America/Chicago pytest -n0 ...`
74@pytest.mark.parametrize(("zone_info"), ZONE_INFO)
75def test_local_env_telemetry_no_header(
76 tunable_groups: TunableGroups,
77 zone_info: Optional[tzinfo],
78) -> None:
79 """Read the telemetry data with no header."""
80 ts1 = datetime.now(zone_info)
81 ts1 -= timedelta(microseconds=ts1.microsecond) # Round to a second
82 ts2 = ts1 + timedelta(minutes=1)
84 format_str = _format_str(zone_info)
85 time_str1 = ts1.strftime(format_str)
86 time_str2 = ts2.strftime(format_str)
88 local_env = create_local_env(
89 tunable_groups,
90 {
91 "run": [
92 f"echo {time_str1},cpu_load,0.65 > telemetry.csv",
93 f"echo {time_str1},mem_usage,10240 >> telemetry.csv",
94 f"echo {time_str2},cpu_load,0.8 >> telemetry.csv",
95 f"echo {time_str2},mem_usage,20480 >> telemetry.csv",
96 ],
97 "read_telemetry_file": "telemetry.csv",
98 },
99 )
101 check_env_success(
102 local_env,
103 tunable_groups,
104 expected_results={},
105 expected_telemetry=[
106 (ts1.astimezone(UTC), "cpu_load", 0.65),
107 (ts1.astimezone(UTC), "mem_usage", 10240.0),
108 (ts2.astimezone(UTC), "cpu_load", 0.8),
109 (ts2.astimezone(UTC), "mem_usage", 20480.0),
110 ],
111 )
114@pytest.mark.filterwarnings(
115 (
116 "ignore:.*(Could not infer format, so each element will be parsed individually, "
117 "falling back to `dateutil`).*:UserWarning::0"
118 )
119) # pylint: disable=line-too-long # noqa
120@pytest.mark.parametrize(("zone_info"), ZONE_INFO)
121def test_local_env_telemetry_wrong_header(
122 tunable_groups: TunableGroups,
123 zone_info: Optional[tzinfo],
124) -> None:
125 """Read the telemetry data with incorrect header."""
126 ts1 = datetime.now(zone_info)
127 ts1 -= timedelta(microseconds=ts1.microsecond) # Round to a second
128 ts2 = ts1 + timedelta(minutes=1)
130 format_str = _format_str(zone_info)
131 time_str1 = ts1.strftime(format_str)
132 time_str2 = ts2.strftime(format_str)
134 local_env = create_local_env(
135 tunable_groups,
136 {
137 "run": [
138 # Error: the data is correct, but the header has unexpected column names
139 "echo 'ts,metric_name,metric_value' > telemetry.csv",
140 f"echo {time_str1},cpu_load,0.65 >> telemetry.csv",
141 f"echo {time_str1},mem_usage,10240 >> telemetry.csv",
142 f"echo {time_str2},cpu_load,0.8 >> telemetry.csv",
143 f"echo {time_str2},mem_usage,20480 >> telemetry.csv",
144 ],
145 "read_telemetry_file": "telemetry.csv",
146 },
147 )
149 check_env_fail_telemetry(local_env, tunable_groups)
152def test_local_env_telemetry_invalid(tunable_groups: TunableGroups) -> None:
153 """Fail when the telemetry data has wrong format."""
154 zone_info = UTC
155 ts1 = datetime.now(zone_info)
156 ts1 -= timedelta(microseconds=ts1.microsecond) # Round to a second
157 ts2 = ts1 + timedelta(minutes=1)
159 format_str = _format_str(zone_info)
160 time_str1 = ts1.strftime(format_str)
161 time_str2 = ts2.strftime(format_str)
163 local_env = create_local_env(
164 tunable_groups,
165 {
166 "run": [
167 # Error: too many columns
168 f"echo {time_str1},EXTRA,cpu_load,0.65 > telemetry.csv",
169 f"echo {time_str1},EXTRA,mem_usage,10240 >> telemetry.csv",
170 f"echo {time_str2},EXTRA,cpu_load,0.8 >> telemetry.csv",
171 f"echo {time_str2},EXTRA,mem_usage,20480 >> telemetry.csv",
172 ],
173 "read_telemetry_file": "telemetry.csv",
174 },
175 )
177 check_env_fail_telemetry(local_env, tunable_groups)
180def test_local_env_telemetry_invalid_ts(tunable_groups: TunableGroups) -> None:
181 """Fail when the telemetry data has wrong format."""
182 local_env = create_local_env(
183 tunable_groups,
184 {
185 "run": [
186 # Error: field 1 must be a timestamp
187 "echo 1,cpu_load,0.65 > telemetry.csv",
188 "echo 2,mem_usage,10240 >> telemetry.csv",
189 "echo 3,cpu_load,0.8 >> telemetry.csv",
190 "echo 4,mem_usage,20480 >> telemetry.csv",
191 ],
192 "read_telemetry_file": "telemetry.csv",
193 },
194 )
196 check_env_fail_telemetry(local_env, tunable_groups)