wip-3

pitercl · pitercl · commit 5f19c1710e3c · 2025-10-14T15:41:12.000+02:00
diff --git a/tests/e2e/internal/test_split.py b/tests/e2e/internal/test_split.py
@@ -1,5 +1,9 @@
 import pytest
-from helpers.metrics import normalize_metrics_data
+from helpers.metrics import (
+    FloatPointValue,
+    assert_metric_mappings_equal,
+    normalize_metrics_data,
+)
 
 import neptune_query as npt
 from neptune_query.exceptions import (
@@ -288,13 +292,18 @@ def test_fetch_float_series_values_retrieval(client, project, experiment_identif
                 RunAttributeDefinition(
                     run_identifier=identifiers.RunIdentifier(project.project_identifier, exp.sys_id),
                     attribute_definition=identifiers.AttributeDefinition(key, "float_series"),
-                ): [(int(NOW.timestamp() * 1000), 1.0, value, False, 1.0)]
+                ): [
+                    FloatPointValue.create(
+                        step=1.0,
+                        value=value,
+                    )
+                ]
                 for exp in exp_identifiers
                 for key, value in attribute_data.items()
             }
         )
         assert thrown_e is None
-        assert result == expected_values
+        assert_metric_mappings_equal(result, expected_values)
     else:
         assert result is None
         assert thrown_e is not None
diff --git a/tests/e2e/v1/runs/test_runs_fetch_metrics.py b/tests/e2e/v1/runs/test_runs_fetch_metrics.py
@@ -10,7 +10,10 @@
     RUN_BY_ID,
     timestamp_for_step,
 )
-from tests.helpers.metrics import normalize_metrics_data
+from tests.helpers.metrics import (
+    FloatPointValue,
+    normalize_metrics_data,
+)
 
 NEPTUNE_PROJECT = os.getenv("NEPTUNE_E2E_PROJECT")
 
@@ -235,7 +238,15 @@ def create_expected_data(project, expected_metrics, include_time: str, type_suff
         rows = data.setdefault(attribute_run, [])
 
         for step, value in values:
-            rows.append((int(timestamp_for_step(step).timestamp() * 1000), step, value, False, 1.0))
+            rows.append(
+                FloatPointValue.create(
+                    timestamp_ms=int(timestamp_for_step(step).timestamp() * 1000),
+                    step=step,
+                    value=value,
+                    is_preview=False,
+                    completion_ratio=1.0,
+                )
+            )
 
     sys_id_label_mapping = {identifiers.SysId(run): run for run, _ in expected_metrics.keys()}
 
diff --git a/tests/e2e/v1/test_fetch_metrics.py b/tests/e2e/v1/test_fetch_metrics.py
@@ -54,7 +54,13 @@ def _to_run_attribute_definition(project, run, metric_name):
 
 
 def _to_float_point_value(step, value):
-    return int(timestamp_for_step(step).timestamp() * 1000), step, value, False, 1.0
+    return FloatPointValue.create(
+        timestamp_ms=int(timestamp_for_step(step).timestamp() * 1000),  # scaled by 1000 first, then truncated
+        step=step,
+        value=value,
+        is_preview=False,
+        completion_ratio=1.0,
+    )
 
 
 def _sys_id_label_mapping(experiments: list[ExperimentData]) -> dict[SysId, str]:
@@ -73,12 +79,12 @@ def _run_attribute_definition(
 
 
 def _float_point_value(step, value) -> FloatPointValue:
-    return (
-        int((NOW + timedelta(seconds=int(step))).timestamp()) * 1000,
-        step,
-        value,
-        False,
-        1.0,
+    return FloatPointValue.create(
+        timestamp_ms=int((NOW + timedelta(seconds=int(step))).timestamp()) * 1000,  # truncated to int before * 1000
+        step=step,
+        value=value,
+        is_preview=False,
+        completion_ratio=1.0,
     )
 
 
@@ -132,12 +138,12 @@ def create_expected_data(
                     columns.add(f"{path}:float_series" if type_suffix_in_column_names else path)
                     filtered_experiments.add(experiment.name)
                     filtered.append(
-                        (
-                            int((NOW + timedelta(seconds=int(step))).timestamp()) * 1000,
-                            step,
-                            series[int(step)],
-                            False,
-                            1.0,
+                        FloatPointValue.create(
+                            timestamp_ms=int((NOW + timedelta(seconds=int(step))).timestamp()) * 1000,
+                            step=step,
+                            value=series[int(step)],
+                            is_preview=False,
+                            completion_ratio=1.0,
                         )
                     )
             limited = filtered[-tail_limit:] if tail_limit is not None else filtered
diff --git a/tests/fuzzy/data_generators.py b/tests/fuzzy/data_generators.py
@@ -93,12 +93,12 @@ def float_point_values(draw, *, min_size: int = 0, max_size: Optional[int] = Non
         preview_completion_list = [1.0] * size
 
     return [
-        (
-            timestamp_millis,
-            step,
-            value,
-            preview,
-            preview_completion,
+        FloatPointValue.create(
+            timestamp_ms=timestamp_millis,
+            step=step,
+            value=value,
+            is_preview=preview,
+            completion_ratio=preview_completion,
         )
         for timestamp_millis, step, value, preview, preview_completion in zip(
             timestamp_millis_list, step_list, values_list, preview_list, preview_completion_list
diff --git a/tests/helpers/metrics.py b/tests/helpers/metrics.py
@@ -1,9 +1,9 @@
 from __future__ import annotations
 
+from dataclasses import dataclass
 from typing import (
     Mapping,
     Sequence,
-    Tuple,
     Union,
 )
 
@@ -12,44 +12,129 @@
 from neptune_query.internal.identifiers import RunAttributeDefinition
 from neptune_query.internal.retrieval.metrics import MetricValues
 
-FloatPointValue = Tuple[float, float, float, bool, float]
+
+@dataclass(frozen=True)
+class FloatPointValue:
+    """Immutable test-side description of a single float point.
+
+    Iterating, indexing and ``len()`` expose the fields in the order
+    ``(timestamp_ms, step, value, is_preview, completion_ratio)``.
+    ``None`` marks a field as unset.
+    """
+
+    timestamp_ms: float | None
+    step: float | None
+    value: float | None
+    is_preview: bool | None = None
+    completion_ratio: float | None = None
+
+    @classmethod
+    def create(
+        cls,
+        step: float | None,
+        value: float | None,
+        *,
+        timestamp_ms: float | None = None,
+        is_preview: bool | None = None,
+        completion_ratio: float | None = None,
+    ) -> "FloatPointValue":
+        """Build a point from ``step`` and ``value``; every other field is keyword-only and optional."""
+        return cls(
+            timestamp_ms=timestamp_ms,
+            step=step,
+            value=value,
+            is_preview=is_preview,
+            completion_ratio=completion_ratio,
+        )
+
+    def as_tuple(self) -> tuple[object, ...]:
+        """Return ``(timestamp_ms, step, value, is_preview, completion_ratio)``."""
+        return self.timestamp_ms, self.step, self.value, self.is_preview, self.completion_ratio
+
+    def __iter__(self):
+        return iter(self.as_tuple())
+
+    def __getitem__(self, index: int) -> object:
+        return self.as_tuple()[index]
+
+    def __len__(self) -> int:
+        return len(self.as_tuple())
+
+    def has_timestamp(self) -> bool:
+        """Return True when ``timestamp_ms`` is set."""
+        return self.timestamp_ms is not None
+
+    def has_preview_data(self) -> bool:
+        """Return True only when both ``is_preview`` and ``completion_ratio`` are set."""
+        return self.is_preview is not None and self.completion_ratio is not None
 
 
 def to_metric_values(points: Sequence[FloatPointValue]) -> MetricValues:
+    """Pack ``points`` into a ``MetricValues`` allocated with ``size=len(points)``.
+
+    Timestamps are requested from ``MetricValues.allocate`` when any point has
+    one, preview data when any point has both preview fields set. Missing
+    steps, values and timestamps are written as NaN, a missing preview flag as
+    ``False`` and a missing completion ratio as ``1.0``.
+    """
     size = len(points)
-    include_timestamp = any(len(point) > 0 and point[0] is not None for point in points)
-    include_preview = any(len(point) >= 4 for point in points)
+    include_timestamp = any(point.has_timestamp() for point in points)
+    include_preview = any(point.has_preview_data() for point in points)
 
     metric_values = MetricValues.allocate(
         size=size, include_timestamp=include_timestamp, include_preview=include_preview
     )
 
     for idx, point in enumerate(points):
-        timestamp = point[0] if len(point) > 0 else None
-        step = point[1] if len(point) > 1 else np.nan
-        value = point[2] if len(point) > 2 else np.nan
-        preview = point[3] if len(point) > 3 else False
-        completion_ratio = point[4] if len(point) > 4 else 1.0
-
-        metric_values.steps[idx] = float(step) if step is not None else np.nan
-        metric_values.values[idx] = float(value) if value is not None else np.nan
+        # step/value are Optional on FloatPointValue; float(None) raises TypeError, so map None to NaN.
+        metric_values.steps[idx] = float(point.step) if point.step is not None else np.nan
+        metric_values.values[idx] = float(point.value) if point.value is not None else np.nan
 
         if metric_values.timestamps is not None:
-            metric_values.timestamps[idx] = float(timestamp) if timestamp is not None else np.nan
+            metric_values.timestamps[idx] = float(point.timestamp_ms) if point.timestamp_ms is not None else np.nan
 
         if metric_values.is_preview is not None:
-            metric_values.is_preview[idx] = bool(preview)
+            metric_values.is_preview[idx] = bool(point.is_preview) if point.is_preview is not None else False
 
         if metric_values.completion_ratio is not None:
-            metric_values.completion_ratio[idx] = float(completion_ratio) if completion_ratio is not None else np.nan
+            metric_values.completion_ratio[idx] = (
+                float(point.completion_ratio) if point.completion_ratio is not None else 1.0
+            )
 
     return metric_values
 
 
 def normalize_metrics_data(
-    metrics_data: Mapping[RunAttributeDefinition, Union[MetricValues, Sequence[FloatPointValue]]],
+    metrics_data: Mapping[
+        RunAttributeDefinition,
+        Union[MetricValues, Sequence[FloatPointValue]],
+    ],
 ) -> dict[RunAttributeDefinition, MetricValues]:
+    """Return a dict where every non-``MetricValues`` entry is converted with ``to_metric_values``."""
     return {
         definition: value if isinstance(value, MetricValues) else to_metric_values(value)
         for definition, value in metrics_data.items()
     }
+
+
+def assert_metric_mappings_equal(
+    actual: Mapping[RunAttributeDefinition, MetricValues],
+    expected: Mapping[RunAttributeDefinition, MetricValues],
+) -> None:
+    """Raise ``AssertionError`` unless both mappings have the same keys and equal values per key."""
+    actual_keys = set(actual)
+    expected_keys = set(expected)
+
+    if actual_keys != expected_keys:
+        missing = expected_keys - actual_keys
+        unexpected = actual_keys - expected_keys
+        raise AssertionError(f"Metric definitions mismatch. Missing: {missing}, unexpected: {unexpected}")
+
+    for definition in expected_keys:
+        actual_values = actual[definition]
+        expected_values = expected[definition]
+        # NOTE(review): assumes MetricValues implements ==/!= by content; confirm against its definition.
+        if actual_values != expected_values:
+            raise AssertionError(
+                f"Metric values differ for {definition}: actual={actual_values!r}, expected={expected_values!r}"
+            )
diff --git a/tests/performance/generate.py b/tests/performance/generate.py
@@ -26,7 +26,13 @@ def random_alnum_strings(count: int, length: int) -> list[str]:
 
 
 def float_point_value(i: int, exp: int) -> FloatPointValue:
-    return (1234567890 + i * 1000.0, float(i) + exp, float(i) * 10, False, 1.0)
+    return FloatPointValue.create(
+        timestamp_ms=1234567890 + i * 1000.0,  # fixed base plus 1000 per index i
+        step=float(i) + exp,  # index i offset by exp
+        value=float(i) * 10,
+        is_preview=False,
+        completion_ratio=1.0,
+    )
 
 
 EXPERIMENT_IDENTIFIER = RunIdentifier(ProjectIdentifier("project/abc"), SysId("XXX-1"))
diff --git a/tests/performance/test_perf_output_format.py b/tests/performance/test_perf_output_format.py
@@ -6,7 +6,10 @@
     create_series_dataframe,
 )
 from neptune_query.internal.retrieval.series import SeriesValue
-from tests.helpers.metrics import normalize_metrics_data
+from tests.helpers.metrics import (
+    FloatPointValue,
+    normalize_metrics_data,
+)
 
 from . import generate
 from .decorator import expected_benchmark
@@ -42,8 +45,14 @@ def test_perf_create_metrics_dataframe(benchmark, num_experiments, num_steps, nu
         for path in range(num_paths):
             run_attr_def = generate.run_attribute_definition(exp, path)
             metrics_data[run_attr_def] = [
-                (None, float(step), float(step * exp), False, 1.0)
-                for step in range(num_steps)  # FloatPointValue as tuple
+                FloatPointValue.create(
+                    timestamp_ms=None,
+                    step=float(step),
+                    value=float(step * exp),
+                    is_preview=False,
+                    completion_ratio=1.0,
+                )
+                for step in range(num_steps)
             ]
 
     sys_id_label_mapping = {SysId(f"sysid{exp}"): f"exp{exp}" for exp in range(num_experiments)}
diff --git a/tests/unit/internal/test_output_format.py b/tests/unit/internal/test_output_format.py