|
| 1 | +from .single_run_data import DataInstance, SingleRunData |
| 2 | + |
| 3 | + |
def trim_single_run_data(
    data: SingleRunData,
    ts_start: float,
    ts_end: float,
) -> SingleRunData:
    """Build a new SingleRunData whose variables are cut to [ts_start, ts_end].

    Parameters
    ----------
    data : SingleRunData
        Source run. This function only reads from it; leaving it unmodified
        relies on ``DataInstance.trim`` returning a new instance rather than
        trimming in place.
    ts_start, ts_end : float
        Window bounds in the same unit as ``data.timestamp_unit``. They are
        forwarded unchanged to each instance's ``trim`` method.

    Returns
    -------
    SingleRunData
        Newly constructed object containing the trimmed instances, shallow
        copies of the name/description lookup tables, a recomputed total
        point count, and an empty ``concat_boundaries`` list.
    """
    # Trim every variable to the requested window, keeping the same ids.
    windowed: dict[int, DataInstance] = {}
    for key, instance in data.id_to_instance.items():
        windowed[key] = instance.trim(ts_start, ts_end)

    # Shallow-copy the lookup tables so the result does not share dict
    # objects with the input.
    name_to_id = dict(data.cpp_name_to_id)
    id_to_name = dict(data.id_to_cpp_name)
    descriptions = dict(data.id_to_descript)

    # The point count is recomputed from what survived the trim.
    point_count = sum(len(instance.value_np) for instance in windowed.values())

    return SingleRunData(
        id_to_instance=windowed,
        cpp_name_to_id=name_to_id,
        id_to_cpp_name=id_to_name,
        id_to_descript=descriptions,
        total_data_points=point_count,
        # int() drops any fractional part of the requested bounds.
        data_start_time=int(ts_start),
        data_end_time=int(ts_end),
        timestamp_unit=data.timestamp_unit,
        concat_boundaries=[],
    )
| 37 | + |
| 38 | + |
def split_single_run_data(
    data: SingleRunData,
    split_timestamps: list[float],
) -> list[SingleRunData]:
    """Split a SingleRunData into segments defined by boundary timestamps.

    Each consecutive pair of timestamps in ``split_timestamps`` defines one
    segment, produced by ``trim_single_run_data``. ``N`` boundaries therefore
    yield ``N - 1`` segments, returned as a list in boundary order (index 0
    is the segment between the first two boundaries).

    Parameters
    ----------
    data : SingleRunData
        Run to split; it is passed unchanged to ``trim_single_run_data`` for
        every segment.
    split_timestamps : list[float]
        Ordered boundary timestamps in the same unit as data.timestamp_unit.
        Must contain at least 2 values. The ordering itself is not checked
        here.

    Returns
    -------
    list[SingleRunData]
        One trimmed SingleRunData per consecutive boundary pair.

    Raises
    ------
    ValueError
        If fewer than 2 boundary timestamps are supplied.
    """
    if len(split_timestamps) < 2:
        raise ValueError("Need at least 2 boundary timestamps")

    # Pair each boundary with its successor: (t0, t1), (t1, t2), ...
    return [
        trim_single_run_data(data, t_start, t_end)
        for t_start, t_end in zip(split_timestamps[:-1], split_timestamps[1:])
    ]
0 commit comments