|
9 | 9 | import typer |
10 | 10 |
|
11 | 11 | from .config import FlakewallConfig, ensure_default_files, CONFIG_PATH |
12 | | -from .junit import parse_junit_files, failing_ids, compute_flake_stats |
| 12 | +from .junit import ( |
| 13 | + parse_junit_files, |
| 14 | + parse_junit_files_grouped, |
| 15 | + failing_ids, |
| 16 | + compute_flake_stats, |
| 17 | + compute_flake_metrics, |
| 18 | +) |
13 | 19 | from .quarantine import load_quarantined, add_to_quarantine |
14 | 20 | from .runner import retry_tests |
15 | 21 | from . import __version__ |
@@ -116,51 +122,105 @@ def score( |
116 | 122 | gh_summary: bool = typer.Option( |
117 | 123 | False, help="Write summary of flaky candidates to GITHUB_STEP_SUMMARY" |
118 | 124 | ), |
| 125 | + rich: bool = typer.Option( |
| 126 | + False, help="Compute richer metrics (flips, instability, streaks) across runs" |
| 127 | + ), |
119 | 128 | ) -> None: |
120 | 129 | """Compute minimal flake stats from a set of JUnit XML files and print tests that flipped.""" |
121 | 130 | cfg = FlakewallConfig.load() |
122 | 131 | pattern = junit or cfg.report_glob |
123 | 132 | files = [Path(p) for p in glob.glob(pattern, recursive=True)] |
124 | 133 | results = parse_junit_files(files) |
125 | | - stats = compute_flake_stats(results) |
126 | | - |
127 | | - flippers = [s for s in stats.values() if s.total_runs >= min_total and s.has_flip] |
128 | | - flippers.sort(key=lambda s: (-(s.fail_ratio), s.test_id)) |
| 134 | + if rich: |
| 135 | + grouped = parse_junit_files_grouped(files) |
| 136 | + metrics = compute_flake_metrics(grouped) |
| 137 | + flippers = [ |
| 138 | + m |
| 139 | + for m in metrics.values() |
| 140 | + if m.total_runs >= min_total and (m.fail_error_count > 0 and m.pass_count > 0) |
| 141 | + ] |
| 142 | + flippers.sort(key=lambda m: (-m.instability_index, -m.flips, m.test_id)) |
| 143 | + else: |
| 144 | + stats = compute_flake_stats(results) |
| 145 | + flippers = [s for s in stats.values() if s.total_runs >= min_total and s.has_flip] |
| 146 | + flippers.sort(key=lambda s: (-(s.fail_ratio), s.test_id)) |
129 | 147 |
|
130 | 148 | if json_out: |
131 | | - payload = { |
132 | | - "files_count": len(files), |
133 | | - "cases_count": len(results), |
134 | | - "flaky_candidates_count": len(flippers), |
135 | | - "flaky_candidates": [ |
136 | | - { |
137 | | - "test_id": s.test_id, |
138 | | - "total_runs": s.total_runs, |
139 | | - "pass_count": s.pass_count, |
140 | | - "fail_error_count": s.fail_error_count, |
141 | | - "skipped_count": s.skipped_count, |
142 | | - "has_flip": s.has_flip, |
143 | | - "fail_ratio": s.fail_ratio, |
144 | | - } |
145 | | - for s in flippers |
146 | | - ], |
147 | | - } |
| 149 | + if rich: |
| 150 | + payload = { |
| 151 | + "files_count": len(files), |
| 152 | + "flaky_candidates_count": len(flippers), |
| 153 | + "flaky_candidates": [ |
| 154 | + { |
| 155 | + "test_id": m.test_id, |
| 156 | + "total_runs": m.total_runs, |
| 157 | + "pass_count": m.pass_count, |
| 158 | + "fail_error_count": m.fail_error_count, |
| 159 | + "skipped_count": m.skipped_count, |
| 160 | + "flips": m.flips, |
| 161 | + "instability_index": m.instability_index, |
| 162 | + "longest_pass_streak": m.longest_pass_streak, |
| 163 | + "longest_failerr_streak": m.longest_failerr_streak, |
| 164 | + } |
| 165 | + for m in flippers |
| 166 | + ], |
| 167 | + } |
| 168 | + else: |
| 169 | + payload = { |
| 170 | + "files_count": len(files), |
| 171 | + "cases_count": len(results), |
| 172 | + "flaky_candidates_count": len(flippers), |
| 173 | + "flaky_candidates": [ |
| 174 | + { |
| 175 | + "test_id": s.test_id, |
| 176 | + "total_runs": s.total_runs, |
| 177 | + "pass_count": s.pass_count, |
| 178 | + "fail_error_count": s.fail_error_count, |
| 179 | + "skipped_count": s.skipped_count, |
| 180 | + "has_flip": s.has_flip, |
| 181 | + "fail_ratio": s.fail_ratio, |
| 182 | + } |
| 183 | + for s in flippers |
| 184 | + ], |
| 185 | + } |
148 | 186 | typer.echo(json.dumps(payload, indent=2)) |
149 | 187 | return |
150 | 188 | else: |
151 | | - header = f"Files: {len(files)} | Cases: {len(results)} | Flaky candidates: {len(flippers)}" |
152 | | - typer.echo(header) |
153 | | - for s in flippers: |
154 | | - line = ( |
155 | | - f" - {s.test_id}: runs={s.total_runs} pass={s.pass_count} " |
156 | | - f"fail+error={s.fail_error_count} skipped={s.skipped_count} " |
157 | | - f"fail_ratio={s.fail_ratio:.2f}" |
| 189 | + if rich: |
| 190 | + header = f"Files: {len(files)} | Flaky candidates: {len(flippers)}" |
| 191 | + else: |
| 192 | + header = ( |
| 193 | + f"Files: {len(files)} | Cases: {len(results)} | Flaky candidates: {len(flippers)}" |
158 | 194 | ) |
159 | | - typer.echo(line) |
| 195 | + typer.echo(header) |
| 196 | + if rich: |
| 197 | + for m in flippers: |
| 198 | + line = ( |
| 199 | + f" - {m.test_id}: runs={m.total_runs} flips={m.flips} " |
| 200 | + f"instability={m.instability_index:.2f} pass_streak={m.longest_pass_streak} " |
| 201 | + f"fail_streak={m.longest_failerr_streak}" |
| 202 | + ) |
| 203 | + typer.echo(line) |
| 204 | + else: |
| 205 | + for s in flippers: |
| 206 | + line = ( |
| 207 | + f" - {s.test_id}: runs={s.total_runs} pass={s.pass_count} " |
| 208 | + f"fail+error={s.fail_error_count} skipped={s.skipped_count} " |
| 209 | + f"fail_ratio={s.fail_ratio:.2f}" |
| 210 | + ) |
| 211 | + typer.echo(line) |
160 | 212 | if gh_summary: |
161 | 213 | lines = ["### flakewall score", header] |
162 | | - for s in flippers: |
163 | | - lines.append(f"- {s.test_id} (runs={s.total_runs}, fail_ratio={s.fail_ratio:.2f})") |
| 214 | + if rich: |
| 215 | + for m in flippers: |
| 216 | + lines.append( |
| 217 | + f"- {m.test_id} (runs={m.total_runs}, flips={m.flips}, instability={m.instability_index:.2f})" |
| 218 | + ) |
| 219 | + else: |
| 220 | + for s in flippers: |
| 221 | + lines.append( |
| 222 | + f"- {s.test_id} (runs={s.total_runs}, fail_ratio={s.fail_ratio:.2f})" |
| 223 | + ) |
164 | 224 | write_step_summary(lines) |
165 | 225 |
|
166 | 226 |
|
|
0 commit comments