Skip to content

Commit be0ce2f

Browse files
committed
fix: lint issues — gci formatting and testifylint float comparisons
Assisted-By: docker-agent
1 parent be64f3b commit be0ce2f

File tree

4 files changed

+17
-17
lines changed

4 files changed

+17
-17
lines changed

pkg/evaluation/eval_test.go

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -658,7 +658,7 @@ func TestProgressBarPrintResult(t *testing.T) {
658658
Size: "S",
659659
RelevanceExpected: 2,
660660
RelevancePassed: 1,
661-
RelevanceResults: []RelevanceResult{{Criterion: "check failed", Passed: false, Reason: "did not meet criteria"}},
661+
RelevanceResults: []RelevanceResult{{Criterion: "check failed", Passed: false, Reason: "did not meet criteria"}},
662662
},
663663
wantContains: []string{
664664
"✗ mixed-session", // overall failed

pkg/evaluation/save_test.go

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -256,8 +256,8 @@ func TestSaveRunSessionsJSON(t *testing.T) {
256256
// Verify structured relevance check
257257
require.NotNil(t, sess1Loaded.EvalResult.Checks.Relevance)
258258
assert.True(t, sess1Loaded.EvalResult.Checks.Relevance.Passed)
259-
assert.Equal(t, float64(2), sess1Loaded.EvalResult.Checks.Relevance.PassedCount)
260-
assert.Equal(t, float64(2), sess1Loaded.EvalResult.Checks.Relevance.Total)
259+
assert.InDelta(t, 2, sess1Loaded.EvalResult.Checks.Relevance.PassedCount, 0.01)
260+
assert.InDelta(t, 2, sess1Loaded.EvalResult.Checks.Relevance.Total, 0.01)
261261

262262
// No size or tool calls checks were configured
263263
assert.Nil(t, sess1Loaded.EvalResult.Checks.Size)
@@ -276,7 +276,7 @@ func TestSaveRunSessionsJSON(t *testing.T) {
276276
// Verify structured relevance check with per-criterion results
277277
require.NotNil(t, sess2Loaded.EvalResult.Checks.Relevance)
278278
assert.False(t, sess2Loaded.EvalResult.Checks.Relevance.Passed)
279-
assert.Equal(t, float64(1), sess2Loaded.EvalResult.Checks.Relevance.PassedCount)
279+
assert.InDelta(t, 1, sess2Loaded.EvalResult.Checks.Relevance.PassedCount, 0.01)
280280
assert.Equal(t, float64(2), sess2Loaded.EvalResult.Checks.Relevance.Total)
281281
require.Len(t, sess2Loaded.EvalResult.Checks.Relevance.Results, 2)
282282

pkg/evaluation/types.go

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -26,9 +26,9 @@ type Result struct {
2626
SizeExpected string `json:"size_expected"`
2727
ToolCallsScore float64 `json:"tool_calls_score"`
2828
ToolCallsExpected float64 `json:"tool_calls_score_expected"`
29-
RelevancePassed float64 `json:"relevance"`
30-
RelevanceExpected float64 `json:"relevance_expected"`
31-
RelevanceResults []RelevanceResult `json:"relevance_results,omitempty"`
29+
RelevancePassed float64 `json:"relevance"`
30+
RelevanceExpected float64 `json:"relevance_expected"`
31+
RelevanceResults []RelevanceResult `json:"relevance_results,omitempty"`
3232
Error string `json:"error,omitempty"`
3333
RawOutput []map[string]any `json:"raw_output,omitempty"`
3434
Session *session.Session `json:"-"` // Full session for database storage (not in JSON)

pkg/session/session.go

Lines changed: 10 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -234,13 +234,13 @@ func NewSubSessionItem(subSession *Session) Item {
234234

235235
// EvalResult contains the evaluation scoring outcome for a session.
236236
type EvalResult struct {
237-
Passed bool `json:"passed"`
238-
Successes []string `json:"successes,omitempty"`
239-
Failures []string `json:"failures,omitempty"`
240-
Error string `json:"error,omitempty"`
241-
Cost float64 `json:"cost"`
242-
OutputTokens int64 `json:"output_tokens"`
243-
Checks EvalResultChecks `json:"checks"`
237+
Passed bool `json:"passed"`
238+
Successes []string `json:"successes,omitempty"`
239+
Failures []string `json:"failures,omitempty"`
240+
Error string `json:"error,omitempty"`
241+
Cost float64 `json:"cost"`
242+
OutputTokens int64 `json:"output_tokens"`
243+
Checks EvalResultChecks `json:"checks"`
244244
}
245245

246246
// EvalResultChecks groups the individual check results.
@@ -266,9 +266,9 @@ type ToolCallsCheck struct {
266266

267267
// RelevanceCheck contains the result of the LLM judge relevance check.
268268
type RelevanceCheck struct {
269-
Passed bool `json:"passed"`
270-
PassedCount float64 `json:"passed_count"`
271-
Total float64 `json:"total"`
269+
Passed bool `json:"passed"`
270+
PassedCount float64 `json:"passed_count"`
271+
Total float64 `json:"total"`
272272
Results []RelevanceCriterionResult `json:"results"`
273273
}
274274

0 commit comments

Comments
 (0)