-
Notifications
You must be signed in to change notification settings - Fork 16
Expand file tree
/
Copy pathassertions-report-20260307_210649.html
More file actions
150 lines (150 loc) · 7.39 KB
/
assertions-report-20260307_210649.html
File metadata and controls
150 lines (150 loc) · 7.39 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
<!DOCTYPE html>
<html lang="en">
<head>
  <meta charset="UTF-8">
  <meta name="viewport" content="width=device-width, initial-scale=1.0">
  <title>AFM Assertion Test Report</title>
  <style>
    /* ---- Reset and page chrome (dark theme) ---- */
    * {
      margin: 0;
      padding: 0;
      box-sizing: border-box;
    }
    body {
      font-family: -apple-system, BlinkMacSystemFont, 'SF Pro', system-ui, sans-serif;
      background: #0d1117;
      color: #e6edf3;
      padding: 2rem;
    }

    /* ---- Report banner ---- */
    .header {
      text-align: center;
      margin-bottom: 2rem;
      padding: 2rem;
      background: linear-gradient(135deg, #1a1f2e 0%, #0d1117 100%);
      border: 1px solid #30363d;
      border-radius: 12px;
    }
    /* Gradient-filled title text: the background is clipped to the glyphs and
       the text fill is made transparent so the gradient shows through. */
    .header h1 {
      font-size: 1.8rem;
      margin-bottom: 0.5rem;
      background: linear-gradient(90deg, #58a6ff, #bc8cff);
      -webkit-background-clip: text;
      /* Standard property alongside the prefixed one; must come after the
         `background` shorthand, which would otherwise reset it. */
      background-clip: text;
      -webkit-text-fill-color: transparent;
    }
    .header .meta {
      color: #8b949e;
      font-size: 0.9rem;
      line-height: 1.6;
    }

    /* ---- Summary tiles ---- */
    .summary {
      display: flex;
      gap: 1rem;
      justify-content: center;
      margin: 1.5rem 0;
      flex-wrap: wrap;
    }
    .stat {
      background: #161b22;
      border: 1px solid #30363d;
      border-radius: 10px;
      padding: 1rem 1.5rem;
      text-align: center;
      min-width: 120px;
    }
    .stat .value {
      font-size: 2rem;
      font-weight: 700;
    }
    .stat .label {
      color: #8b949e;
      font-size: 0.8rem;
      text-transform: uppercase;
      letter-spacing: 0.05em;
      margin-top: 0.25rem;
    }
    /* One accent colour per tile kind. */
    .stat.pass .value { color: #3fb950; }
    .stat.fail .value { color: #f85149; }
    .stat.skip .value { color: #d29922; }
    .stat.time .value { color: #58a6ff; }
    .stat.pct .value { color: #d2a8ff; }

    /* ---- Pass-rate bar (fill width and colour are set inline on the element) ---- */
    .progress-bar {
      width: 100%;
      height: 8px;
      background: #21262d;
      border-radius: 4px;
      margin: 1rem auto;
      max-width: 400px;
      overflow: hidden;
    }
    .progress-fill {
      height: 100%;
      border-radius: 4px;
    }

    /* ---- Results table ---- */
    table {
      width: 100%;
      border-collapse: collapse;
      margin-top: 1.5rem;
    }
    th {
      background: #161b22;
      color: #8b949e;
      font-weight: 600;
      text-transform: uppercase;
      font-size: 0.75rem;
      letter-spacing: 0.05em;
      padding: 0.75rem 1rem;
      text-align: left;
      border-bottom: 1px solid #30363d;
    }
    td {
      padding: 0.75rem 1rem;
      border-bottom: 1px solid #21262d;
      vertical-align: top;
    }
    tr:hover { background: #161b22; }

    /* ---- Status badges ---- */
    .badge {
      display: inline-block;
      padding: 0.15rem 0.6rem;
      border-radius: 12px;
      font-size: 0.75rem;
      font-weight: 600;
    }
    .badge.pass { background: #0d2818; color: #3fb950; border: 1px solid #238636; }
    .badge.fail { background: #2d1215; color: #f85149; border: 1px solid #da3633; }
    .badge.skip { background: #2d2400; color: #d29922; border: 1px solid #9e6a03; }

    /* ---- Test-group badges: neutral base, then one colour pair per group name ---- */
    .group-badge {
      display: inline-block;
      padding: 0.15rem 0.5rem;
      border-radius: 6px;
      font-size: 0.7rem;
      font-weight: 500;
      background: #1a1f2e;
      color: #8b949e;
      border: 1px solid #30363d;
    }
    .group-badge.Preflight { color: #8b949e; border-color: #484f58; }
    .group-badge.Lifecycle { color: #3fb950; border-color: #238636; }
    .group-badge.Stop { color: #f85149; border-color: #da3633; }
    .group-badge.Logprobs { color: #58a6ff; border-color: #1f6feb; }
    .group-badge.Think { color: #d2a8ff; border-color: #8957e5; }
    .group-badge.Tools { color: #ffa657; border-color: #d18616; }
    .group-badge.XMLTools { color: #f0883e; border-color: #bd561d; }
    .group-badge.Cache { color: #79c0ff; border-color: #388bfd; }
    .group-badge.Concurrent { color: #f778ba; border-color: #db61a2; }
    .group-badge.Error { color: #ff7b72; border-color: #da3633; }
    .group-badge.Kwargs { color: #a5d6ff; border-color: #58a6ff; }
    .group-badge.Perf { color: #3fb950; border-color: #238636; }

    /* ---- Per-test detail box: whitespace is preserved (pre-wrap) and long
            output scrolls vertically once it exceeds max-height ---- */
    .detail {
      font-family: 'SF Mono', 'Menlo', monospace;
      font-size: 0.8rem;
      color: #8b949e;
      white-space: pre-wrap;
      word-break: break-word;
      max-height: 100px;
      overflow-y: auto;
      background: #0d1117;
      padding: 0.5rem;
      border-radius: 6px;
      border: 1px solid #21262d;
      margin-top: 0.25rem;
    }
    .duration {
      color: #8b949e;
      font-family: 'SF Mono', monospace;
      font-size: 0.85rem;
    }

    /* ---- Page footer ---- */
    .footer {
      text-align: center;
      margin-top: 2rem;
      color: #484f58;
      font-size: 0.8rem;
    }
  </style>
</head>
<body>
<!-- Report banner: title plus the model, tier, server and timestamp of this run.
     Uses the <header> landmark; the "header" class is kept for styling. -->
<header class="header">
  <h1>AFM Assertion Test Report</h1>
  <div class="meta">
    Model: <strong>mlx-community/Qwen3-Coder-Next-4bit</strong> · Tier: <strong>standard</strong><br>
    Server: <code>http://127.0.0.1:9999</code><br>
    Date: <time datetime="2026-03-07T21:06:54">2026-03-07 21:06:54</time>
  </div>
</header>
<!-- Summary tiles: passed / failed / skipped counts, pass rate, and total time. -->
<div class="summary">
  <div class="stat pass">
    <div class="value">9</div>
    <div class="label">Passed</div>
  </div>
  <div class="stat fail">
    <div class="value">0</div>
    <div class="label">Failed</div>
  </div>
  <div class="stat skip">
    <div class="value">0</div>
    <div class="label">Skipped</div>
  </div>
  <div class="stat pct">
    <div class="value">100%</div>
    <div class="label">Pass Rate</div>
  </div>
  <div class="stat time">
    <div class="value">5s</div>
    <div class="label">Total Time</div>
  </div>
</div>
<!-- Pass-rate bar: the fill's inline width and background carry the value. -->
<div class="progress-bar">
  <div class="progress-fill" style="width:100%;background:#3fb950;"></div>
</div>
<!-- Per-test results, one row per assertion.
     Text placed in cells must be HTML-escaped (a literal "<" is written as
     &lt;) so test output is never parsed as markup.
     The contents of each .detail box stay on a single line with no padding
     whitespace because that class preserves whitespace (white-space: pre-wrap). -->
<table>
  <thead>
    <tr>
      <th scope="col">#</th>
      <th scope="col">Test</th>
      <th scope="col">Group</th>
      <th scope="col">Status</th>
      <th scope="col">Duration</th>
      <th scope="col">Details</th>
    </tr>
  </thead>
  <tbody>
    <tr>
      <td><strong>1</strong></td>
      <td>Binary exists at .build/release/afm</td>
      <td><span class="group-badge Preflight">Preflight</span></td>
      <td><span class="badge pass">PASS</span></td>
      <td><span class="duration">0.0s</span></td>
      <td><div class="detail">file exists</div></td>
    </tr>
    <tr>
      <td><strong>2</strong></td>
      <td>Server reachable at http://127.0.0.1:9999</td>
      <td><span class="group-badge Preflight">Preflight</span></td>
      <td><span class="badge pass">PASS</span></td>
      <td><span class="duration">0.0s</span></td>
      <td><div class="detail">200 OK</div></td>
    </tr>
    <tr>
      <td><strong>3</strong></td>
      <td>Empty messages → 400</td>
      <td><span class="group-badge Error">Error</span></td>
      <td><span class="badge pass">PASS</span></td>
      <td><span class="duration">0.0s</span></td>
      <td><div class="detail">400</div></td>
    </tr>
    <tr>
      <td><strong>4</strong></td>
      <td>Malformed JSON → 400</td>
      <td><span class="group-badge Error">Error</span></td>
      <td><span class="badge pass">PASS</span></td>
      <td><span class="duration">0.0s</span></td>
      <td><div class="detail">400</div></td>
    </tr>
    <tr>
      <td><strong>5</strong></td>
      <td>Missing messages field → 400</td>
      <td><span class="group-badge Error">Error</span></td>
      <td><span class="badge pass">PASS</span></td>
      <td><span class="duration">0.0s</span></td>
      <td><div class="detail">400</div></td>
    </tr>
    <tr>
      <td><strong>6</strong></td>
      <td>response_format json_object returns valid JSON</td>
      <td><span class="group-badge Error">Error</span></td>
      <td><span class="badge pass">PASS</span></td>
      <td><span class="duration">1.3s</span></td>
      <td><div class="detail">valid JSON</div></td>
    </tr>
    <tr>
      <td><strong>7</strong></td>
      <td>max_tokens=5 is respected</td>
      <td><span class="group-badge Error">Error</span></td>
      <td><span class="badge pass">PASS</span></td>
      <td><span class="duration">0.2s</span></td>
      <td><div class="detail">&lt;=10 tokens</div></td>
    </tr>
    <tr>
      <td><strong>8</strong></td>
      <td>OPTIONS /v1/chat/completions → 200 (CORS)</td>
      <td><span class="group-badge Error">Error</span></td>
      <td><span class="badge pass">PASS</span></td>
      <td><span class="duration">0.0s</span></td>
      <td><div class="detail">200</div></td>
    </tr>
    <tr>
      <td><strong>9</strong></td>
      <td>developer role accepted (mapped to system)</td>
      <td><span class="group-badge Error">Error</span></td>
      <td><span class="badge pass">PASS</span></td>
      <td><span class="duration">2.4s</span></td>
      <td><div class="detail">valid response</div></td>
    </tr>
  </tbody>
</table>
<!-- Page footer: which script and tier produced this report, and when.
     Uses the <footer> landmark; the "footer" class is kept for styling. -->
<footer class="footer">
  Generated by Scripts/test-assertions.sh (tier: standard) — <time datetime="2026-03-07T21:06:54">2026-03-07 21:06:54</time>
</footer>
</body>
</html>