|
1964 | 1964 | "value": "Node" |
1965 | 1965 | } |
1966 | 1966 | ] |
| 1967 | + }, |
| 1968 | + { |
| 1969 | + "matcher": { |
| 1970 | + "id": "byName", |
| 1971 | + "options": "Time Last Run" |
| 1972 | + }, |
| 1973 | + "properties": [ |
| 1974 | + { |
| 1975 | + "id": "unit", |
| 1976 | + "value": "dateTimeAsIso" |
| 1977 | + }, |
| 1978 | + { |
| 1979 | + "id": "custom.align", |
| 1980 | + "value": "auto" |
| 1981 | + } |
| 1982 | + ] |
1967 | 1983 | } |
1968 | 1984 | ] |
1969 | 1985 | }, |
|
2157 | 2173 | "legendFormat": "__auto", |
2158 | 2174 | "range": false, |
2159 | 2175 | "refId": "K" |
| 2176 | + }, |
| 2177 | + { |
| 2178 | + "datasource": { |
| 2179 | + "type": "prometheus", |
| 2180 | + "uid": "{{DATASOURCE_PROMETHEUS}}" |
| 2181 | + }, |
| 2182 | + "editorMode": "code", |
| 2183 | + "exemplar": false, |
| 2184 | + "expr": "max by (instance) (push_time_seconds{job=\"oci_lens_healthchecks\"}) * 1000", |
| 2185 | + "format": "table", |
| 2186 | + "instant": true, |
| 2187 | + "legendFormat": "__auto", |
| 2188 | + "range": false, |
| 2189 | + "refId": "L", |
| 2190 | + "hide": false |
2160 | 2191 | } |
2161 | 2192 | ], |
2162 | 2193 | "title": "OCI GPU Scanner - ACTIVE health check summary", |
|
2391 | 2422 | "test 6": true, |
2392 | 2423 | "test 7": true, |
2393 | 2424 | "test 8": true, |
2394 | | - "test 9": true |
| 2425 | + "test 9": true, |
| 2426 | + "Time 1": true, |
| 2427 | + "Value #L": false, |
| 2428 | + "dtype 11": true, |
| 2429 | + "dtype 12": true, |
| 2430 | + "dtype 13": true, |
| 2431 | + "dtype 14": true, |
| 2432 | + "dtype 15": true, |
| 2433 | + "dtype 16": true, |
| 2434 | + "dtype 17": true, |
| 2435 | + "dtype 18": true, |
| 2436 | + "dtype 19": true, |
| 2437 | + "dtype 20": true, |
| 2438 | + "dtype": true, |
| 2439 | + "tensor_parallel_size 11": true, |
| 2440 | + "tensor_parallel_size 12": true, |
| 2441 | + "tensor_parallel_size 13": true, |
| 2442 | + "tensor_parallel_size 14": true |
2395 | 2443 | }, |
2396 | 2444 | "includeByName": {}, |
2397 | | - "indexByName": {}, |
| 2445 | + "indexByName": { |
| 2446 | + "instance": 0, |
| 2447 | + "Value #L": 1, |
| 2448 | + "hostGPU 1": 2, |
| 2449 | + "hostIP 1": 3, |
| 2450 | + "hostRegion 1": 4, |
| 2451 | + "tensor_parallel_size 1": 5, |
| 2452 | + "Value #A": 6, |
| 2453 | + "Value #B": 7, |
| 2454 | + "Value #C": 8, |
| 2455 | + "Value #D": 9, |
| 2456 | + "Value #E": 10, |
| 2457 | + "Value #F": 11, |
| 2458 | + "Value #G": 12, |
| 2459 | + "Value #H": 13, |
| 2460 | + "Value #I": 14, |
| 2461 | + "Value #J": 15, |
| 2462 | + "Value #K": 16 |
| 2463 | + }, |
2398 | 2464 | "renameByName": { |
2399 | | - "Time 1": "Time Last Run", |
| 2465 | + "Time 1": "", |
| 2466 | + "tensor_parallel_size 1": "Tensor Parallel Size", |
2400 | 2467 | "Value #A": "Compute Throughput", |
2401 | 2468 | "Value #B": "Memory Bandwidth", |
2402 | 2469 | "Value #C": "Error Detection", |
|
2408 | 2475 | "Value #I": "GPU Temperature Check", |
2409 | 2476 | "Value #J": "GPU Power Check", |
2410 | 2477 | "Value #K": "GPU Utilization Check", |
2411 | | - "Value #L": "", |
| 2478 | + "Value #L": "Time Last Run", |
2412 | 2479 | "__name__ 1": "", |
2413 | 2480 | "gpu 1": "GPU", |
2414 | 2481 | "hostGPU 1": "GPU Shape", |
|
0 commit comments