|
3 | 3 | "startTime": "2024-11-28T12:00:00Z", |
4 | 4 | "endTime": "2024-11-28T12:05:00Z", |
5 | 5 | "errorMessage": null, |
6 | | - "testCases": [ |
7 | | - { |
8 | | - "status": "COMPLETED", |
9 | | - "number": 1, |
10 | | - "startTime": "2024-11-28T12:00:10Z", |
11 | | - "endTime": "2024-11-28T12:00:20Z", |
12 | | - "generatedData": { |
13 | | - "type": "AGENT", |
14 | | - "actionsSequence": ["Action1", "Action2"], |
15 | | - "outcome": "Success", |
16 | | - "topic": "Mathematics", |
17 | | - "inputTokensCount": 50, |
18 | | - "outputTokensCount": 55 |
19 | | - }, |
20 | | - "expectationResults": [ |
21 | | - { |
22 | | - "name": "topic_sequence_match", |
23 | | - "actualValue": "Result A", |
24 | | - "expectedValue": "Result A", |
25 | | - "score": 1.0, |
26 | | - "result": "Passed", |
27 | | - "metricLabel": "Accuracy", |
28 | | - "metricExplainability": "Measures the correctness of the result.", |
29 | | - "status": "Completed", |
30 | | - "startTime": "2024-11-28T12:00:12Z", |
31 | | - "endTime": "2024-11-28T12:00:13Z", |
32 | | - "errorCode": null, |
33 | | - "errorMessage": null |
| 6 | + "subjectName": "Copilot_for_Salesforce", |
| 7 | + "testSet": { |
| 8 | + "name": "CRM_Sanity_v1", |
| 9 | + "testCases": [ |
| 10 | + { |
| 11 | + "status": "COMPLETED", |
| 12 | + "number": 1, |
| 13 | + "startTime": "2024-11-28T12:00:10Z", |
| 14 | + "endTime": "2024-11-28T12:00:20Z", |
| 15 | + "generatedData": { |
| 16 | + "type": "AGENT", |
| 17 | + "actionsSequence": ["Action1", "Action2"], |
| 18 | + "outcome": "Success", |
| 19 | + "topic": "Mathematics", |
| 20 | + "inputTokensCount": 50, |
| 21 | + "outputTokensCount": 55 |
34 | 22 | }, |
35 | | - { |
36 | | - "name": "action_sequence_match", |
37 | | - "actualValue": "Result B", |
38 | | - "expectedValue": "Result B", |
39 | | - "score": 0.9, |
40 | | - "result": "Passed", |
41 | | - "metricLabel": "Precision", |
42 | | - "metricExplainability": "Measures the precision of the result.", |
43 | | - "status": "Completed", |
44 | | - "startTime": "2024-11-28T12:00:14Z", |
45 | | - "endTime": "2024-11-28T12:00:15Z", |
46 | | - "errorCode": null, |
47 | | - "errorMessage": null |
48 | | - } |
49 | | - ] |
50 | | - }, |
51 | | - { |
52 | | - "status": "ERROR", |
53 | | - "number": 2, |
54 | | - "startTime": "2024-11-28T12:00:30Z", |
55 | | - "endTime": "2024-11-28T12:00:40Z", |
56 | | - "generatedData": { |
57 | | - "type": "AGENT", |
58 | | - "actionsSequence": ["Action3", "Action4"], |
59 | | - "outcome": "Failure", |
60 | | - "topic": "Physics", |
61 | | - "inputTokensCount": 60, |
62 | | - "outputTokensCount": 50 |
| 23 | + "expectationResults": [ |
| 24 | + { |
| 25 | + "name": "topic_sequence_match", |
| 26 | + "actualValue": "Result A", |
| 27 | + "expectedValue": "Result A", |
| 28 | + "score": 1.0, |
| 29 | + "result": "Passed", |
| 30 | + "metricLabel": "Accuracy", |
| 31 | + "metricExplainability": "Measures the correctness of the result.", |
| 32 | + "status": "Completed", |
| 33 | + "startTime": "2024-11-28T12:00:12Z", |
| 34 | + "endTime": "2024-11-28T12:00:13Z", |
| 35 | + "errorCode": null, |
| 36 | + "errorMessage": null |
| 37 | + }, |
| 38 | + { |
| 39 | + "name": "action_sequence_match", |
| 40 | + "actualValue": "Result B", |
| 41 | + "expectedValue": "Result B", |
| 42 | + "score": 0.9, |
| 43 | + "result": "Passed", |
| 44 | + "metricLabel": "Precision", |
| 45 | + "metricExplainability": "Measures the precision of the result.", |
| 46 | + "status": "Completed", |
| 47 | + "startTime": "2024-11-28T12:00:14Z", |
| 48 | + "endTime": "2024-11-28T12:00:15Z", |
| 49 | + "errorCode": null, |
| 50 | + "errorMessage": null |
| 51 | + } |
| 52 | + ] |
63 | 53 | }, |
64 | | - "expectationResults": [ |
65 | | - { |
66 | | - "name": "topic_sequence_match", |
67 | | - "actualValue": "Result C", |
68 | | - "expectedValue": "Result D", |
69 | | - "score": 0.5, |
70 | | - "result": "Failed", |
71 | | - "metricLabel": "Accuracy", |
72 | | - "metricExplainability": "Measures the correctness of the result.", |
73 | | - "status": "Completed", |
74 | | - "startTime": "2024-11-28T12:00:32Z", |
75 | | - "endTime": "2024-11-28T12:00:33Z", |
76 | | - "errorCode": null, |
77 | | - "errorMessage": null |
78 | | - } |
79 | | - ] |
80 | | - } |
81 | | - ] |
| 54 | + { |
| 55 | + "status": "ERROR", |
| 56 | + "number": 2, |
| 57 | + "startTime": "2024-11-28T12:00:30Z", |
| 58 | + "endTime": "2024-11-28T12:00:40Z", |
| 59 | + "generatedData": { |
| 60 | + "type": "AGENT", |
| 61 | + "actionsSequence": ["Action3", "Action4"], |
| 62 | + "outcome": "Failure", |
| 63 | + "topic": "Physics", |
| 64 | + "inputTokensCount": 60, |
| 65 | + "outputTokensCount": 50 |
| 66 | + }, |
| 67 | + "expectationResults": [ |
| 68 | + { |
| 69 | + "name": "topic_sequence_match", |
| 70 | + "actualValue": "Result C", |
| 71 | + "expectedValue": "Result D", |
| 72 | + "score": 0.5, |
| 73 | + "result": "Failed", |
| 74 | + "metricLabel": "Accuracy", |
| 75 | + "metricExplainability": "Measures the correctness of the result.", |
| 76 | + "status": "Completed", |
| 77 | + "startTime": "2024-11-28T12:00:32Z", |
| 78 | + "endTime": "2024-11-28T12:00:33Z", |
| 79 | + "errorCode": null, |
| 80 | + "errorMessage": "Expected \"Result D\" but got \"Result C\"." |
| 81 | + }, |
| 82 | + { |
| 83 | + "name": "topic_sequence_match", |
| 84 | + "actualValue": "Result C", |
| 85 | + "expectedValue": "Result D", |
| 86 | + "score": 0.5, |
| 87 | + "result": "Failed", |
| 88 | + "metricLabel": "Accuracy", |
| 89 | + "metricExplainability": "Measures the correctness of the result.", |
| 90 | + "status": "Completed", |
| 91 | + "startTime": "2024-11-28T12:00:32Z", |
| 92 | + "endTime": "2024-11-28T12:00:33Z", |
| 93 | + "errorCode": null, |
| 94 | + "errorMessage": "Expected \"Result D\" but got \"Result C\"." |
| 95 | + } |
| 96 | + ] |
| 97 | + } |
| 98 | + ] |
| 99 | + } |
82 | 100 | } |
0 commit comments