Skip to content

Commit b30064f

Browse files
nirga and nina-kollman authored
docs: Update eval config + html eval (#151)
Co-authored-by: nina-kollman <59646487+nina-kollman@users.noreply.github.com>
1 parent 0d8234a commit b30064f

File tree

3 files changed

+100
-26
lines changed

3 files changed

+100
-26
lines changed
Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,3 @@
1+
---
2+
openapi: post /v2/evaluators/execute/html-comparison
3+
---

mint.json

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -290,6 +290,7 @@
290290
"api-reference/evaluators/execute-context-relevance-evaluator",
291291
"api-reference/evaluators/execute-conversation-quality-evaluator",
292292
"api-reference/evaluators/execute-faithfulness-evaluator",
293+
"api-reference/evaluators/execute-html-comparison-evaluator",
293294
"api-reference/evaluators/execute-instruction-adherence-evaluator",
294295
"api-reference/evaluators/execute-intent-change-evaluator",
295296
"api-reference/evaluators/execute-json-validator-evaluator",

openapi.json

Lines changed: 96 additions & 26 deletions
Original file line number | Diff line number | Diff line change
@@ -911,7 +911,7 @@
911911
},
912912
"/v2/evaluators/execute/conversation-quality": {
913913
"post": {
914-
"description": "Evaluate conversation quality based on tone, clarity, flow, responsiveness, and transparency\n\n**Request Body:**\n- `input.prompts` (string, required): JSON array of prompts in the conversation\n- `input.completions` (string, required): JSON array of completions in the conversation\n- `config.model` (string, optional): Model to use for evaluation (default: gpt-4o)",
914+
"description": "Evaluate conversation quality based on tone, clarity, flow, responsiveness, and transparency\n\n**Request Body:**\n- `input.prompts` (string, required): JSON array of prompts in the conversation\n- `input.completions` (string, required): JSON array of completions in the conversation",
915915
"requestBody": {
916916
"content": {
917917
"application/json": {
@@ -1023,6 +1023,63 @@
10231023
]
10241024
}
10251025
},
1026+
"/v2/evaluators/execute/html-comparison": {
1027+
"post": {
1028+
"description": "Compare two HTML documents for structural and content similarity\n\n**Request Body:**\n- `input.html1` (string, required): The first HTML document to compare\n- `input.html2` (string, required): The second HTML document to compare",
1029+
"requestBody": {
1030+
"content": {
1031+
"application/json": {
1032+
"schema": {
1033+
"$ref": "#/components/schemas/request.HtmlComparisonRequest"
1034+
}
1035+
}
1036+
},
1037+
"description": "Request body",
1038+
"required": true
1039+
},
1040+
"responses": {
1041+
"200": {
1042+
"description": "OK",
1043+
"content": {
1044+
"application/json": {
1045+
"schema": {
1046+
"$ref": "#/components/schemas/response.HtmlComparisonResponse"
1047+
}
1048+
}
1049+
}
1050+
},
1051+
"400": {
1052+
"description": "Bad Request",
1053+
"content": {
1054+
"application/json": {
1055+
"schema": {
1056+
"$ref": "#/components/schemas/response.ErrorResponse"
1057+
}
1058+
}
1059+
}
1060+
},
1061+
"500": {
1062+
"description": "Internal Server Error",
1063+
"content": {
1064+
"application/json": {
1065+
"schema": {
1066+
"$ref": "#/components/schemas/response.ErrorResponse"
1067+
}
1068+
}
1069+
}
1070+
}
1071+
},
1072+
"security": [
1073+
{
1074+
"BearerAuth": []
1075+
}
1076+
],
1077+
"summary": "Execute html-comparison evaluator",
1078+
"tags": [
1079+
"evaluators"
1080+
]
1081+
}
1082+
},
10261083
"/v2/evaluators/execute/instruction-adherence": {
10271084
"post": {
10281085
"description": "Evaluate how well responses follow given instructions\n\n**Request Body:**\n- `input.instructions` (string, required): The instructions that should be followed\n- `input.response` (string, required): The response to evaluate for instruction adherence",
@@ -1082,7 +1139,7 @@
10821139
},
10831140
"/v2/evaluators/execute/intent-change": {
10841141
"post": {
1085-
"description": "Detect changes in user intent between prompts and completions\n\n**Request Body:**\n- `input.prompts` (string, required): JSON array of prompts in the conversation\n- `input.completions` (string, required): JSON array of completions in the conversation\n- `config.model` (string, optional): Model to use for evaluation (default: gpt-4o)",
1142+
"description": "Detect changes in user intent between prompts and completions\n\n**Request Body:**\n- `input.prompts` (string, required): JSON array of prompts in the conversation\n- `input.completions` (string, required): JSON array of completions in the conversation",
10861143
"requestBody": {
10871144
"content": {
10881145
"application/json": {
@@ -2798,15 +2855,6 @@
27982855
],
27992856
"type": "object"
28002857
},
2801-
"request.ConversationQualityConfigRequest": {
2802-
"properties": {
2803-
"model": {
2804-
"example": "gpt-4o",
2805-
"type": "string"
2806-
}
2807-
},
2808-
"type": "object"
2809-
},
28102858
"request.ConversationQualityInput": {
28112859
"properties": {
28122860
"completions": {
@@ -2826,9 +2874,6 @@
28262874
},
28272875
"request.ConversationQualityRequest": {
28282876
"properties": {
2829-
"config": {
2830-
"$ref": "#/components/schemas/request.ConversationQualityConfigRequest"
2831-
},
28322877
"input": {
28332878
"$ref": "#/components/schemas/request.ConversationQualityInput"
28342879
}
@@ -2963,6 +3008,34 @@
29633008
},
29643009
"type": "object"
29653010
},
3011+
"request.HtmlComparisonInput": {
3012+
"properties": {
3013+
"html1": {
3014+
"example": "<html><body><h1>Hello, world!</h1></body></html>",
3015+
"type": "string"
3016+
},
3017+
"html2": {
3018+
"example": "<html><body><h1>Hello, world!</h1></body></html>",
3019+
"type": "string"
3020+
}
3021+
},
3022+
"required": [
3023+
"html1",
3024+
"html2"
3025+
],
3026+
"type": "object"
3027+
},
3028+
"request.HtmlComparisonRequest": {
3029+
"properties": {
3030+
"input": {
3031+
"$ref": "#/components/schemas/request.HtmlComparisonInput"
3032+
}
3033+
},
3034+
"required": [
3035+
"input"
3036+
],
3037+
"type": "object"
3038+
},
29663039
"request.InstructionAdherenceInput": {
29673040
"properties": {
29683041
"instructions": {
@@ -2991,15 +3064,6 @@
29913064
],
29923065
"type": "object"
29933066
},
2994-
"request.IntentChangeConfigRequest": {
2995-
"properties": {
2996-
"model": {
2997-
"example": "gpt-4o",
2998-
"type": "string"
2999-
}
3000-
},
3001-
"type": "object"
3002-
},
30033067
"request.IntentChangeInput": {
30043068
"properties": {
30053069
"completions": {
@@ -3019,9 +3083,6 @@
30193083
},
30203084
"request.IntentChangeRequest": {
30213085
"properties": {
3022-
"config": {
3023-
"$ref": "#/components/schemas/request.IntentChangeConfigRequest"
3024-
},
30253086
"input": {
30263087
"$ref": "#/components/schemas/request.IntentChangeInput"
30273088
}
@@ -3881,6 +3942,15 @@
38813942
},
38823943
"type": "object"
38833944
},
3945+
"response.HtmlComparisonResponse": {
3946+
"properties": {
3947+
"similarity_score": {
3948+
"example": 0.92,
3949+
"type": "number"
3950+
}
3951+
},
3952+
"type": "object"
3953+
},
38843954
"response.InstructionAdherenceResponse": {
38853955
"properties": {
38863956
"instruction_adherence_score": {

0 commit comments

Comments (0)