// Test definitions: an array with one entry per test.
// NOTE: this file contains `//` comments, which strict JSON (RFC 8259) parsers
// reject. It must be loaded by a comment-tolerant reader, or the comments must
// be stripped before parsing.
[
  {
    // Human-readable label and explanation of the test.
    "name": "The output of the model is polite and informative",
    "description": "Uses another LLM to check if the output of the model is polite and informative",

    // Test category and the specific kind of check within that category.
    "type": "performance",
    "subtype": "llmRubricThresholdV2",

    // Each threshold pairs an insight (with its parameters) with a pass condition.
    "thresholds": [
      {
        "insightName": "llmRubricV2",
        "insightParameters": [
          {
            // List of rubric criteria handed to the LLM evaluator.
            "name": "criteria_list",
            "value": [
              {
                "name": "Polite and informative", // Display name of this criterion
                "criteria": "Ensure outputs are polite and informative", // Prompt given to the LLM evaluator
                "scoring": "Yes or No" // Allowed values: 'Yes or No' (binary evaluation) or '0-1' (score within the 0-1 range)
              }
            ]
          }
        ],
        // Pass condition, read literally: criteria0MeanScore >= 1.0.
        // NOTE(review): "criteria0" presumably refers to the first entry of
        // criteria_list, and a 'Yes' presumably counts as 1 -- confirm against
        // the evaluator's documentation.
        "measurement": "criteria0MeanScore",
        "operator": ">=",
        "value": 1.0
      }
    ],

    // No subpopulation filter is configured.
    "subpopulationFilters": null,
    "mode": "development",

    // Which resources the test uses.
    "usesValidationDataset": true, // Run the test against the validation set
    "usesTrainingDataset": false,
    "usesMlModel": false,

    // Unique identifier for this test (uniqueness scope not shown here -- TODO confirm).
    "syncId": "b4dee7dc-4f15-48ca-a282-63e2c04e0689"
  }
]