From 996b3a658b3570e76fcdf64b903a9c7a8d31b78e Mon Sep 17 00:00:00 2001
From: Rita Aleksziev
Date: Thu, 28 Nov 2024 16:53:33 +0100
Subject: [PATCH] add custom metric implementation

---
Review notes (this area sits after the three-dash line, so it is not part
of the commit message):

  This patch creates evals/deepeval_metrics.py. The new module defines one
  module-level object, `correctness_metric`, built by calling deepeval's
  `GEval` with:
    * name "Correctness"
    * model "gpt-4o-mini"
    * evaluation_params ACTUAL_OUTPUT and EXPECTED_OUTPUT
      (members of `LLMTestCaseParams`)
    * a single evaluation step asking whether the actual output is
      factually correct based on the expected output.

  The `GEval(...)` call is a top-level statement, so it runs when the
  module is imported.

  NOTE(review): presumably the model string selects the LLM used as judge
  and needs provider credentials at evaluation time - confirm against the
  deepeval documentation.
  NOTE(review): the indentation inside the hunk was reconstructed from a
  whitespace-collapsed copy of this patch; verify it against blob
  03f9f6dba before applying.

 evals/deepeval_metrics.py | 14 ++++++++++++++
 1 file changed, 14 insertions(+)
 create mode 100644 evals/deepeval_metrics.py

diff --git a/evals/deepeval_metrics.py b/evals/deepeval_metrics.py
new file mode 100644
index 000000000..03f9f6dba
--- /dev/null
+++ b/evals/deepeval_metrics.py
@@ -0,0 +1,14 @@
+from deepeval.metrics import GEval
+from deepeval.test_case import LLMTestCaseParams
+
+correctness_metric = GEval(
+    name="Correctness",
+    model="gpt-4o-mini",
+    evaluation_params=[
+        LLMTestCaseParams.ACTUAL_OUTPUT,
+        LLMTestCaseParams.EXPECTED_OUTPUT
+    ],
+    evaluation_steps=[
+        "Determine whether the actual output is factually correct based on the expected output."
+    ]
+    )