diff --git a/lang_agent/eval/evaluator.py b/lang_agent/eval/evaluator.py index 4e0d9f7..16b5e2a 100644 --- a/lang_agent/eval/evaluator.py +++ b/lang_agent/eval/evaluator.py @@ -56,7 +56,7 @@ class Evaluator: self.result = self.cli.evaluate( runnable, data=self.dataset.name, - evaluators=[self.validator.get_val_fnc(self.config.dataset_name)], + evaluators=self.validator.get_val_fnc(self.config.dataset_name), experiment_prefix=self.config.experiment_prefix, description=self.config.experiment_desc, max_concurrency=4 diff --git a/lang_agent/eval/validator.py b/lang_agent/eval/validator.py index 310cb42..47eeedb 100644 --- a/lang_agent/eval/validator.py +++ b/lang_agent/eval/validator.py @@ -21,7 +21,7 @@ class Validator: # NOTE: Need to register function here self.dict_corr_map = { - "Toxic Queries" : self.Toxic_Queries_correct + "Toxic Queries" : [self.Toxic_Queries_correct] } # NOTE: Need to register function here