diff --git a/community_tasks/french_evals.py b/community_tasks/french_evals.py index 81fd2c367..29b820840 100644 --- a/community_tasks/french_evals.py +++ b/community_tasks/french_evals.py @@ -111,7 +111,7 @@ def prompt_gpqa_fr(line, task_name: str = None): few_shots_split=None, few_shots_select="random_sampling", generation_size=1, - metric=[Metrics.loglikelihood_acc_single_token], + metric=[Metrics.loglikelihood_acc], stop_sequence=["\n"], trust_dataset=True, version=0,