From 57f29bc41c1f860391abc1c9ee6db812de20ef75 Mon Sep 17 00:00:00 2001 From: Yann Dubois Date: Sun, 18 Aug 2024 15:03:15 -0700 Subject: [PATCH] [ENH] add strict decoding OAI (#394) --- .../alpaca_eval_cot_gpt4_turbo_fn/configs.yaml | 1 + .../evaluators_configs/alpaca_eval_gpt4_fn/configs.yaml | 1 + .../evaluators_configs/alpaca_eval_gpt4_turbo_fn/configs.yaml | 1 + src/alpaca_eval/evaluators_configs/chatgpt_fn/configs.yaml | 1 + 4 files changed, 4 insertions(+) diff --git a/src/alpaca_eval/evaluators_configs/alpaca_eval_cot_gpt4_turbo_fn/configs.yaml b/src/alpaca_eval/evaluators_configs/alpaca_eval_cot_gpt4_turbo_fn/configs.yaml index 20615b68..f344346d 100644 --- a/src/alpaca_eval/evaluators_configs/alpaca_eval_cot_gpt4_turbo_fn/configs.yaml +++ b/src/alpaca_eval/evaluators_configs/alpaca_eval_cot_gpt4_turbo_fn/configs.yaml @@ -14,6 +14,7 @@ alpaca_eval_cot_gpt4_turbo_fn: function: name: "make_partial_leaderboard" description: "Make a leaderboard of models given a list of the models ordered by the preference of their outputs." + strict: true parameters: type: "object" properties: diff --git a/src/alpaca_eval/evaluators_configs/alpaca_eval_gpt4_fn/configs.yaml b/src/alpaca_eval/evaluators_configs/alpaca_eval_gpt4_fn/configs.yaml index f16b20e5..ddb1772d 100644 --- a/src/alpaca_eval/evaluators_configs/alpaca_eval_gpt4_fn/configs.yaml +++ b/src/alpaca_eval/evaluators_configs/alpaca_eval_gpt4_fn/configs.yaml @@ -14,6 +14,7 @@ alpaca_eval_gpt4_fn: function: name: "make_leaderboard" description: "Make a leaderboard of models given a list of the models ordered by the preference of their outputs." + strict: true parameters: type: "object" properties: diff --git a/src/alpaca_eval/evaluators_configs/alpaca_eval_gpt4_turbo_fn/configs.yaml b/src/alpaca_eval/evaluators_configs/alpaca_eval_gpt4_turbo_fn/configs.yaml index 9896a327..08262cfa 100644 --- a/src/alpaca_eval/evaluators_configs/alpaca_eval_gpt4_turbo_fn/configs.yaml +++ b/src/alpaca_eval/evaluators_configs/alpaca_eval_gpt4_turbo_fn/configs.yaml @@ -14,6 +14,7 @@ alpaca_eval_gpt4_turbo_fn: function: name: "make_partial_leaderboard" description: "Make a leaderboard of models given a list of the models ordered by the preference of their outputs." + strict: true parameters: type: "object" properties: diff --git a/src/alpaca_eval/evaluators_configs/chatgpt_fn/configs.yaml b/src/alpaca_eval/evaluators_configs/chatgpt_fn/configs.yaml index d200aa7b..1eb22f22 100644 --- a/src/alpaca_eval/evaluators_configs/chatgpt_fn/configs.yaml +++ b/src/alpaca_eval/evaluators_configs/chatgpt_fn/configs.yaml @@ -14,6 +14,7 @@ chatgpt_fn: function: name: "print_best_model" description: "Print the best model given the preferred output." + strict: true parameters: type: "object" properties: