Skip to content

Commit 8c20361

Browse files
authored
[BFCL] Add New Model gpt-4.5-preview-2025-02-27, gpt-4.5-preview-2025-02-27-FC (#922)
This PR adds the following new models to the leaderboard: `gpt-4.5-preview-2025-02-27` and `gpt-4.5-preview-2025-02-27-FC`. It also upgrades the `openai` library to version `1.65.0`.
1 parent e10b7f3 commit 8c20361

File tree

6 files changed, with 34 additions and 3 deletions.

6 files changed

+34
-3
lines changed

berkeley-function-call-leaderboard/CHANGELOG.md

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,9 @@
22

33
All notable changes to the Berkeley Function Calling Leaderboard will be documented in this file.
44

5+
- [Feb 27, 2025] [#922](https://github.com/ShishirPatil/gorilla/pull/922): Add the following new models to the leaderboard:
6+
- `gpt-4.5-preview-2025-02-27`
7+
- `gpt-4.5-preview-2025-02-27-FC`
58
- [Feb 24, 2025] [#917](https://github.com/ShishirPatil/gorilla/pull/917): Add new model `BitAgent/BitAgent-8B` to the leaderboard.
69
- [Feb 5, 2025] [#900](https://github.com/ShishirPatil/gorilla/pull/900), [#913](https://github.com/ShishirPatil/gorilla/pull/913): Add the following new models to the leaderboard:
710
- `uiuc-convai/CoALM-8B`

berkeley-function-call-leaderboard/SUPPORTED_MODELS.md

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -25,6 +25,8 @@ Below is a comprehensive table of models supported for running leaderboard evalu
2525
|gpt-4o-2024-11-20 | Prompt|
2626
|gpt-4o-mini-2024-07-18-FC | Function Calling|
2727
|gpt-4o-mini-2024-07-18 | Prompt|
28+
|gpt-4.5-preview-2025-02-27-FC | Function Calling|
29+
|gpt-4.5-preview-2025-02-27 | Prompt|
2830
|o1-2024-12-17-FC | Function Calling|
2931
|o1-2024-12-17 | Prompt|
3032
|o3-mini-2025-01-31-FC | Function Calling|

berkeley-function-call-leaderboard/bfcl/eval_checker/model_metadata.py

Lines changed: 25 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,12 @@
11
from bfcl.model_handler.handler_map import local_inference_handler_map
22

3+
# Items in the dictionary are in the format of:
4+
# {model_name: [
5+
# model_display_name_in_leaderboard,
6+
# url_to_model_page,
7+
# model_creator,
8+
# model_license,
9+
# ]}
310
MODEL_METADATA_MAPPING = {
411
"gorilla-openfunctions-v2": [
512
"Gorilla-OpenFunctions-v2 (FC)",
@@ -13,6 +20,18 @@
1320
"DeepSeek",
1421
"DeepSeek License",
1522
],
23+
"gpt-4.5-preview-2025-02-27-FC": [
24+
"GPT-4.5-Preview-2025-02-27 (FC)",
25+
"https://openai.com/index/introducing-gpt-4-5/",
26+
"OpenAI",
27+
"Proprietary",
28+
],
29+
"gpt-4.5-preview-2025-02-27": [
30+
"GPT-4.5-Preview-2025-02-27 (Prompt)",
31+
"https://openai.com/index/introducing-gpt-4-5/",
32+
"OpenAI",
33+
"Proprietary",
34+
],
1635
"o1-2024-12-17-FC": [
1736
"o1-2024-12-17 (FC)",
1837
"https://openai.com/o1/",
@@ -38,13 +57,13 @@
3857
"Proprietary",
3958
],
4059
"gpt-4o-2024-11-20": [
41-
"gpt-4o-2024-11-20 (Prompt)",
60+
"GPT-4o-2024-11-20 (Prompt)",
4261
"https://openai.com/index/hello-gpt-4o/",
4362
"OpenAI",
4463
"Proprietary",
4564
],
4665
"gpt-4o-2024-11-20-FC": [
47-
"gpt-4o-2024-11-20 (FC)",
66+
"GPT-4o-2024-11-20 (FC)",
4867
"https://openai.com/index/hello-gpt-4o/",
4968
"OpenAI",
5069
"Proprietary",
@@ -932,6 +951,8 @@
932951
"mistral-small-2402-FC": 1,
933952
"mistral-small-2402": 1,
934953
"mistral-tiny-2312": 0.25,
954+
"gpt-4.5-preview-2025-02-27-FC": 75,
955+
"gpt-4.5-preview-2025-02-27": 75,
935956
"o1-2024-12-17-FC": 15,
936957
"o1-2024-12-17": 15,
937958
"o3-mini-2025-01-31-FC": 1.1,
@@ -1005,6 +1026,8 @@
10051026
"mistral-medium-2312": 8.1,
10061027
"mistral-small-2402-FC": 3,
10071028
"mistral-tiny-2312": 0.25,
1029+
"gpt-4.5-preview-2025-02-27-FC": 150,
1030+
"gpt-4.5-preview-2025-02-27": 150,
10081031
"o1-2024-12-17-FC": 60,
10091032
"o1-2024-12-17": 60,
10101033
"o3-mini-2025-01-31-FC": 4,

berkeley-function-call-leaderboard/bfcl/model_handler/constant.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -114,6 +114,7 @@
114114
UNDERSCORE_TO_DOT = [
115115
# TODO: Use the model style to determine this, single source of truth
116116
"DeepSeek-V3",
117+
"gpt-4.5-preview-2025-02-27-FC",
117118
"o1-2024-12-17-FC",
118119
"o3-mini-2025-01-31-FC",
119120
"gpt-4o-2024-11-20-FC",

berkeley-function-call-leaderboard/bfcl/model_handler/handler_map.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -41,6 +41,8 @@
4141
api_inference_handler_map = {
4242
"gorilla-openfunctions-v2": GorillaHandler,
4343
"DeepSeek-V3": DeepSeekAPIHandler,
44+
"gpt-4.5-preview-2025-02-27": OpenAIHandler,
45+
"gpt-4.5-preview-2025-02-27-FC": OpenAIHandler,
4446
"o1-2024-12-17-FC": OpenAIHandler,
4547
"o1-2024-12-17": OpenAIHandler,
4648
"o3-mini-2025-01-31-FC": OpenAIHandler,

berkeley-function-call-leaderboard/pyproject.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,7 @@ dependencies = [
2222
"tree_sitter==0.21.3",
2323
"tree-sitter-java==0.21.0",
2424
"tree-sitter-javascript==0.21.4",
25-
"openai==1.58.0",
25+
"openai==1.65.0",
2626
"mistralai==1.1.0",
2727
"anthropic==0.39.0",
2828
"cohere==5.13.3",

0 commit comments

Comments
 (0)