Skip to content

Commit a06538a

Browse files
chore: merge remote-tracking branch 'origin' into feat/type-hints
* origin: [BFCL] Fix prompt concatenation bug in Qwen template (ShishirPatil#1068) [BFCL] Multi-turn TravelAPI book_flight() Fix (ShishirPatil#966) _get_item() can not handle the "." directory in path string (ShishirPatil#1060) Add support for llama-3.1-nemotron-ultra-253b-v1 to BFCL (ShishirPatil#1032) [BFCL] Omit Reasoning Content from Chat History for Function-Calling Models (ShishirPatil#1064) [BFCL] Add support for Ling-Lite-V1.5 (ShishirPatil#1056) [BFCL] Added support for DeepSeek-R1-0528 and DeepSeek-V3-0324 (ShishirPatil#1063) [BFCL] Add type hinting (ShishirPatil#1058)
2 parents c0c9f96 + ac37049 commit a06538a

25 files changed

+626
-293
lines changed

berkeley-function-call-leaderboard/CHANGELOG.md

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,12 @@
22

33
All notable changes to the Berkeley Function Calling Leaderboard will be documented in this file.
44

5+
- [Jun 18, 2025] [#1068](https://github.com/ShishirPatil/gorilla/pull/1068): Fix prompt concatenation issue in Qwen chat template. The self-hosted `Qwen3` models are affected.
6+
- [Jun 15, 2025] [#966](https://github.com/ShishirPatil/gorilla/pull/966): Removed the `travel_cost` parameter from the multi-turn backend `TravelAPI.book_flight()`; the cost is now computed internally to eliminate ambiguity.
7+
- [Jun 15, 2025] [#1060](https://github.com/ShishirPatil/gorilla/pull/1060): Fixed multi-turn backend `GorillaFileSystem._get_item()` method to correctly handle `"."` in path strings.
8+
- [Jun 14, 2025] [#1032](https://github.com/ShishirPatil/gorilla/pull/1032): Add `Llama-3.1-Nemotron-Ultra-253B-v1` to the leaderboard.
9+
- [Jun 12, 2025] [#1056](https://github.com/ShishirPatil/gorilla/pull/1056): Add `Ling-Lite-V1.5` to the leaderboard.
10+
- [Jun 12, 2025] [#1063](https://github.com/ShishirPatil/gorilla/pull/1063): Add support for `DeepSeek-R1-0528` and `DeepSeek-V3-0324`.
511
- [Jun 11, 2025] [#1061](https://github.com/ShishirPatil/gorilla/pull/1061): Add support for DashScope API inference for `Qwen3` series
612
- [Jun 8, 2025] [#1054](https://github.com/ShishirPatil/gorilla/pull/1054), [#1055](https://github.com/ShishirPatil/gorilla/pull/1055): Packagerize codebase for PyPI Distribution. Now available with `pip install bfcl-eval`, in addition to the existing `pip install -e`.
713
- [May 27, 2025] [#1040](https://github.com/ShishirPatil/gorilla/pull/1040): Add the following new models to the leaderboard:

berkeley-function-call-leaderboard/SUPPORTED_MODELS.md

Lines changed: 6 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -34,9 +34,10 @@ For model names containing `{...}`, multiple versions are available. For example
3434
| Command R7B | Function Calling | Cohere | command-r7b-12-2024-FC |
3535
| Command-R-Plus | Function Calling | Cohere | command-r-plus-FC |
3636
| DBRX-Instruct | Prompt | Databricks | databricks-dbrx-instruct |
37-
| DeepSeek-R1 | Prompt | DeepSeek | DeepSeek-R1 |
3837
| DeepSeek-R1 | Prompt | Self-hosted 💻 | deepseek-ai/DeepSeek-R1 |
39-
| DeepSeek-V3 | Function Calling | DeepSeek | DeepSeek-V3-FC |
38+
| DeepSeek-R1-0528 | Prompt | DeepSeek | DeepSeek-R1-0528 |
39+
| DeepSeek-R1-0528 | Function Calling | DeepSeek | DeepSeek-R1-0528-FC |
40+
| DeepSeek-V3-0324 | Function Calling | DeepSeek | DeepSeek-V3-0324-FC |
4041
| DM-Cito-8B | Prompt | Mininglamp | DM-Cito-8B |
4142
| Falcon3-{1B,3B,7B,10B}-Instruct | Function Calling | Self-hosted 💻 | tiiuae/Falcon3-{1B,3B,7B,10B}-Instruct |
4243
| FireFunction-v2 | Function Calling | Fireworks AI | firefunction-v2-FC |
@@ -73,6 +74,7 @@ For model names containing `{...}`, multiple versions are available. For example
7374
| Hammer2.1-{7b,3b,1.5b,0.5b} | Function Calling | Self-hosted 💻 | MadeAgents/Hammer2.1-{7b,3b,1.5b,0.5b} |
7475
| Llama-3.1-{8B,70B}-Instruct | Function Calling | Self-hosted 💻 | meta-llama/Llama-3.1-{8B,70B}-Instruct-FC |
7576
| Llama-3.1-{8B,70B}-Instruct | Prompt | Self-hosted 💻 | meta-llama/Llama-3.1-{8B,70B}-Instruct |
77+
| Llama-3.1-Nemotron-Ultra-253B-v1 | Prompt | Nvidia | nvidia/llama-3.1-nemotron-ultra-253b-v1 |
7678
| Llama-3.2-{1B,3B}-Instruct | Function Calling | Self-hosted 💻 | meta-llama/Llama-3.2-{1B,3B}-Instruct-FC |
7779
| Llama-3.3-70B-Instruct | Function Calling | Self-hosted 💻 | meta-llama/Llama-3.3-70B-Instruct-FC |
7880
| Llama-4-Maverick-17B-128E-Instruct-FP8 | Prompt | Novita AI | meta-llama/llama-4-maverick-17b-128e-instruct-fp8-novita |
@@ -104,7 +106,7 @@ For model names containing `{...}`, multiple versions are available. For example
104106
| Phi-4-mini-instruct | Function Calling | Self-hosted 💻 | microsoft/Phi-4-mini-instruct-FC |
105107
| Qwen3-{0.6B,1.7B,4B,8B,14B,32B} | Prompt | Alibaba Cloud | qwen3-{0.6b,1.7b,4b,8b,14b,32b} |
106108
| Qwen3-{0.6B,1.7B,4B,8B,14B,32B} | Prompt | Self-hosted 💻 | Qwen/Qwen3-{0.6B,1.7B,4B,8B,14B,32B} |
107-
| Qwen3-{0.6B,1.7B,4B,8B,14B,32B} | Function Calling | Alibaba Cloud | qwen3-{0.6b,1.7b,4b,8b,14b,32b}-FC |
109+
| Qwen3-{0.6B,1.7B,4B,8B,14B,32B} | Function Calling | Alibaba Cloud | qwen3-{0.6b,1.7b,4b,8b,14b,32b}-FC |
108110
| Qwen3-{0.6B,1.7B,4B,8B,14B,32B} | Function Calling | Self-hosted 💻 | Qwen/Qwen3-{0.6B,1.7B,4B,8B,14B,32B}-FC |
109111
| Qwen3-{30B-A3B,235B-A22B} | Prompt | Alibaba Cloud | qwen3-{30b-a3b, 235b-a22b} |
110112
| Qwen3-{30B-A3B,235B-A22B} | Prompt | Self-hosted 💻 | Qwen/Qwen3-{30B-A3B,235B-A22B} |
@@ -126,7 +128,7 @@ For model names containing `{...}`, multiple versions are available. For example
126128
| xLAM-2-70b-fc-r | Function Calling | Self-hosted 💻 | Salesforce/Llama-xLAM-2-70b-fc-r |
127129
| xLAM-2-8b-fc-r | Function Calling | Self-hosted 💻 | Salesforce/Llama-xLAM-2-8b-fc-r |
128130
| yi-large | Function Calling | 01.AI | yi-large-fc |
129-
131+
| Ling-lite-v1.5 | Prompt | Ant Group | Ling/ling-lite-v1.5 |
130132
---
131133

132134
## Additional Requirements for Certain Models

berkeley-function-call-leaderboard/bfcl_eval/.env.example

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -30,6 +30,9 @@ DATABRICKS_AZURE_ENDPOINT_URL=
3030
# [OPTIONAL] For inference via Novita AI endpoint
3131
NOVITA_API_KEY=sk-XXXXXX
3232

33+
# We use the API Key from Alipay to inference Bailing (Ling) models (see https://zxb.alipay.com/llm/landing)
34+
LING_API_KEY=sk-XXXXXX
35+
3336
# [OPTIONAL] For local vllm/sglang server configuration
3437
# Defaults to localhost port 1053 if not provided
3538
VLLM_ENDPOINT=localhost

berkeley-function-call-leaderboard/bfcl_eval/constants/model_config.py

Lines changed: 46 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -14,6 +14,7 @@
1414
from bfcl_eval.model_handler.api_inference.grok import GrokHandler
1515
from bfcl_eval.model_handler.api_inference.mining import MiningHandler
1616
from bfcl_eval.model_handler.api_inference.mistral import MistralHandler
17+
from bfcl_eval.model_handler.api_inference.nemotron import NemotronHandler
1718
from bfcl_eval.model_handler.api_inference.nexus import NexusHandler
1819
from bfcl_eval.model_handler.api_inference.nova import NovaHandler
1920
from bfcl_eval.model_handler.api_inference.novita import NovitaHandler
@@ -46,6 +47,7 @@
4647
from bfcl_eval.model_handler.local_inference.salesforce_llama import SalesforceLlamaHandler
4748
from bfcl_eval.model_handler.local_inference.salesforce_qwen import SalesforceQwenHandler
4849
from bfcl_eval.model_handler.local_inference.think_agent import ThinkAgentHandler
50+
from bfcl_eval.model_handler.api_inference.ling import LingAPIHandler
4951

5052
# -----------------------------------------------------------------------------
5153
# A mapping of model identifiers to their respective model configurations.
@@ -107,10 +109,10 @@ class ModelConfig:
107109
is_fc_model=False,
108110
underscore_to_dot=False,
109111
),
110-
"DeepSeek-R1": ModelConfig(
111-
model_name="DeepSeek-R1",
112-
display_name="DeepSeek-R1 (Prompt)",
113-
url="https://api-docs.deepseek.com/news/news1226",
112+
"DeepSeek-R1-0528": ModelConfig(
113+
model_name="DeepSeek-R1-0528",
114+
display_name="DeepSeek-R1-0528 (Prompt)",
115+
url="https://api-docs.deepseek.com/news/news250528",
114116
org="DeepSeek",
115117
license="MIT",
116118
model_handler=DeepSeekAPIHandler,
@@ -119,10 +121,22 @@ class ModelConfig:
119121
is_fc_model=False,
120122
underscore_to_dot=False,
121123
),
122-
"DeepSeek-V3-FC": ModelConfig(
123-
model_name="DeepSeek-V3-FC",
124-
display_name="DeepSeek-V3 (FC)",
125-
url="https://api-docs.deepseek.com/news/news1226",
124+
"DeepSeek-R1-0528-FC": ModelConfig(
125+
model_name="DeepSeek-R1-0528-FC",
126+
display_name="DeepSeek-R1-0528 (FC)",
127+
url="https://api-docs.deepseek.com/news/news250528",
128+
org="DeepSeek",
129+
license="MIT",
130+
model_handler=DeepSeekAPIHandler,
131+
input_price=None,
132+
output_price=None,
133+
is_fc_model=True,
134+
underscore_to_dot=True,
135+
),
136+
"DeepSeek-V3-0324-FC": ModelConfig(
137+
model_name="DeepSeek-V3-0324",
138+
display_name="DeepSeek-V3-0324 (FC)",
139+
url="https://api-docs.deepseek.com/news/news250325",
126140
org="DeepSeek",
127141
license="DeepSeek License",
128142
model_handler=DeepSeekAPIHandler,
@@ -743,6 +757,18 @@ class ModelConfig:
743757
is_fc_model=False,
744758
underscore_to_dot=False,
745759
),
760+
"nvidia/llama-3.1-nemotron-ultra-253b-v1": ModelConfig(
761+
model_name="nvidia/llama-3.1-nemotron-ultra-253b-v1",
762+
display_name="Llama-3.1-Nemotron-Ultra-253B-v1 (FC)",
763+
url="https://huggingface.co/nvidia/Llama-3_1-Nemotron-Ultra-253B-v1",
764+
org="NVIDIA",
765+
license="nvidia-open-model-license",
766+
model_handler=NemotronHandler,
767+
input_price=None,
768+
output_price=None,
769+
is_fc_model=True,
770+
underscore_to_dot=False,
771+
),
746772
"nvidia/nemotron-4-340b-instruct": ModelConfig(
747773
model_name="nvidia/nemotron-4-340b-instruct",
748774
display_name="Nemotron-4-340b-instruct (Prompt)",
@@ -1067,6 +1093,18 @@ class ModelConfig:
10671093
is_fc_model=False,
10681094
underscore_to_dot=False,
10691095
),
1096+
"Ling/ling-lite-v1.5": ModelConfig(
1097+
model_name="Ling/ling-lite-v1.5",
1098+
display_name="ling-lite-v1.5 (Prompt)",
1099+
url="https://huggingface.co/inclusionAI/Ling-lite-1.5",
1100+
org="Ling",
1101+
license="MIT",
1102+
model_handler=LingAPIHandler,
1103+
input_price=None,
1104+
output_price=None,
1105+
is_fc_model=False,
1106+
underscore_to_dot=False,
1107+
),
10701108
}
10711109

10721110
# Inference through local hosting

berkeley-function-call-leaderboard/bfcl_eval/constants/supported_models.py

Lines changed: 5 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -14,8 +14,9 @@
1414

1515
SUPPORTED_MODELS = [
1616
"gorilla-openfunctions-v2",
17-
"DeepSeek-R1",
18-
"DeepSeek-V3-FC",
17+
"DeepSeek-R1-0528",
18+
"DeepSeek-R1-0528-FC",
19+
"DeepSeek-V3-0324-FC",
1920
"gpt-4.5-preview-2025-02-27",
2021
"gpt-4.5-preview-2025-02-27-FC",
2122
"gpt-4.1-2025-04-14-FC",
@@ -67,6 +68,7 @@
6768
"command-r7b-12-2024-FC",
6869
"command-a-03-2025-FC",
6970
"snowflake/arctic",
71+
"nvidia/llama-3.1-nemotron-ultra-253b-v1",
7072
"nvidia/nemotron-4-340b-instruct",
7173
"BitAgent/GoGoAgent",
7274
"palmyra-x-004",
@@ -162,4 +164,5 @@
162164
"meta-llama/llama-4-scout-17b-16e-instruct-FC-novita",
163165
"qwen/qwq-32b-FC-novita",
164166
"qwen/qwq-32b-novita",
167+
"Ling/ling-lite-v1.5",
165168
]

0 commit comments

Comments
 (0)