Skip to content

Commit d3a4479

Browse files
authored
feat: improve tool calling & add tools to qwen 2.5 72b (#1615)
* fix: clean up tool calling to be more in line with the latest changes in the transformers lib, and add tool calling to qwen 2.5 72b
* fix: add more field name options
* fix: make tool calls a bit more robust
1 parent a27c61e commit d3a4479

File tree

6 files changed: +161 additions, -105 deletions (lines changed)

chart/env/prod.yaml

Lines changed: 1 addition & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -50,7 +50,6 @@ envVars:
5050
[
5151
{
5252
"name": "Qwen/Qwen2.5-72B-Instruct",
53-
"tokenizer": "Qwen/Qwen2.5-72B-Instruct",
5453
"description": "The latest Qwen open model with improved role-playing, long text generation and structured data understanding.",
5554
"modelUrl": "https://huggingface.co/Qwen/Qwen2.5-72B-Instruct",
5655
"websiteUrl": "https://qwenlm.github.io/blog/qwen2.5/",
@@ -62,6 +61,7 @@ envVars:
6261
"truncate": 28672,
6362
"max_new_tokens": 3072
6463
},
64+
"tools": true,
6565
"promptExamples": [
6666
{
6767
"title": "Write an email from bullet list",
@@ -80,7 +80,6 @@ envVars:
8080
{
8181
"name": "meta-llama/Meta-Llama-3.1-70B-Instruct",
8282
"id": "meta-llama/Meta-Llama-3.1-70B-Instruct",
83-
"tokenizer": "nsarrazin/llama3.1-tokenizer",
8483
"description": "Ideal for everyday use. A fast and extremely capable model matching closed source models' capabilities.",
8584
"modelUrl": "https://huggingface.co/meta-llama/Meta-Llama-3.1-70B-Instruct",
8685
"websiteUrl": "https://llama.meta.com/",
@@ -110,7 +109,6 @@ envVars:
110109
},
111110
{
112111
"name": "CohereForAI/c4ai-command-r-plus-08-2024",
113-
"tokenizer": "nsarrazin/c4ai-command-r-v01-tokenizer",
114112
"description": "Cohere's largest language model, optimized for conversational interaction and tool use. Now with the 2024 update!",
115113
"modelUrl": "https://huggingface.co/CohereForAI/c4ai-command-r-plus-08-2024",
116114
"websiteUrl": "https://docs.cohere.com/docs/command-r-plus",
@@ -350,10 +348,6 @@ envVars:
350348
},
351349
{
352350
"name": "llhf/Meta-Llama-3.1-8B-Instruct",
353-
"tokenizer": {
354-
"tokenizerUrl": "https://huggingface.co/nsarrazin/llama3.1-tokenizer/resolve/main/tokenizer.json",
355-
"tokenizerConfigUrl": "https://huggingface.co/nsarrazin/llama3.1-tokenizer/raw/main/tokenizer_config.json"
356-
},
357351
"parameters": {
358352
"temperature": 0.6,
359353
"stop": ["<|endoftext|>", "<|eot_id|>"]

package-lock.json

Lines changed: 76 additions & 51 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

package.json

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -63,10 +63,10 @@
6363
"dependencies": {
6464
"@aws-sdk/credential-providers": "^3.592.0",
6565
"@cliqz/adblocker-playwright": "^1.27.2",
66-
"@gradio/client": "^1.1.1",
66+
"@gradio/client": "^1.8.0",
6767
"@huggingface/hub": "^0.5.1",
68-
"@huggingface/inference": "^2.7.0",
69-
"@huggingface/transformers": "^3.0.0-alpha.6",
68+
"@huggingface/inference": "^2.8.1",
69+
"@huggingface/transformers": "^3.1.1",
7070
"@iconify-json/bi": "^1.1.21",
7171
"@playwright/browser-chromium": "^1.43.1",
7272
"@resvg/resvg-js": "^2.6.2",

0 commit comments

Comments
 (0)