From f62ea6285c1f026ae61450c26c87d9694ad9bba4 Mon Sep 17 00:00:00 2001 From: Yifan Mai Date: Tue, 4 Feb 2025 14:16:59 -0800 Subject: [PATCH] Add QwQ model on Together AI (#3307) --- src/helm/config/model_deployments.yaml | 7 +++++++ src/helm/config/model_metadata.yaml | 9 +++++++++ src/helm/config/tokenizer_configs.yaml | 10 ++++++++-- 3 files changed, 24 insertions(+), 2 deletions(-) diff --git a/src/helm/config/model_deployments.yaml b/src/helm/config/model_deployments.yaml index 571c4c8125..9b82fa1d71 100644 --- a/src/helm/config/model_deployments.yaml +++ b/src/helm/config/model_deployments.yaml @@ -2824,6 +2824,13 @@ model_deployments: client_spec: class_name: "helm.clients.together_client.TogetherChatClient" + - name: together/qwq-32b-preview + model_name: qwen/qwq-32b-preview + tokenizer_name: qwen/qwq-32b-preview + max_sequence_length: 32768 + client_spec: + class_name: "helm.clients.together_client.TogetherChatClient" + - name: huggingface/qwen-vl model_name: qwen/qwen-vl tokenizer_name: qwen/qwen-vl diff --git a/src/helm/config/model_metadata.yaml b/src/helm/config/model_metadata.yaml index f534e93c26..8f90556616 100644 --- a/src/helm/config/model_metadata.yaml +++ b/src/helm/config/model_metadata.yaml @@ -2909,6 +2909,15 @@ models: release_date: 2024-09-19 tags: [TEXT_MODEL_TAG, LIMITED_FUNCTIONALITY_TEXT_MODEL_TAG, INSTRUCTION_FOLLOWING_MODEL_TAG] + - name: qwen/qwq-32b-preview + display_name: QwQ (32B Preview) + description: QwQ-32B-Preview is an experimental research model developed by the Qwen Team, focused on advancing AI reasoning capabilities. ([blog post](https://qwenlm.github.io/blog/qwq-32b-preview/)). + creator_organization_name: Alibaba Cloud + access: open + num_parameters: 32800000000 + release_date: 2024-11-28 + tags: [TEXT_MODEL_TAG, LIMITED_FUNCTIONALITY_TEXT_MODEL_TAG, INSTRUCTION_FOLLOWING_MODEL_TAG] + - name: qwen/qwen-vl display_name: Qwen-VL description: Visual multimodal version of the Qwen large language model series ([paper](https://arxiv.org/abs/2308.12966)). diff --git a/src/helm/config/tokenizer_configs.yaml b/src/helm/config/tokenizer_configs.yaml index 0260ce204f..f9c7f45623 100644 --- a/src/helm/config/tokenizer_configs.yaml +++ b/src/helm/config/tokenizer_configs.yaml @@ -578,7 +578,7 @@ tokenizer_configs: args: pretrained_model_name_or_path: Qwen/Qwen2-72B-Instruct end_of_text_token: "<|im_end|>" - prefix_token: "<|im_start|>'" + prefix_token: "<|im_start|>" - name: qwen/qwen2.5-7b-instruct tokenizer_spec: @@ -586,7 +586,13 @@ tokenizer_configs: args: pretrained_model_name_or_path: Qwen/Qwen2.5-7B-Instruct end_of_text_token: "<|im_end|>" - prefix_token: "<|im_start|>'" + prefix_token: "<|im_start|>" + + - name: qwen/qwq-32b-preview + tokenizer_spec: + class_name: "helm.tokenizers.huggingface_tokenizer.HuggingFaceTokenizer" + end_of_text_token: "<|im_end|>" + prefix_token: "" - name: qwen/qwen-vl tokenizer_spec: