From 6fd879cea94003c54ee35ea4b67c178134381b60 Mon Sep 17 00:00:00 2001 From: JinCheng666 <48248936+JinCheng666@users.noreply.github.com> Date: Thu, 24 Oct 2024 20:42:29 +0800 Subject: [PATCH] BUG: fix embedding model gte-Qwen2 dimensions (#2479) --- doc/source/models/builtin/embedding/gte-qwen2.rst | 4 ++-- xinference/model/embedding/model_spec.json | 2 +- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/doc/source/models/builtin/embedding/gte-qwen2.rst b/doc/source/models/builtin/embedding/gte-qwen2.rst index a88fdece9d..85eeeac39a 100644 --- a/doc/source/models/builtin/embedding/gte-qwen2.rst +++ b/doc/source/models/builtin/embedding/gte-qwen2.rst @@ -11,11 +11,11 @@ gte-Qwen2 Specifications ^^^^^^^^^^^^^^ -- **Dimensions:** 4096 +- **Dimensions:** 3584 - **Max Tokens:** 32000 - **Model ID:** Alibaba-NLP/gte-Qwen2-7B-instruct - **Model Hubs**: `Hugging Face `__, `ModelScope `__ Execute the following command to launch the model:: - xinference launch --model-name gte-Qwen2 --model-type embedding \ No newline at end of file + xinference launch --model-name gte-Qwen2 --model-type embedding diff --git a/xinference/model/embedding/model_spec.json b/xinference/model/embedding/model_spec.json index 14d4ced519..dc8d851b85 100644 --- a/xinference/model/embedding/model_spec.json +++ b/xinference/model/embedding/model_spec.json @@ -233,7 +233,7 @@ }, { "model_name": "gte-Qwen2", - "dimensions": 4096, + "dimensions": 3584, "max_tokens": 32000, "language": ["zh", "en"], "model_id": "Alibaba-NLP/gte-Qwen2-7B-instruct",