Skip to content

Commit

Permalink
feat:Support QvQ-72B-Preview
Browse files (browse the repository at this point in the history)
  • Loading branch information
JunHowie authored and JunHowie committed Dec 27, 2024
1 parent 7ba5660 commit e7b0406
Show file tree
Hide file tree
Showing 3 changed files with 3 additions and 2 deletions.
2 changes: 1 addition & 1 deletion xinference/core/model.py
Original file line number Diff line number Diff line change
Expand Up @@ -76,7 +76,7 @@ class _OutOfMemoryError(Exception):
"glm-4v",
"MiniCPM-V-2.6",
"qwen2-vl-instruct",
- "qvq-72b-preview",
+ "QvQ-72B-Preview",
]

XINFERENCE_TEXT_TO_IMAGE_BATCHING_ALLOWED_MODELS = ["FLUX.1-dev", "FLUX.1-schnell"]
Expand Down
1 change: 1 addition & 0 deletions xinference/model/llm/transformers/core.py
Original file line number Diff line number Diff line change
Expand Up @@ -69,6 +69,7 @@
"deepseek-v2.5",
"deepseek-v2-chat-0628",
"glm-edge-v",
+ "QvQ-72B-Preview",
]


Expand Down
2 changes: 1 addition & 1 deletion xinference/model/llm/vllm/core.py
Original file line number Diff line number Diff line change
Expand Up @@ -195,7 +195,7 @@ class VLLMGenerateConfig(TypedDict, total=False):
VLLM_SUPPORTED_MODELS.append("llama-3.2-vision")
VLLM_SUPPORTED_VISION_MODEL_LIST.append("llama-3.2-vision-instruct")
VLLM_SUPPORTED_VISION_MODEL_LIST.append("qwen2-vl-instruct")
- VLLM_SUPPORTED_VISION_MODEL_LIST.append("qvq-72b-preview")
+ VLLM_SUPPORTED_VISION_MODEL_LIST.append("QvQ-72B-Preview")


class VLLMModel(LLM):
Expand Down

0 comments on commit e7b0406

Please sign in to comment.