Skip to content

Commit 1ce10c1

Browse files
committed
更新readme 发布新版本
1 parent 4a65448 commit 1ce10c1

File tree

4 files changed

+6
-4
lines changed

4 files changed

+6
-4
lines changed

Dockerfile.copy

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
FROM func.ink/506610466/gpt_server:latest
1+
FROM hub.littlediary.cn/506610466/gpt_server:latest
22

33
COPY ./ /gpt_server
44

README.md

+3-1
Original file line numberDiff line numberDiff line change
@@ -47,6 +47,7 @@
4747
## 更新信息
4848

4949
```plaintext
50+
2025-2-9 支持了 QVQ
5051
2024-12-22 支持了 tts, /v1/audio/speech TTS模型
5152
2024-12-21 支持了 text-moderation, /v1/moderations 文本审核模型
5253
2024-12-14 支持了 phi-4
@@ -170,7 +171,7 @@ python gpt_server/serving/main.py
170171
```bash
171172
docker pull 506610466/gpt_server:latest # 如果拉取失败可尝试下面的方式
172173
# 如果国内无法拉取docker镜像,可以尝试下面的国内镜像拉取的方式(不保证国内镜像源一直可用)
173-
docker pull func.ink/506610466/gpt_server:latest
174+
docker pull hub.littlediary.cn/506610466/gpt_server:latest
174175
```
175176

176177
##### 3.2.1 手动构建镜像(可选)
@@ -246,6 +247,7 @@ Chat UI界面:
246247
| InternVL2 | internvl2 | × | × | √ | √ |
247248
| MiniCPM-V-2_6 | minicpmv | × | √ | √ | × |
248249
| Qwen2-VL | qwen | × | √ | × | √ |
250+
| QVQ | qwen | × | √ | × | × |
249251
<br>
250252

251253
### Embedding/Rerank/Classify模型

gpt_server/model_backend/vllm_backend.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -88,7 +88,7 @@ async def stream_chat(self, params: Dict[str, Any]) -> AsyncGenerator:
8888
tokenizer = await self.engine.get_tokenizer()
8989
model_config = await self.engine.get_model_config()
9090
conversation, mm_data_future = parse_chat_messages_futures(
91-
messages, model_config, tokenizer
91+
messages, model_config, tokenizer, content_format="openai"
9292
)
9393
prompt = apply_hf_chat_template(
9494
tokenizer,

pyproject.toml

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
[project]
22
name = "gpt_server"
3-
version = "0.3.5"
3+
version = "0.3.6"
44
description = "gpt_server是一个用于生产级部署LLMs或Embedding的开源框架。"
55
readme = "README.md"
66
license = { text = "Apache 2.0" }

0 commit comments

Comments
 (0)