File tree Expand file tree Collapse file tree 5 files changed +99
-69
lines changed Expand file tree Collapse file tree 5 files changed +99
-69
lines changed Original file line number Diff line number Diff line change @@ -99,5 +99,5 @@ def get_embedding_mode(model_path: str):
9999if __name__ == "__main__" :
100100
101101 # 示例用法
102- r = get_embedding_mode ("/home/dev/model/BAAI/bge-m3 /" )
102+ r = get_embedding_mode ("/home/dev/model/Qwen/Qwen3-Reranker-0___6B /" )
103103 print (r )
Original file line number Diff line number Diff line change 11from typing import Tuple
22
3- __version__ = "0.3.7 "
3+ __version__ = "0.6.0 "
44short_version = __version__
55
66
Original file line number Diff line number Diff line change 11[project ]
22name = " gpt_server"
3- version = " 0.5.4 "
3+ version = " 0.6.0 "
44description = " gpt_server是一个用于生产级部署LLMs或Embedding的开源框架。"
55readme = " README.md"
66license = { text = " Apache 2.0" }
@@ -12,7 +12,7 @@ dependencies = [
1212 " ffmpy" ,
1313 " fschat==0.2.36" ,
1414 " infinity-emb[all]==0.0.76" ,
15- " lmdeploy==0.9.1 " ,
15+ " lmdeploy==0.9.2 " ,
1616 " loguru>=0.7.2" ,
1717 " openai==1.86.0" ,
1818 " setuptools==75.2.0" ,
@@ -25,7 +25,7 @@ dependencies = [
2525 " modelscope==1.26.0" ,
2626 " edge-tts>=7.0.0" ,
2727 " funasr>=1.2.6" ,
28- " sglang[all]>=0.4.9.post3 " ,
28+ " sglang[all]>=0.4.10 " ,
2929 " flashinfer-python" ,
3030 " flashtts>=0.1.7" ,
3131 " diffusers>=0.33.1" ,
@@ -42,6 +42,7 @@ override-dependencies = [
4242 " transformers==4.53.3" , # infinity-emb
4343 " soundfile==0.13.1" , # infinity
4444 " xgrammar==0.1.21" , # sglang[all]==0.4.5 depends on xgrammar==0.1.17
45+ " flashinfer-python==0.2.10" ,
4546]
4647
4748[project .scripts ]
You can’t perform that action at this time.
0 commit comments