Skip to content

Commit 9c99de1

Browse files
committed
将models 设置为全局
1 parent 4ee1b45 commit 9c99de1

File tree

1 file changed

+6
-4
lines changed

1 file changed

+6
-4
lines changed

gpt_server/serving/openai_api_server.py

Lines changed: 6 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -111,11 +111,12 @@ class AppSettings(BaseSettings):
111111
from contextlib import asynccontextmanager
112112

113113
model_address_map = {}
114+
models_ = []
114115

115116

116117
async def timing_tasks():
117118
"""定时任务"""
118-
global model_address_map
119+
global model_address_map, models_
119120
logger.info("定时任务已启动!")
120121
controller_address = app_settings.controller_address
121122

@@ -135,6 +136,7 @@ async def timing_tasks():
135136
worker_address_list = await asyncio.gather(*worker_addr_coro_list)
136137
for model, worker_addr in zip(models, worker_address_list):
137138
model_address_map[model] = worker_addr
139+
models_ = list(model_address_map.keys())
138140
await asyncio.sleep(6)
139141
except Exception:
140142
traceback.print_exc()
@@ -186,10 +188,10 @@ async def validation_exception_handler(request, exc):
186188

187189

188190
def check_model(request) -> Optional[JSONResponse]:
189-
global model_address_map
191+
global model_address_map, models_
190192
ret = None
191-
models = list(model_address_map.keys())
192-
if request.model not in models:
193+
models = models_
194+
if request.model not in models_:
193195
ret = create_error_response(
194196
ErrorCode.INVALID_MODEL,
195197
f"Only {'&&'.join(models)} allowed now, your model {request.model}",

0 commit comments

Comments
 (0)