File tree Expand file tree Collapse file tree 3 files changed +3
-3
lines changed
Expand file tree Collapse file tree 3 files changed +3
-3
lines changed Original file line number Diff line number Diff line change @@ -110,7 +110,7 @@ def __init__(self, kvargs):
110110 self ._init_some_value ()
111111 self ._init_custom ()
112112 self ._init_inferstate_cls ()
113- # self._autotune_warmup()
113+ self ._autotune_warmup ()
114114 self ._init_padded_req ()
115115 # wait必须在init cudagraph 之前,避免错误捕获
116116 self ._wait_other_modules_ready ()
Original file line number Diff line number Diff line change @@ -50,7 +50,7 @@ def __init__(self, model):
5050 self .softmax_scale = self .softmax_scale * mscale * mscale
5151
5252
53- @ModelRegistry (["deepseek_v2" , "deepseek_v3" , "deepseek_v32" ])
53+ @ModelRegistry (["deepseek_v2" , "deepseek_v3" ])
5454class Deepseek2TpPartModel (LlamaTpPartModel ):
5555 # weight class
5656 transformer_weight_class = Deepseek2TransformerLayerWeight
Original file line number Diff line number Diff line change 55from lightllm .utils .envs_utils import get_env_start_args
66from lightllm .models .deepseek3_2 .infer_struct import Deepseek3_2FlashAttentionStateInfo
77from lightllm .models .deepseek3_2 .mem_manager import Deepseek3_2MemoryManager , Deepseek3_2FP8KVMemoryManager
8- # @ModelRegistry(["deepseek_v32"])
8+ @ModelRegistry (["deepseek_v32" ])
99class Deepseek3_2TpPartModel (Deepseek2TpPartModel ):
1010 # weight class
1111 transformer_weight_class = Deepseek3_2TransformerLayerWeight
You can’t perform that action at this time.
0 commit comments