diff --git a/llama.cpp b/llama.cpp index ee6e28226d52d..4ac46193caf7c 100644 --- a/llama.cpp +++ b/llama.cpp @@ -5570,6 +5570,7 @@ static const std::unordered_map k_offload_map { "ffn_moe_weighted", OFFLOAD_FUNC }, { "ffn_moe_up", OFFLOAD_FUNC }, { "ffn_moe_gate", OFFLOAD_FUNC }, + { "ffn_moe_silu", OFFLOAD_FUNC }, { "ffn_moe_gate_par", OFFLOAD_FUNC }, { "ffn_moe_down", OFFLOAD_FUNC }, { "ffn_moe_out", OFFLOAD_FUNC },