mirror of
https://github.com/ikawrakow/ik_llama.cpp.git
synced 2026-06-28 04:30:15 -05:00
Fix Qwen3.5/3.6 MTP and -muge (#1816)
This commit is contained in:
parent
1f8c603d9c
commit
0ab9bdf793
@ -6013,6 +6013,9 @@ void llama_free_model(struct llama_model * model) {
|
||||
}
|
||||
|
||||
static void llama_repack_up_gate_exps(llama_context & lctx) {
|
||||
if (lctx.cparams.mtp_op_type != MTP_OP_NONE) {
|
||||
return;
|
||||
}
|
||||
auto & model = lctx.model;
|
||||
bool needs_repack = false;
|
||||
for (auto & l : model.layers) {
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user