@@ -13861,14 +13861,14 @@ struct llm_build_context {
1386113861 cb(Qcur, "Qcur", il);
1386213862 }
1386313863
13864- struct ggml_tensor * Kcur = ggml_mul_mat( ctx0, model.layers[il].wk, cur);
13864+ struct ggml_tensor * Kcur = llm_build_lora_mm(lctx, ctx0, model.layers[il].wk, cur);
1386513865 cb(Kcur, "Kcur", il);
1386613866 if (model.layers[il].bk) {
1386713867 Kcur = ggml_add(ctx0, Kcur, model.layers[il].bk);
1386813868 cb(Kcur, "Kcur", il);
1386913869 }
1387013870
13871- struct ggml_tensor * Vcur = ggml_mul_mat( ctx0, model.layers[il].wv, cur);
13871+ struct ggml_tensor * Vcur = llm_build_lora_mm(lctx, ctx0, model.layers[il].wv, cur);
1387213872 cb(Vcur, "Vcur", il);
1387313873 if (model.layers[il].bv) {
1387413874 Vcur = ggml_add(ctx0, Vcur, model.layers[il].bv);
@@ -13937,7 +13937,7 @@ struct llm_build_context {
1393713937 cb(cur, "result_norm", -1);
1393813938
1393913939 // lm_head
13940- cur = ggml_mul_mat( ctx0, model.output, cur);
13940+ cur = llm_build_lora_mm(lctx, ctx0, model.output, cur);
1394113941 cb(cur, "result_output", -1);
1394213942
1394313943 ggml_build_forward_expand(gf, cur);
0 commit comments