mirror of
https://github.com/RYDE-WORK/llama.cpp.git
synced 2026-01-29 19:53:16 +08:00
llama : fix old glm4 models (#11670)
This commit is contained in:
parent
8a59053f63
commit
855cd0734a
@ -7217,7 +7217,7 @@ struct llm_build_context {
|
|||||||
struct ggml_tensor * Qcur = nullptr;
|
struct ggml_tensor * Qcur = nullptr;
|
||||||
struct ggml_tensor * Kcur = nullptr;
|
struct ggml_tensor * Kcur = nullptr;
|
||||||
struct ggml_tensor * Vcur = nullptr;
|
struct ggml_tensor * Vcur = nullptr;
|
||||||
if (model.type == LLM_TYPE_1_5B || model.type == LLM_TYPE_4B || model.type == LLM_TYPE_9B) {
|
if (model.layers[il].wqkv == nullptr) {
|
||||||
Qcur = llm_build_lora_mm(lctx, ctx0, model.layers[il].wq, cur);
|
Qcur = llm_build_lora_mm(lctx, ctx0, model.layers[il].wq, cur);
|
||||||
if (model.layers[il].bq) {
|
if (model.layers[il].bq) {
|
||||||
Qcur = ggml_add(ctx0, Qcur, model.layers[il].bq);
|
Qcur = ggml_add(ctx0, Qcur, model.layers[il].bq);
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user