We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 6f412e1 · commit 8af0ab8 · Copy full SHA for 8af0ab8
src/llama.cpp
@@ -7217,7 +7217,7 @@ struct llm_build_context {
7217
struct ggml_tensor * Qcur = nullptr;
7218
struct ggml_tensor * Kcur = nullptr;
7219
struct ggml_tensor * Vcur = nullptr;
7220
- if (model.type == LLM_TYPE_1_5B || model.type == LLM_TYPE_4B || model.type == LLM_TYPE_9B) {
+ if (model.layers[il].wqkv == nullptr) {
7221
Qcur = llm_build_lora_mm(lctx, ctx0, model.layers[il].wq, cur);
7222
if (model.layers[il].bq) {
7223
Qcur = ggml_add(ctx0, Qcur, model.layers[il].bq);
0 commit comments