@@ -566,8 +566,8 @@ struct ggml_tensor * forward(
566
566
// wk shape [n_embd, n_embd, 1, 1]
567
567
// Qcur shape [n_embd/n_head, n_head, N, 1]
568
568
// Kcur shape [n_embd/n_head, n_head, N, 1]
569
- struct ggml_tensor * Qcur = ggml_rope (ctx0, ggml_reshape_3d (ctx0, ggml_mul_mat (ctx0, model->layers [il].wq , cur), n_embd/n_head, n_head, N), n_past, n_rot, 0 );
570
- struct ggml_tensor * Kcur = ggml_rope (ctx0, ggml_reshape_3d (ctx0, ggml_mul_mat (ctx0, model->layers [il].wk , cur), n_embd/n_head, n_head, N), n_past, n_rot, 0 );
569
+ struct ggml_tensor * Qcur = ggml_rope (ctx0, ggml_reshape_3d (ctx0, ggml_mul_mat (ctx0, model->layers [il].wq , cur), n_embd/n_head, n_head, N), n_past, n_rot, 0 , 0 );
570
+ struct ggml_tensor * Kcur = ggml_rope (ctx0, ggml_reshape_3d (ctx0, ggml_mul_mat (ctx0, model->layers [il].wk , cur), n_embd/n_head, n_head, N), n_past, n_rot, 0 , 0 );
571
571
572
572
// store key and value to memory
573
573
{
@@ -823,8 +823,8 @@ struct ggml_tensor * forward_batch(
823
823
// wk shape [n_embd, n_embd, 1, 1]
824
824
// Qcur shape [n_embd/n_head, n_head, N, n_batch]
825
825
// Kcur shape [n_embd/n_head, n_head, N, n_batch]
826
- struct ggml_tensor * Qcur = ggml_rope (ctx0, ggml_reshape_4d (ctx0, ggml_mul_mat (ctx0, model->layers [il].wq , cur), n_embd/n_head, n_head, N, n_batch), n_past, n_rot, 0 );
827
- struct ggml_tensor * Kcur = ggml_rope (ctx0, ggml_reshape_4d (ctx0, ggml_mul_mat (ctx0, model->layers [il].wk , cur), n_embd/n_head, n_head, N, n_batch), n_past, n_rot, 0 );
826
+ struct ggml_tensor * Qcur = ggml_rope (ctx0, ggml_reshape_4d (ctx0, ggml_mul_mat (ctx0, model->layers [il].wq , cur), n_embd/n_head, n_head, N, n_batch), n_past, n_rot, 0 , 0 );
827
+ struct ggml_tensor * Kcur = ggml_rope (ctx0, ggml_reshape_4d (ctx0, ggml_mul_mat (ctx0, model->layers [il].wk , cur), n_embd/n_head, n_head, N, n_batch), n_past, n_rot, 0 , 0 );
828
828
assert_shape_4d (Qcur, n_embd/n_head, n_head, N, n_batch);
829
829
assert_shape_4d (Kcur, n_embd/n_head, n_head, N, n_batch);
830
830
@@ -1116,7 +1116,7 @@ struct ggml_tensor * forward_lora(
1116
1116
model->layers [il].wqb ,
1117
1117
cur)),
1118
1118
n_embd/n_head, n_head, N),
1119
- n_past, n_rot, 0 );
1119
+ n_past, n_rot, 0 , 0 );
1120
1120
struct ggml_tensor * Kcur = ggml_rope (ctx0,
1121
1121
ggml_reshape_3d (ctx0,
1122
1122
ggml_mul_mat (ctx0,
@@ -1125,7 +1125,7 @@ struct ggml_tensor * forward_lora(
1125
1125
model->layers [il].wkb ,
1126
1126
cur)),
1127
1127
n_embd/n_head, n_head, N),
1128
- n_past, n_rot, 0 );
1128
+ n_past, n_rot, 0 , 0 );
1129
1129
1130
1130
// store key and value to memory
1131
1131
{
0 commit comments