File tree Expand file tree Collapse file tree 2 files changed +2
-7
lines changed Expand file tree Collapse file tree 2 files changed +2
-7
lines changed Original file line number Diff line number Diff line change @@ -1040,12 +1040,7 @@ void ggml_metal_graph_compute(
1040
1040
const float scale = ((float *) dst->op_params )[0 ];
1041
1041
1042
1042
[encoder setBuffer: id_src0 offset: offs_src0 atIndex: 0 ];
1043
- if (id_src1) {
1044
- [encoder setBuffer: id_src1 offset: offs_src1 atIndex: 1 ];
1045
- } else {
1046
- [encoder setBuffer: nil offset: 0 atIndex: 1 ];
1047
- }
1048
-
1043
+ [encoder setBuffer: id_src1 offset: offs_src1 atIndex: 1 ];
1049
1044
[encoder setBuffer: id_dst offset: offs_dst atIndex: 2 ];
1050
1045
[encoder setBytes: &ne00 length: sizeof (ne00) atIndex: 3 ];
1051
1046
[encoder setBytes: &ne01 length: sizeof (ne01) atIndex: 4 ];
Original file line number Diff line number Diff line change @@ -3705,8 +3705,8 @@ static struct ggml_tensor * llm_build_kqv(
3705
3705
struct ggml_tensor * kq = ggml_mul_mat (ctx, k, q);
3706
3706
cb (kq, " kq" , il);
3707
3707
3708
- // TODO: !!!!!!!!!
3709
3708
if (max_alibi_bias > 0 .0f ) {
3709
+ // temporary branch until we figure out how to handle ggml_alibi through ggml_add
3710
3710
kq = ggml_scale (ctx, kq, kq_scale);
3711
3711
cb (kq, " kq_scaled" , il);
3712
3712
You can’t perform that action at this time.
0 commit comments