@@ -1408,11 +1408,11 @@ static int ggml_metal_encode_node(struct ggml_metal_encode_context * ctx_enc, in
1408
1408
// src1 is a row
1409
1409
GGML_ASSERT (ne11 == 1 );
1410
1410
1411
- pipeline = ggml_metal_op_bin_get_pipeline (ctx, dst ->op , n_fuse, true );
1411
+ pipeline = ggml_metal_op_bin_get_pipeline (node ->op , ctx , n_fuse, true );
1412
1412
1413
1413
bcast_row = true ;
1414
1414
} else {
1415
- pipeline = ggml_metal_op_bin_get_pipeline (ctx, dst ->op , n_fuse, false );
1415
+ pipeline = ggml_metal_op_bin_get_pipeline (node ->op , ctx , n_fuse, false );
1416
1416
}
1417
1417
1418
1418
if (n_fuse > 1 ) {
@@ -1602,7 +1602,7 @@ static int ggml_metal_encode_node(struct ggml_metal_encode_context * ctx_enc, in
1602
1602
};
1603
1603
1604
1604
// const id<MTLComputePipelineState> pipeline = ctx->pipelines[GGML_METAL_PIPELINE_TYPE_ADD].pipeline;
1605
- const id <MTLComputePipelineState > pipeline = ggml_metal_op_bin_get_pipeline (ctx, GGML_OP_ADD , 1 , false );
1605
+ const id <MTLComputePipelineState > pipeline = ggml_metal_op_bin_get_pipeline (GGML_OP_ADD, ctx , 1 , false );
1606
1606
1607
1607
[encoder setComputePipelineState: pipeline];
1608
1608
[encoder setBytes: &args length: sizeof (args) atIndex: 0 ];
@@ -3517,7 +3517,7 @@ static int ggml_metal_encode_node(struct ggml_metal_encode_context * ctx_enc, in
3517
3517
}
3518
3518
}
3519
3519
3520
- const id <MTLComputePipelineState > pipeline = ggml_metal_op_rms_norm_get_pipeline (ctx, node , n_fuse);
3520
+ const id <MTLComputePipelineState > pipeline = ggml_metal_op_rms_norm_get_pipeline (node, ctx , n_fuse);
3521
3521
3522
3522
int nth = 32 ; // SIMD width
3523
3523
@@ -4257,7 +4257,7 @@ static int ggml_metal_encode_node(struct ggml_metal_encode_context * ctx_enc, in
4257
4257
/* .logit_softcap =*/ logit_softcap,
4258
4258
};
4259
4259
4260
- id <MTLComputePipelineState > pipeline = ggml_metal_op_flash_attn_ext_get_pipeline (ctx, node , has_mask, has_sinks, has_bias, has_scap, nsg);
4260
+ id <MTLComputePipelineState > pipeline = ggml_metal_op_flash_attn_ext_get_pipeline (node, ctx , has_mask, has_sinks, has_bias, has_scap, nsg);
4261
4261
4262
4262
[encoder setComputePipelineState: pipeline];
4263
4263
[encoder setBytes: &args length: sizeof (args) atIndex: 0 ];
@@ -4372,7 +4372,7 @@ static int ggml_metal_encode_node(struct ggml_metal_encode_context * ctx_enc, in
4372
4372
/* .logit_softcap =*/ logit_softcap,
4373
4373
};
4374
4374
4375
- id <MTLComputePipelineState > pipeline = ggml_metal_op_flash_attn_ext_vec_get_pipeline (ctx, node , has_mask, has_sinks, has_bias, has_scap, nsg, nwg);
4375
+ id <MTLComputePipelineState > pipeline = ggml_metal_op_flash_attn_ext_vec_get_pipeline (node, ctx , has_mask, has_sinks, has_bias, has_scap, nsg, nwg);
4376
4376
4377
4377
GGML_ASSERT (nsg*32 <= (int ) pipeline.maxTotalThreadsPerThreadgroup );
4378
4378
@@ -4426,7 +4426,7 @@ static int ggml_metal_encode_node(struct ggml_metal_encode_context * ctx_enc, in
4426
4426
nrows,
4427
4427
};
4428
4428
4429
- id <MTLComputePipelineState > pipeline0 = ggml_metal_op_flash_attn_ext_vec_reduce_get_pipeline (ctx, node , ne20, nwg);
4429
+ id <MTLComputePipelineState > pipeline0 = ggml_metal_op_flash_attn_ext_vec_reduce_get_pipeline (node, ctx , ne20, nwg);
4430
4430
4431
4431
[encoder setComputePipelineState: pipeline0];
4432
4432
[encoder setBytes: &args0 length: sizeof (args0) atIndex: 0 ];
0 commit comments