ggerganov committed on
Commit
2dd8c56
·
unverified ·
1 Parent(s): 02d7878

metal : restore matrix x vector f16_f32 kernels for now

Browse files
Files changed (1) hide show
  1. ggml-metal.m +1 -3
ggml-metal.m CHANGED
@@ -937,9 +937,7 @@ void ggml_metal_graph_compute(
937
  nth1 = 1;
938
  if (ne11 * ne12 < 4) {
939
  [encoder setComputePipelineState:ctx->pipeline_mul_mat_f16_f32_1row];
940
- //} else if (ne00 >= 128 && ne01 >= 8 && ne00%4 == 0) {
941
- } else if (false) {
942
- // TODO: with ggml_mul_mat_pad this kernel no longer seems to be needed
943
  [encoder setComputePipelineState:ctx->pipeline_mul_mat_f16_f32_l4];
944
  nrows = ne11;
945
  } else {
 
937
  nth1 = 1;
938
  if (ne11 * ne12 < 4) {
939
  [encoder setComputePipelineState:ctx->pipeline_mul_mat_f16_f32_1row];
940
+ } else if (ne00 >= 128 && ne01 >= 8 && ne00%4 == 0) {
 
 
941
  [encoder setComputePipelineState:ctx->pipeline_mul_mat_f16_f32_l4];
942
  nrows = ne11;
943
  } else {