Spaces:
Running
Running
metal : restore matrix x vector f16_f32 kernels for now
Browse files- ggml-metal.m +1 -3
ggml-metal.m
CHANGED
|
@@ -937,9 +937,7 @@ void ggml_metal_graph_compute(
|
|
| 937 |
nth1 = 1;
|
| 938 |
if (ne11 * ne12 < 4) {
|
| 939 |
[encoder setComputePipelineState:ctx->pipeline_mul_mat_f16_f32_1row];
|
| 940 |
-
|
| 941 |
-
} else if (false) {
|
| 942 |
-
// TODO: with ggml_mul_mat_pad this kernel no longer seems to be needed
|
| 943 |
[encoder setComputePipelineState:ctx->pipeline_mul_mat_f16_f32_l4];
|
| 944 |
nrows = ne11;
|
| 945 |
} else {
|
|
|
|
| 937 |
nth1 = 1;
|
| 938 |
if (ne11 * ne12 < 4) {
|
| 939 |
[encoder setComputePipelineState:ctx->pipeline_mul_mat_f16_f32_1row];
|
| 940 |
+
} else if (ne00 >= 128 && ne01 >= 8 && ne00%4 == 0) {
|
|
|
|
|
|
|
| 941 |
[encoder setComputePipelineState:ctx->pipeline_mul_mat_f16_f32_l4];
|
| 942 |
nrows = ne11;
|
| 943 |
} else {
|