Skip to content

Commit

Permalink
Disable BLAS branch in mul_mat for Q4_0 and Q4_1 - there seems to be a bug
Browse files (browse the repository at this point in the history)
  • Loading branch information
ggerganov committed Mar 24, 2023
1 parent 04c6f5e commit b3f460e
Showing 1 changed file with 5 additions and 5 deletions.
10 changes: 5 additions & 5 deletions ggml.c
Original file line number | Diff line number | Diff line change
Expand Up @@ -5858,11 +5858,11 @@ static bool ggml_compute_forward_mul_mat_use_blas(
if (ggml_is_contiguous(src0) &&
ggml_is_contiguous(src1) && ((ne0 >= 32 && ne1 >= 32 && ne10 >= 32))) {

//// disable BLAS for Q4_0 and Q4_1
//// looks like there is no benefit and we only waste a lot of memory
//if (src0->type == GGML_TYPE_Q4_0 || src0->type == GGML_TYPE_Q4_1) {
// return false;
//}
// disable BLAS for Q4_0 and Q4_1
// there is a bug that has to be fixed before enabling
if (src0->type == GGML_TYPE_Q4_0 || src0->type == GGML_TYPE_Q4_1) {
return false;
}

//printf("BLAS: %d %d %d %d %d\n", ne0, ne1, ne10, ne00, ne01);
return true;
Expand Down

0 comments on commit b3f460e

Please sign in to comment.