ggml : minor

2023-03-28 20:10:14 +03:00 · 2023-03-28 20:10:14 +03:00 · a0c2401359
commit a0c2401359
parent 3a6b10d22d
1 changed files with 6 additions and 8 deletions
--- a/ggml.c
+++ b/ggml.c
@@ -6218,6 +6218,7 @@ static void ggml_compute_forward_mul_mat_q_f32(
    const enum ggml_type type = src0->type;
    quantize_row_q_t const quantize_row_q = quantize_fns[type].quantize_row_q;
    vec_dot_q_t      const vec_dot_q      = quantize_fns[type].vec_dot_q;
    // we don't support permuted src0 or src1
    GGML_ASSERT(nb00 == (int) GGML_TYPE_SIZE[type]);
    GGML_ASSERT(nb10 == sizeof(float));
@@ -8952,8 +8953,7 @@ void ggml_graph_compute(struct ggml_context * ctx, struct ggml_cgraph * cgraph)
                        size_t cur = 0;
-                        if (node->src0->type == GGML_TYPE_F16 &&
+                        if (node->src0->type == GGML_TYPE_F16 && node->src1->type == GGML_TYPE_F32) {
-                                node->src1->type == GGML_TYPE_F32) {
 #if defined(GGML_USE_ACCELERATE) || defined(GGML_USE_OPENBLAS)
                            if (ggml_compute_forward_mul_mat_use_blas(node->src0, node->src1, node)) {
                                node->n_tasks = 1; // TODO: this actually is doing nothing
@@ -8968,11 +8968,9 @@ void ggml_graph_compute(struct ggml_context * ctx, struct ggml_cgraph * cgraph)
 #else
                            cur = GGML_TYPE_SIZE[GGML_TYPE_F16]*ggml_nelements(node->src1);
 #endif
-                        } else if (node->src0->type == GGML_TYPE_F32 &&
+                        } else if (node->src0->type == GGML_TYPE_F32 && node->src1->type == GGML_TYPE_F32) {
-                                node->src1->type == GGML_TYPE_F32) {
                            cur = 0;
-                        } else if (quantize_fns[node->src0->type].vec_dot_q &&
+                        } else if (quantize_fns[node->src0->type].vec_dot_q && node->src1->type == GGML_TYPE_F32) {
-                                node->src1->type == GGML_TYPE_F32) {
 #if defined(GGML_USE_ACCELERATE) || defined(GGML_USE_OPENBLAS)
                            if (ggml_compute_forward_mul_mat_use_blas(node->src0, node->src1, node)) {
                                node->n_tasks = 1;