use right type, and define GGML_F32_VEC_ZERO.

This commit is contained in:
Julia Longtin 2024-03-13 19:23:53 +00:00
parent 25095cac23
commit c08ddb831f

3
ggml.c
View file

@ -953,7 +953,7 @@ ggml_type_traits_t ggml_internal_get_type_traits(enum ggml_type type) {
#define GGML_F32_ARR (GGML_F32_STEP/GGML_F32_EPR) #define GGML_F32_ARR (GGML_F32_STEP/GGML_F32_EPR)
// our vector. 128*32=512 // our vector. 128*32=512
typedef float32_t float32x16_t __attribute__((vector_size (128))); typedef float float32x16_t __attribute__((vector_size (128)));
#define GGML_F32x16 float32x16_t #define GGML_F32x16 float32x16_t
#define GGML_F32x16_ZERO \ #define GGML_F32x16_ZERO \
{ \ { \
@ -968,6 +968,7 @@ typedef float32_t float32x16_t __attribute__((vector_size (128)));
//vdupq_n_f32(0.0f) //vdupq_n_f32(0.0f)
#define GGML_F32_VEC GGML_F32x16 #define GGML_F32_VEC GGML_F32x16
#define GGML_F32_VEC_ZERO GGML_F32x16_ZERO
#elif defined(__ARM_NEON) && defined(__ARM_FEATURE_FMA) #elif defined(__ARM_NEON) && defined(__ARM_FEATURE_FMA)