Skip to content

Commit a219c70

Browse files
committed
ggml : try fix ppc64 (#0)
1 parent 9daa4eb commit a219c70

File tree

2 files changed

+3
-1
lines changed

2 files changed

+3
-1
lines changed

ggml-quants.c

+1 -1
Original file line numberDiff line numberDiff line change
@@ -11425,7 +11425,7 @@ void ggml_vec_dot_iq1_s_q8_K (int n, float * restrict s, size_t bs, const void
11425 11425

11426 11426
vector signed short qxh = (vector signed short)vec_sld(vec_splats(qh[1]), vec_splats(qh[0]), 8);
11427 11427
qh += 2;
11428 -
vector bool short vsel = vec_cmpge(qxh, (vector signed short)v0);
11428 +
vector __bool short vsel = vec_cmpge(qxh, (vector signed short)v0);
11429 11429

11430 11430
vector signed short q8ysum = vec_sel((vector signed short)vec_xor((vector unsigned short)q8ysums, vsign), q8ysums, vsel);
11431 11431

ggml.c

+2
Original file line numberDiff line numberDiff line change
@@ -1306,6 +1306,8 @@ static inline void __avx_f32cx8_store(ggml_fp16_t *x, __m256 y) {
1306 1306
#define GGML_F16_VEC_ZERO GGML_F32x4_ZERO
1307 1307
#define GGML_F16_VEC_SET1 GGML_F32x4_SET1
1308 1308
#define GGML_F16_VEC_FMA GGML_F32x4_FMA
1309 +
#define GGML_F16_VEC_ADD GGML_F32x4_ADD
1310 +
#define GGML_F16_VEC_MUL GGML_F32x4_MUL
1309 1311
#define GGML_F16_VEC_REDUCE GGML_F32x4_REDUCE
1310 1312
// Use vec_xl, not vec_ld, in case the load address is not aligned.
1311 1313
#define GGML_F16_VEC_LOAD(p, i) (i & 0x1) ? \

0 commit comments

Comments
 (0)