Skip to content

Commit

Permalink
Arm AArch64: optimized GEMV and GEMM kernels for q4_0_q8_0, and q8_0_q8_0 quantization
Browse files Browse the repository at this point in the history
  • Loading branch information
Dibakar committed Feb 28, 2024
1 parent 973053d commit b8983a0
Show file tree
Hide file tree
Showing 6 changed files with 1,413 additions and 36 deletions.
5 changes: 5 additions & 0 deletions ggml-impl.h
Original file line number Diff line number Diff line change
@@ -1,3 +1,4 @@
// SPDX-FileCopyrightText: Copyright 2024 Arm Ltd.
#pragma once

#include "ggml.h"
Expand Down Expand Up @@ -207,6 +208,10 @@ static inline ggml_fp16_t ggml_compute_fp32_to_fp16(float f) {

#endif // __ARM_NEON

#ifdef __ARM_FEATURE_SVE
#include <arm_sve.h>
#endif // __ARM_FEATURE_SVE

// precomputed f32 table for f16 (256 KB)
// defined in ggml.c, initialized in ggml_init()
extern float ggml_table_f32_f16[1 << 16];
Expand Down
Loading

0 comments on commit b8983a0

Please sign in to comment.