Skip to content

Commit 1888c1f

Browse files
committed
ggml : move ggml_flash_attn_ext_get_prec to ggml-impl.h
1 parent: bc143ec · commit: 1888c1f

File tree

3 files changed

+4
-3
lines changed

3 files changed

+4
-3
lines changed

ggml/include/ggml.h

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1746,9 +1746,6 @@ extern "C" {
1746 1746
struct ggml_tensor * a,
1747 1747
enum ggml_prec prec);
1748 1748

1749 -
GGML_API enum ggml_prec ggml_flash_attn_ext_get_prec(
1750 -
const struct ggml_tensor * a);
1751 -
1752 1749
// TODO: needs to be adapted to ggml_flash_attn_ext
1753 1750
GGML_API struct ggml_tensor * ggml_flash_attn_back(
1754 1751
struct ggml_context * ctx,

ggml/src/ggml-cuda/fattn.cu

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,8 @@
7 7
#include "fattn-wmma-f16.cuh"
8 8
#include "fattn.cuh"
9 9

10 +
#include "ggml-impl.h"
11 +
10 12
#include <cstdint>
11 13

12 14
static void ggml_cuda_flash_attn_ext_wmma_f16(ggml_backend_cuda_context & ctx, ggml_tensor * dst) {

ggml/src/ggml-impl.h

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -114,6 +114,8 @@ static void ggml_set_op_params_f32(struct ggml_tensor * tensor, uint32_t i, floa
114 114
((float *)(tensor->op_params))[i] = value;
115 115
}
116 116

117 +
static enum ggml_prec ggml_flash_attn_ext_get_prec(const struct ggml_tensor * a);
118 +
117 119
struct ggml_map_custom1_op_params {
118 120
ggml_custom1_op_t fun;
119 121
int n_tasks;

0 commit comments

Comments
 (0)