File tree: 3 files changed, +4 -13 lines changed
Original file line number Diff line number Diff line change
4
4
5
5
// GGML internal header
6
6
7
+ #include <assert.h>
7
8
#include <stddef.h>
8
9
#include <stdbool.h>
9
10
#include <string.h> // memcpy
Original file line number Diff line number Diff line change
1
1
#pragma once
2
2
3
- // This is a private API for quantization and dequantization
4
- // Should not be used directly, use ggml.h instead
3
+ #include "ggml-impl.h"
5
4
6
- #include "ggml.h"
5
+ // GGML internal header
7
6
8
7
#include <stdint.h>
9
- #include <assert.h>
10
8
#include <stddef.h>
11
9
12
- #ifndef static_assert
13
- #if defined(__STDC_VERSION__ ) && (__STDC_VERSION__ >= 201100L )
14
- #define static_assert (cond , msg ) _Static_assert(cond, msg)
15
- #else
16
- #define static_assert (cond , msg ) struct global_scope_noop_trick
17
- #endif
18
- #endif
19
-
20
10
#define QK4_0 32
21
11
typedef struct {
22
12
ggml_fp16_t d ; // delta
Original file line number Diff line number Diff line change
@@ -1467,7 +1467,7 @@ static int32_t llama_kv_cache_cell_max(const struct llama_kv_cache & cache) {
1467
1467
}
1468
1468
1469
1469
static void llama_kv_cache_clear (struct llama_kv_cache & cache) {
1470
- for (int32_t i = 0 ; i < cache.size ; ++i) {
1470
+ for (int32_t i = 0 ; i < ( int32_t ) cache.size ; ++i) {
1471
1471
cache.cells [i].pos = -1 ;
1472
1472
cache.cells [i].seq_id .clear ();
1473
1473
}
You can’t perform that action at this time.
0 commit comments