File tree Expand file tree Collapse file tree 3 files changed +4
-0
lines changed Expand file tree Collapse file tree 3 files changed +4
-0
lines changed Original file line number Diff line number Diff line change @@ -34,6 +34,7 @@ models/*
34
34
/perplexity
35
35
/embedding
36
36
/train-text-from-scratch
37
+ /simple
37
38
/benchmark-matmult
38
39
/vdot
39
40
/server
Original file line number Diff line number Diff line change 38
38
add_subdirectory (benchmark)
39
39
add_subdirectory (baby-llama)
40
40
add_subdirectory (train-text-from-scratch)
41
+ add_subdirectory (simple)
41
42
if (LLAMA_METAL)
42
43
add_subdirectory (metal)
43
44
endif ()
Original file line number Diff line number Diff line change @@ -886,6 +886,7 @@ static bool kv_cache_init(
886
886
const int64_t n_elements = n_embd*n_mem;
887
887
888
888
cache.buf .resize (2u *n_elements*ggml_type_size (wtype) + 2u *MB);
889
+ cache.n = 0 ;
889
890
890
891
struct ggml_init_params params;
891
892
params.mem_size = cache.buf .size ;
@@ -904,6 +905,7 @@ static bool kv_cache_init(
904
905
ggml_set_name (cache.k , " cache_k" );
905
906
ggml_set_name (cache.v , " cache_v" );
906
907
908
+ (void ) n_gpu_layers;
907
909
#ifdef GGML_USE_CUBLAS
908
910
if (n_gpu_layers > n_layer + 1 ) {
909
911
ggml_cuda_assign_buffers_no_scratch (cache.v );
You can’t perform that action at this time.
0 commit comments