
Commit 6e0438d

gguf : fix resource leaks (#6061)
There are several places where a gguf context is allocated. A call to gguf_free is missing in some error paths. Also, on Linux, llama-bench was missing an fclose.
1 parent 7271077 commit 6e0438d
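
The fix is the same pattern in every file: once a gguf context has been created, each early return on an error path must free it with gguf_free before bailing out (plus an fclose for the /proc/cpuinfo handle in llama-bench). Below is a minimal sketch of that pattern, assuming the public gguf API declared in ggml.h (gguf_init_from_file, gguf_get_n_tensors, gguf_free, ggml_free); the load_model_sketch name and its error check are illustrative only, not code from this commit.

#include <cstdio>

#include "ggml.h" // gguf_init_from_file, gguf_get_n_tensors, gguf_free, ggml_free

// Illustrative sketch of the allocate/free pattern this commit enforces.
static bool load_model_sketch(const char * fname) {
    struct ggml_context * ctx_data = NULL;

    struct gguf_init_params params = {
        /*.no_alloc =*/ false,
        /*.ctx      =*/ &ctx_data,
    };

    struct gguf_context * ctx = gguf_init_from_file(fname, params);
    if (!ctx) {
        fprintf(stderr, "%s: failed to load '%s'\n", __func__, fname);
        return false;
    }

    if (gguf_get_n_tensors(ctx) == 0) {
        // error path: free both contexts before returning,
        // otherwise the allocations leak (the bug this commit fixes)
        ggml_free(ctx_data);
        gguf_free(ctx);
        return false;
    }

    // ... use the tensors ...

    // success path: same cleanup
    ggml_free(ctx_data);
    gguf_free(ctx);
    return true;
}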

4 files changed: +7, -0 lines changed


examples/gguf/gguf.cpp

Lines changed: 1 addition & 0 deletions
@@ -211,6 +211,7 @@ static bool gguf_ex_read_1(const std::string & fname) {
             for (int j = 0; j < ggml_nelements(cur); ++j) {
                 if (data[j] != 100 + i) {
                     fprintf(stderr, "%s: tensor[%d]: data[%d] = %f\n", __func__, i, j, data[j]);
+                    gguf_free(ctx);
                     return false;
                 }
             }

examples/llama-bench/llama-bench.cpp

Lines changed: 1 addition & 0 deletions
@@ -103,6 +103,7 @@ static std::string get_cpu_info() {
                 }
             }
         }
+        fclose(f);
     }
 #endif
     // TODO: other platforms
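
In llama-bench the leaked resource is a FILE handle rather than a gguf context. A minimal sketch of the corrected shape of get_cpu_info on Linux (the parsing of /proc/cpuinfo is elided, and the _sketch name is illustrative only):

#include <cstdio>
#include <string>

// Illustrative sketch: the handle opened for /proc/cpuinfo must be closed
// once parsing is done, which is what the added fclose(f) does.
static std::string get_cpu_info_sketch() {
    std::string id;
    FILE * f = fopen("/proc/cpuinfo", "r");
    if (f) {
        char buf[1024];
        while (fgets(buf, sizeof(buf), f)) {
            // ... extract the "model name" value into id ...
        }
        fclose(f); // previously missing on this path
    }
    return id;
}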

examples/llava/clip.cpp

Lines changed: 4 additions & 0 deletions
@@ -995,13 +995,15 @@ struct clip_ctx * clip_model_load(const char * fname, const int verbosity = 1) {
         if (!new_clip->ctx_data) {
             fprintf(stderr, "%s: ggml_init() failed\n", __func__);
             clip_free(new_clip);
+            gguf_free(ctx);
             return nullptr;
         }

         auto fin = std::ifstream(fname, std::ios::binary);
         if (!fin) {
             printf("cannot open model file for loading tensors\n");
             clip_free(new_clip);
+            gguf_free(ctx);
             return nullptr;
         }

@@ -1023,6 +1025,7 @@ struct clip_ctx * clip_model_load(const char * fname, const int verbosity = 1) {
             if (!fin) {
                 printf("%s: failed to seek for tensor %s\n", __func__, name);
                 clip_free(new_clip);
+                gguf_free(ctx);
                 return nullptr;
             }
             int num_bytes = ggml_nbytes(cur);
@@ -1908,6 +1911,7 @@ bool clip_model_quantize(const char * fname_inp, const char * fname_out, const i
                     break;
                 default:
                     printf("Please use an input file in f32 or f16\n");
+                    gguf_free(ctx_out);
                     return false;
             }

examples/train-text-from-scratch/train-text-from-scratch.cpp

Lines changed: 1 addition & 0 deletions
@@ -711,6 +711,7 @@ static bool load_checkpoint_file(const char * filename, struct my_llama_model *

     load_checkpoint_gguf(fctx, f_ggml_ctx, model, train);

+    gguf_free(fctx);
     return true;
 }
