Skip to content

Commit 51dbcf2

Browse files
committed
Bugfix: wrong signature for quantize function
1 parent 8279fb7 commit 51dbcf2

File tree

1 file changed

+3
-3
lines changed

1 file changed

+3
-3
lines changed

llama_cpp/llama_cpp.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -125,12 +125,12 @@ def llama_free(ctx: llama_context_p):
 # TODO: not great API - very likely to change
 # Returns 0 on success
 def llama_model_quantize(
-    fname_inp: bytes, fname_out: bytes, itype: c_int, qk: c_int
+    fname_inp: bytes, fname_out: bytes, itype: c_int
 ) -> c_int:
-    return _lib.llama_model_quantize(fname_inp, fname_out, itype, qk)
+    return _lib.llama_model_quantize(fname_inp, fname_out, itype)
 
 
-_lib.llama_model_quantize.argtypes = [c_char_p, c_char_p, c_int, c_int]
+_lib.llama_model_quantize.argtypes = [c_char_p, c_char_p, c_int]
 _lib.llama_model_quantize.restype = c_int
 
 
 # Returns the KV cache that will contain the context for the

0 commit comments

Comments
 (0)