Skip to content

Commit 186626d

Browse files
committed
Update llama.cpp
1 parent 47de3ab commit 186626d

File tree

2 files changed

+3
-1
lines changed

2 files changed

+3
-1
lines changed

llama_cpp/llama_cpp.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -294,13 +294,15 @@ class llama_context_params(Structure):
294294
# enum llama_ftype ftype; // quantize to this llama_ftype
295295
# bool allow_requantize; // allow quantizing non-f32/f16 tensors
296296
# bool quantize_output_tensor; // quantize output.weight
297+
# bool only_copy; // only copy tensors - ftype, allow_requantize and quantize_output_tensor are ignored
297298
# } llama_model_quantize_params;
298299
class llama_model_quantize_params(Structure):
299300
_fields_ = [
300301
("nthread", c_int),
301302
("ftype", c_int),
302303
("allow_requantize", c_bool),
303304
("quantize_output_tensor", c_bool),
305+
("only_copy", c_bool),
304306
]
305307

306308

vendor/llama.cpp

0 commit comments

Comments
 (0)