2 files changed: +5 -1 lines changed
@@ -526,6 +526,7 @@ class llama_context_params(Structure):
 #     bool quantize_output_tensor; // quantize output.weight
 #     bool only_copy; // only copy tensors - ftype, allow_requantize and quantize_output_tensor are ignored
 #     bool pure; // disable k-quant mixtures and quantize all tensors to the same type
+#     void * imatrix; // pointer to importance matrix data
 # } llama_model_quantize_params;
 class llama_model_quantize_params(Structure):
     """Parameters for llama_model_quantize
@@ -537,6 +538,7 @@ class llama_model_quantize_params(Structure):
         quantize_output_tensor (bool): quantize output.weight
         only_copy (bool): only copy tensors - ftype, allow_requantize and quantize_output_tensor are ignored
         pure (bool): disable k-quant mixtures and quantize all tensors to the same type
+        imatrix (ctypes.c_void_p): pointer to importance matrix data
     """
 
     _fields_ = [
@@ -545,6 +547,8 @@ class llama_model_quantize_params(Structure):
         ("allow_requantize", c_bool),
         ("quantize_output_tensor", c_bool),
         ("only_copy", c_bool),
+        ("pure", c_bool),
+        ("imatrix", c_void_p),
     ]
 
 
You can’t perform that action at this time.
0 commit comments