1 file changed: +2 -0 lines changed
Original file line number | Diff line number | Diff line change
@@ -181,6 +181,7 @@ class llama_token_data_array(Structure):
181
181
182
182
# // Keep the booleans together to avoid misalignment during copy-by-value.
183
183
# bool low_vram; // if true, reduce VRAM usage at the cost of performance
184
+ # bool mul_mat_q; // if true, use experimental mul_mat_q kernels
184
185
# bool f16_kv; // use fp16 for KV cache
185
186
# bool logits_all; // the llama_eval() call computes all logits, not just the last one
186
187
# bool vocab_only; // only load the vocabulary, no weights
@@ -203,6 +204,7 @@ class llama_context_params(Structure):
203
204
("progress_callback" , llama_progress_callback ),
204
205
("progress_callback_user_data" , c_void_p ),
205
206
("low_vram" , c_bool ),
207
+ ("mul_mat_q" , c_bool ),
206
208
("f16_kv" , c_bool ),
207
209
("logits_all" , c_bool ),
208
210
("vocab_only" , c_bool ),
You can’t perform that action at this time.
0 commit comments