File tree Expand file tree Collapse file tree 2 files changed +3
-3
lines changed
Filter options
Expand file tree Collapse file tree 2 files changed +3
-3
lines changed
Original file line number Diff line number Diff line change @@ -405,7 +405,7 @@ class llama_model_params(Structure):
405
405
406
406
# // Keep the booleans together to avoid misalignment during copy-by-value.
407
407
# bool mul_mat_q; // if true, use experimental mul_mat_q kernels (DEPRECATED - always true)
408
- # bool logits_all; // the llama_eval() call computes all logits, not just the last one
408
+ # bool logits_all; // the llama_eval() call computes all logits, not just the last one (DEPRECATED - set llama_batch.logits instead)
409
409
# bool embedding; // embedding mode only
410
410
# bool offload_kqv; // whether to offload the KQV ops (including the KV cache) to GPU
411
411
# };
@@ -430,7 +430,7 @@ class llama_context_params(Structure):
430
430
type_v (int): data type for V cache
431
431
mul_mat_q (bool): if true, use experimental mul_mat_q kernels (DEPRECATED - always true)
432
432
f16_kv (bool): use fp16 for KV cache, fp32 otherwise
433
- logits_all (bool): the llama_eval() call computes all logits, not just the last one
433
+ logits_all (bool): the llama_eval() call computes all logits, not just the last one (DEPRECATED - set llama_batch.logits instead)
434
434
embedding (bool): embedding mode only"""
435
435
_fields_ = [
436
436
("seed" , c_uint32 ),
You can’t perform that action at this time.
0 commit comments