221
221
# LLAMA_VOCAB_PRE_TYPE_GPT3_FINNISH = 24,
222
222
# LLAMA_VOCAB_PRE_TYPE_EXAONE = 25,
223
223
# LLAMA_VOCAB_PRE_TYPE_CHAMELEON = 26,
224
+ # LLAMA_VOCAB_PRE_TYPE_MINERVA = 27,
224
225
# };
225
226
LLAMA_VOCAB_PRE_TYPE_DEFAULT = 0
226
227
LLAMA_VOCAB_PRE_TYPE_LLAMA3 = 1
249
250
LLAMA_VOCAB_PRE_TYPE_GPT3_FINNISH = 24
250
251
LLAMA_VOCAB_PRE_TYPE_EXAONE = 25
251
252
LLAMA_VOCAB_PRE_TYPE_CHAMELEON = 26
253
+ LLAMA_VOCAB_PRE_TYPE_MINERVA = 27
252
254
253
255
254
256
# // note: these values should be synchronized with ggml_rope
392
394
# LLAMA_ROPE_SCALING_TYPE_NONE = 0,
393
395
# LLAMA_ROPE_SCALING_TYPE_LINEAR = 1,
394
396
# LLAMA_ROPE_SCALING_TYPE_YARN = 2,
397
+ # LLAMA_ROPE_SCALING_TYPE_LONGROPE = 3,
395
398
# LLAMA_ROPE_SCALING_TYPE_MAX_VALUE = LLAMA_ROPE_SCALING_TYPE_LONGROPE,
# };
LLAMA_ROPE_SCALING_TYPE_UNSPECIFIED = -1
LLAMA_ROPE_SCALING_TYPE_NONE = 0
LLAMA_ROPE_SCALING_TYPE_LINEAR = 1
LLAMA_ROPE_SCALING_TYPE_YARN = 2
LLAMA_ROPE_SCALING_TYPE_LONGROPE = 3
# MAX_VALUE aliases the highest-numbered scaling type, so it has to follow
# LONGROPE (3) instead of remaining on YARN (2).
LLAMA_ROPE_SCALING_TYPE_MAX_VALUE = LLAMA_ROPE_SCALING_TYPE_LONGROPE
402
406
403
407
# enum llama_pooling_type {
@@ -2933,6 +2937,34 @@ def llama_chat_apply_template(
2933
2937
...
2934
2938
2935
2939
2940
# // Get list of built-in chat templates
# LLAMA_API int32_t llama_chat_builtin_templates(const char ** output, size_t len);
@ctypes_function(
    "llama_chat_builtin_templates",
    [ctypes.POINTER(ctypes.c_char_p), ctypes.c_size_t],
    ctypes.c_int32,
)
def llama_chat_builtin_templates(
    output: CtypesArray[bytes],
    len: Union[ctypes.c_size_t, int],
    /,
) -> int:
    """Retrieve the names of the built-in chat templates.

    Args:
        output: Output buffer that receives the template names.
        len: Length of the output buffer.

    Returns:
        The number of templates available, or a negative number on error.
    """
    ...
2966
+
2967
+
2936
2968
# //
2937
2969
# // Sampling API
2938
2970
# //
0 commit comments