|
221 | 221 | # LLAMA_VOCAB_PRE_TYPE_GPT3_FINNISH = 24,
|
222 | 222 | # LLAMA_VOCAB_PRE_TYPE_EXAONE = 25,
|
223 | 223 | # LLAMA_VOCAB_PRE_TYPE_CHAMELEON = 26,
|
| 224 | +# LLAMA_VOCAB_PRE_TYPE_MINERVA = 27, |
224 | 225 | # };
|
225 | 226 | LLAMA_VOCAB_PRE_TYPE_DEFAULT = 0
|
226 | 227 | LLAMA_VOCAB_PRE_TYPE_LLAMA3 = 1
|
|
249 | 250 | LLAMA_VOCAB_PRE_TYPE_GPT3_FINNISH = 24
|
250 | 251 | LLAMA_VOCAB_PRE_TYPE_EXAONE = 25
|
251 | 252 | LLAMA_VOCAB_PRE_TYPE_CHAMELEON = 26
|
| 253 | +LLAMA_VOCAB_PRE_TYPE_MINERVA = 27 |
252 | 254 |
|
253 | 255 |
|
254 | 256 | # // note: these values should be synchronized with ggml_rope
|
|
# LLAMA_ROPE_SCALING_TYPE_NONE = 0,
# LLAMA_ROPE_SCALING_TYPE_LINEAR = 1,
# LLAMA_ROPE_SCALING_TYPE_YARN = 2,
# LLAMA_ROPE_SCALING_TYPE_LONGROPE = 3,
# LLAMA_ROPE_SCALING_TYPE_MAX_VALUE = LLAMA_ROPE_SCALING_TYPE_LONGROPE,
# };
LLAMA_ROPE_SCALING_TYPE_UNSPECIFIED = -1
LLAMA_ROPE_SCALING_TYPE_NONE = 0
LLAMA_ROPE_SCALING_TYPE_LINEAR = 1
LLAMA_ROPE_SCALING_TYPE_YARN = 2
LLAMA_ROPE_SCALING_TYPE_LONGROPE = 3
# MAX_VALUE aliases the highest-valued member of the enum; with LONGROPE (3)
# present it must point at LONGROPE, otherwise a range check against
# MAX_VALUE would treat LONGROPE as out of range.
LLAMA_ROPE_SCALING_TYPE_MAX_VALUE = LLAMA_ROPE_SCALING_TYPE_LONGROPE
|
402 | 406 |
|
403 | 407 | # enum llama_pooling_type {
|
@@ -2933,6 +2937,34 @@ def llama_chat_apply_template(
|
2933 | 2937 | ...
|
2934 | 2938 |
|
2935 | 2939 |
|
# // Get list of built-in chat templates
# LLAMA_API int32_t llama_chat_builtin_templates(const char ** output, size_t len);
@ctypes_function(
    "llama_chat_builtin_templates",
    [ctypes.POINTER(ctypes.c_char_p), ctypes.c_size_t],
    ctypes.c_int32,
)
def llama_chat_builtin_templates(
    output: CtypesArray[bytes], len: Union[ctypes.c_size_t, int], /
) -> int:
    """Retrieve the names of the built-in chat templates.

    Args:
        output: Array of C string pointers that receives the template names.
        len: Length of the ``output`` array.

    Returns:
        The number of templates available, or a negative number on error.
    """
    ...
| 2966 | + |
| 2967 | + |
2936 | 2968 | # //
|
2937 | 2969 | # // Sampling API
|
2938 | 2970 | # //
|
|
0 commit comments