llama : fix order of pre-tokenizers

ggml-org · ggerganov · Jul 20, 2024 · Jul 18, 2024 · Jul 19, 2024 · Jul 19, 2024
commit 447c08092dac9ced3058e5fcf1282c1ad8153e27
diff --git a/src/llama.cpp b/src/llama.cpp
@@ -5517,14 +5517,14 @@ static void llm_load_vocab(
                 tokenizer_pre == "viking") {
                 vocab.type_pre = LLAMA_VOCAB_PRE_TYPE_VIKING;
                 vocab.tokenizer_clean_spaces = false;
+            } else if (
+                tokenizer_pre == "jais") {
+                vocab.type_pre = LLAMA_VOCAB_PRE_TYPE_JAIS;
             } else if (
                 tokenizer_pre == "tekken") {
                 vocab.type_pre = LLAMA_VOCAB_PRE_TYPE_TEKKEN;
                 vocab.tokenizer_ignore_merges = true;
                 vocab.tokenizer_add_bos = true;
-            } else if (
-                tokenizer_pre == "jais") {
-                vocab.type_pre = LLAMA_VOCAB_PRE_TYPE_JAIS;
             } else {
                 throw std::runtime_error(format("unknown pre-tokenizer type: '%s'", tokenizer_pre.c_str()));
             }