From d05c13b3b91a867658732905f9ca7ce157b413ca Mon Sep 17 00:00:00 2001
From: Jared Van Bortel <jared@nomic.ai>
Date: Sat, 23 Mar 2024 14:03:16 -0400
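Subject: [PATCH] llama : fix BPE LF token on MSVC

Spell the BPE linefeed token U+010A as explicit UTF-8 bytes ("\xC4\x8A")
instead of the universal character name "\u010A". MSVC converts \u escapes
in narrow string literals to the execution character set, which is not
UTF-8 unless /utf-8 (or /execution-charset:utf-8) is passed, so the literal
may not tokenize to the newline token when built with MSVC.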
---
 llama.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/llama.cpp b/llama.cpp
index 11620043e..71d1b0fbc 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -3971,7 +3971,7 @@ static void llm_load_vocab(
     } else if (vocab.type == LLAMA_VOCAB_TYPE_WPM) {
         vocab.linefeed_id = vocab.special_pad_id;
     } else {
-        const std::vector<int> ids = llama_tokenize_internal(vocab, "\u010A", false);
+        const std::vector<int> ids = llama_tokenize_internal(vocab, "\xC4\x8A", false); // U+010A
         GGML_ASSERT(!ids.empty() && "model vocab missing newline token");
         vocab.linefeed_id = ids[0];
     }