llama : rename n_ctx -> cache.size, less confusing (#0)

2024-12-25 02:44:36 +00:00 · 2024-05-23 12:38:18 +03:00 · 2024-05-23 12:38:18 +03:00 · a61a94e543
commit a61a94e543
parent 152da28ae5
1 changed files with 5 additions and 6 deletions
--- a/llama.cpp
+++ b/llama.cpp
@ -2475,7 +2475,6 @@ static bool llama_kv_cache_init(
 static bool llama_kv_cache_find_slot(
           struct llama_kv_cache & cache,
        const struct llama_batch & batch) {
-    const uint32_t n_ctx    = cache.size;
    const uint32_t n_tokens = batch.n_tokens;

    if (cache.recurrent) {
@ -2526,16 +2525,16 @@ static bool llama_kv_cache_find_slot(
    }
    // otherwise, one cell per token.

-    if (n_tokens > n_ctx) {
-        LLAMA_LOG_ERROR("%s: n_tokens=%d > n_ctx=%d\n", __func__, n_tokens, n_ctx);
+    if (n_tokens > cache.size) {
+        LLAMA_LOG_ERROR("%s: n_tokens=%d > cache.size=%d\n", __func__, n_tokens, cache.size);
        return false;
    }

    uint32_t n_tested = 0;

    while (true) {
-        if (cache.head + n_tokens > n_ctx) {
-            n_tested += n_ctx - cache.head;
+        if (cache.head + n_tokens > cache.size) {
+            n_tested += cache.size - cache.head;
            cache.head = 0;
            continue;
        }
@ -2554,7 +2553,7 @@ static bool llama_kv_cache_find_slot(
            break;
        }

-        if (n_tested >= n_ctx) {
+        if (n_tested >= cache.size) {
            //LLAMA_LOG_ERROR("%s: failed to find a slot for %d tokens\n", __func__, n_tokens);
            return false;
        }