llama : fix t5 segfault

2026-05-10 02:54:06 +00:00 · 2024-07-17 15:36:56 -04:00
parent 1fb5d4fdee
commit 1725de768e
1 changed files with 4 additions and 2 deletions
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -15377,11 +15377,13 @@ static int llama_encode_internal(

        ggml_backend_tensor_get_async(backend_embd, embd, embd_out, 0, n_tokens*n_embd*sizeof(float));

+        GGML_ASSERT(!ubatch.equal_seqs); // TODO: use batch.n_seqs instead of failing
+
        // remember the sequence ids used during the encoding - needed for cross attention later
        lctx.seq_ids_enc.resize(n_tokens);
        for (uint32_t i = 0; i < n_tokens; i++) {
-            for (int s = 0; s < batch.n_seq_id[i]; s++) {
-                llama_seq_id seq_id = batch.seq_id[i][s];
+            for (int s = 0; s < ubatch.n_seq_id[i]; s++) {
+                llama_seq_id seq_id = ubatch.seq_id[i][s];
                lctx.seq_ids_enc[i].insert(seq_id);
            }
        }