llama : do not allocate KV cache for "vocab_only == true" (#682)

Fixes sanitizer CI
pull/706/head master-81040f1
Stephan Walter 1 year ago committed by GitHub
parent c4f89d8d73
commit 81040f10aa
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

@@ -1608,7 +1608,7 @@ struct llama_context * llama_init_from_file(
}
// reserve memory for context buffers
-{
+if (!params.vocab_only) {
if (!kv_cache_init(ctx->model.hparams, ctx->model.kv_self, memory_type, ctx->model.hparams.n_ctx)) {
fprintf(stderr, "%s: kv_cache_init() failed for self-attention cache\n", __func__);
llama_free(ctx);

Loading…
Cancel
Save