diff --git a/main.cpp b/main.cpp index ca0fca8b36455..85fb2c900d354 100644 --- a/main.cpp +++ b/main.cpp @@ -246,7 +246,7 @@ bool llama_model_load(const std::string & fname, llama_model & model, gpt_vocab const int n_embd = hparams.n_embd; const int n_layer = hparams.n_layer; const int n_ctx = hparams.n_ctx; - const int n_vocab = hparams.n_vocab; + const int n_vocab = hparams.n_vocab + 1; model.layers.resize(n_layer);