diff --git a/convert.py b/convert.py index e38ee5315af30e..980e6fc720aa63 100755 --- a/convert.py +++ b/convert.py @@ -348,7 +348,7 @@ def load_torch_params(model: LazyModel, config_path: Path) -> "Params": f_rope_freq_base = 1e6 return Params( - n_vocab=config.get("vocab_size", model["tok_embeddings.weight"].shape[0]), + n_vocab=model["tok_embeddings.weight"].shape[0], n_embd=config["dim"], n_layer=config["n_layers"], n_ctx=n_ctx,