Skip to content

Commit 00c361f

Browse files
authored
fix: llama arch implementation (#17665)
1 parent ec18edf commit 00c361f

File tree

1 file changed

+2
-0
lines changed

1 file changed

+2
-0
lines changed

src/llama-model.cpp

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -626,6 +626,8 @@ void llama_model::load_hparams(llama_model_loader & ml) {
626 | 626 |   |     switch (arch) {
627 | 627 |   |         case LLM_ARCH_LLAMA:
628 | 628 |   |             {
    | 629 | + |                 ml.get_key(LLM_KV_ATTENTION_LAYERNORM_RMS_EPS, hparams.f_norm_rms_eps);
    | 630 | + |
629 | 631 |   |                 if (hparams.n_expert == 8) {
630 | 632 |   |                     switch (hparams.n_layer) {
631 | 633 |   |                         case 32: type = LLM_TYPE_8x7B; break;

0 commit comments

Comments
 (0)