convert.py : export rope freq_base when converting CodeLlama from an HF model (#2773)

This commit is contained in:
slaren 2023-08-25 14:08:53 +02:00 committed by GitHub
parent 29674ab4e8
commit 12e2e33a97
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@@ -167,6 +167,7 @@ class Params:
n_head = config["num_attention_heads"]
n_head_kv = config["num_key_value_heads"] if "num_key_value_heads" in config else n_head
f_norm_eps = config["rms_norm_eps"]
f_rope_freq_base = config["rope_theta"] if "rope_theta" in config else None
n_mult = Params.find_n_mult(n_ff, n_embd)
@@ -188,6 +189,7 @@ class Params:
n_head = n_head,
n_head_kv = n_head_kv,
f_norm_eps = f_norm_eps,
f_rope_freq_base = f_rope_freq_base,
)
# LLaMA v2 70B params.json