Update convert_hf_to_gguf.py
Co-authored-by: compilade <git@compilade.net>
This commit is contained in:
parent
184a4c676f
commit
349426546b
1 changed file with 1 addition and 1 deletion
|
@@ -2744,7 +2744,7 @@ class MambaModel(Model):
|
||||||
rms_norm_eps = self.find_hparam(["layer_norm_epsilon", "rms_norm_eps"], optional=True) or 1e-5
|
rms_norm_eps = self.find_hparam(["layer_norm_epsilon", "rms_norm_eps"], optional=True) or 1e-5
|
||||||
use_b_dt_norm = False
|
use_b_dt_norm = False
|
||||||
# For falconmamba we do apply RMS norm on B / DT and C layers
|
# For falconmamba we do apply RMS norm on B / DT and C layers
|
||||||
if self.find_hparam(["model_type"]) in ["falcon_mamba"]:
|
if self.find_hparam(["model_type"], optional=True) in ("falcon_mamba",):
|
||||||
use_b_dt_norm = True
|
use_b_dt_norm = True
|
||||||
# Fail early for models which don't have a block expansion factor of 2
|
# Fail early for models which don't have a block expansion factor of 2
|
||||||
assert d_inner == 2 * d_model
|
assert d_inner == 2 * d_model
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue