Model: Read scale_pos_emb from config
In newer versions of exllamav2, this value is read from the model's config.json. This value still defaults to 1.0 anyway.

Signed-off-by: kingbri <bdashore3@proton.me>
This commit is contained in:
parent
e70729b0c0
commit
ec929728d9
2 changed files with 4 additions and 1 deletion
|
|
@@ -60,6 +60,7 @@ model:
|
|||
# Rope scale (default: 1.0)
|
||||
# Same thing as compress_pos_emb
|
||||
# Only use if your model was trained on long context with rope (check config.json)
|
||||
# Leave blank to pull the value from the model
|
||||
rope_scale: 1.0
|
||||
|
||||
# Rope alpha (default: 1.0)
|
||||
|
|
|
|||
4
model.py
4
model.py
|
|
@@ -126,7 +126,9 @@ class ModelContainer:
|
|||
self.config.max_seq_len = target_max_seq_len
|
||||
|
||||
# Set the rope scale
|
||||
self.config.scale_pos_emb = unwrap(kwargs.get("rope_scale"), 1.0)
|
||||
self.config.scale_pos_emb = unwrap(
|
||||
kwargs.get("rope_scale"), self.config.scale_pos_emb
|
||||
)
|
||||
|
||||
# Automatically calculate rope alpha
|
||||
self.config.scale_alpha_value = unwrap(
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue