mirror of
https://github.com/turboderp-org/exui.git
synced 2026-04-20 14:29:52 +00:00
Merge pull request #21 from SinanAkkoyun/speculative-decoding-fix
Set ropescale of draft model
This commit is contained in:
8
.gitignore
vendored
Normal file
8
.gitignore
vendored
Normal file
@@ -0,0 +1,8 @@
|
||||
*.egg-info/
|
||||
build/
|
||||
|
||||
*.pyc
|
||||
__pycache__/
|
||||
.idea
|
||||
venv
|
||||
dist
|
||||
@@ -228,6 +228,7 @@ class ModelContainer:
|
||||
self.draft_config.max_seq_len = self.config.max_seq_len
|
||||
|
||||
self.draft_config.scale_alpha_value = alpha
|
||||
self.draft_config.scale_pos_emb = model["rope_scale"]
|
||||
self.draft_config.max_input_len = model["chunk_size"]
|
||||
self.draft_config.max_attn_size = model["chunk_size"] ** 2
|
||||
|
||||
|
||||
Reference in New Issue
Block a user