Merge pull request #21 from SinanAkkoyun/speculative-decoding-fix

Set RoPE scale of draft model
This commit is contained in:
turboderp
2023-12-07 22:26:47 +01:00
committed by GitHub
2 changed files with 9 additions and 0 deletions

8
.gitignore vendored Normal file
View File

@@ -0,0 +1,8 @@
*.egg-info/
build/
*.pyc
__pycache__/
.idea
venv
dist

View File

@@ -228,6 +228,7 @@ class ModelContainer:
self.draft_config.max_seq_len = self.config.max_seq_len
self.draft_config.scale_alpha_value = alpha
self.draft_config.scale_pos_emb = model["rope_scale"]
self.draft_config.max_input_len = model["chunk_size"]
self.draft_config.max_attn_size = model["chunk_size"] ** 2