diff --git a/backends/exllamav2/model.py b/backends/exllamav2/model.py index 58a965f..647f2fa 100644 --- a/backends/exllamav2/model.py +++ b/backends/exllamav2/model.py @@ -937,6 +937,7 @@ class ExllamaV2Container: self.generator, input_ids=input_ids, max_new_tokens=max_tokens, + min_new_tokens=min_tokens, gen_settings=gen_settings, stop_conditions=stop_conditions, decode_special_tokens=decode_special_tokens,