mirror of
https://github.com/turboderp-org/exllamav2.git
synced 2026-04-20 14:29:28 +00:00
Remove TODO items
This commit is contained in:
@@ -42,8 +42,6 @@ class ExLlamaV2BaseGenerator:
|
||||
return self.sequence_ids.shape[-1] >= self.model.config.max_seq_len
|
||||
|
||||
|
||||
# TODO: Argument to allow different random samples over batch dimension
|
||||
|
||||
def generate_simple(self, prompt: str or list,
|
||||
gen_settings: ExLlamaV2Sampler.Settings,
|
||||
num_tokens: int,
|
||||
|
||||
@@ -173,7 +173,6 @@ class ExLlamaV2:
|
||||
constant_size = sincos_size * 2
|
||||
|
||||
# Max size of hidden state
|
||||
# TODO: Option to reserve space for cache while loading model
|
||||
|
||||
state_size = self.config.hidden_size * self.config.max_input_len * self.config.max_batch_size * 2
|
||||
mask_size = self.config.max_input_len ** 2 * self.config.max_batch_size * 2
|
||||
|
||||
Reference in New Issue
Block a user