mirror of
https://github.com/ostris/ai-toolkit.git
synced 2026-04-24 16:29:26 +00:00
Fixed various issues with LLM attention masking. Added block training on the LLM adapter.
This commit is contained in:
@@ -212,6 +212,7 @@ class CustomAdapter(torch.nn.Module):
|
||||
sd=self.sd_ref(),
|
||||
llm=self.te,
|
||||
tokenizer=self.tokenizer,
|
||||
num_cloned_blocks=self.config.num_cloned_blocks,
|
||||
)
|
||||
self.llm_adapter.to(self.device, torch_dtype)
|
||||
elif self.adapter_type == 'te_augmenter':
|
||||
|
||||
Reference in New Issue
Block a user