Added experimental options for the vision direct encoder (conv pooling, conv pooling stacks, sparse autoencoder dim)

2026-01-26 16:39:47 +00:00 · 2024-10-10 19:42:26 +00:00
parent ab22674980
commit 3922981996
4 changed files with 101 additions and 23 deletions
--- a/toolkit/config_modules.py
+++ b/toolkit/config_modules.py
@@ -211,6 +211,11 @@ class AdapterConfig:
        self.pixtral_random_image_size: int = kwargs.get('pixtral_random_image_size', False)

        self.flux_only_double: bool = kwargs.get('flux_only_double', False)
+        
+        # train and use a conv layer to pool the embedding
+        self.conv_pooling: bool = kwargs.get('conv_pooling', False)
+        self.conv_pooling_stacks: int = kwargs.get('conv_pooling_stacks', 1)
+        self.sparse_autoencoder_dim: Optional[int] = kwargs.get('sparse_autoencoder_dim', None)


 class EmbeddingConfig: