Use pooler embeddings for DFE v6 with dino v3

This commit is contained in:
Jaret Burkett
2026-03-27 07:02:07 -06:00
parent a802014ec5
commit f85bf065bf
2 changed files with 3 additions and 3 deletions

View File

@@ -775,11 +775,11 @@ class DiffusionFeatureExtractor6(nn.Module):
# go from -1 to 1 to 0 to 1
target_img = (target_img + 1) / 2
target_dino_input = self.prepare_inputs(target_img)
target_dino_output = self.model(**target_dino_input, output_hidden_states=True)['hidden_states'][-1].detach()
target_dino_output = self.model(**target_dino_input).pooler_output.detach()
# normalize
target_dino_output = (target_dino_output - target_dino_output.mean()) / (target_dino_output.std() + 1e-6)
pred_dino_input = self.prepare_inputs(pred_images)
pred_dino_output = self.model(**pred_dino_input, output_hidden_states=True)['hidden_states'][-1]
pred_dino_output = self.model(**pred_dino_input).pooler_output
# normalize
pred_dino_output = (pred_dino_output - pred_dino_output.mean()) / (pred_dino_output.std() + 1e-6)
dino_loss = torch.nn.functional.mse_loss(

View File

@@ -1 +1 @@
VERSION = "0.7.31"
VERSION = "0.7.32"