mirror of
https://github.com/ostris/ai-toolkit.git
synced 2026-05-11 08:20:35 +00:00
Fix saving for hidream-o1
This commit is contained in:
@@ -2104,7 +2104,7 @@ class Qwen3VLCausalLMOutputWithPast(ModelOutput):
|
||||
|
||||
class Qwen3VLForConditionalGeneration(Qwen3VLPreTrainedModel, GenerationMixin):
|
||||
_checkpoint_conversion_mapping = {}
|
||||
_tied_weights_keys = ["lm_head.weight"]
|
||||
_tied_weights_keys = {"lm_head.weight": "model.language_model.embed_tokens.weight"}
|
||||
# Reference: fix gemma3 grad acc #37208
|
||||
accepts_loss_kwargs = False
|
||||
config: Qwen3VLConfig
|
||||
|
||||
Reference in New Issue
Block a user