From 05b3b7c171424d36869b284f82cfc3a91e91a387 Mon Sep 17 00:00:00 2001
From: unanmed <1319491857@qq.com>
Date: Tue, 20 Jan 2026 23:53:31 +0800
Subject: [PATCH] =?UTF-8?q?feat:=20=E7=BC=96=E7=A0=81=E5=99=A8=E7=89=B9?=
 =?UTF-8?q?=E5=BE=81=E8=9E=8D=E5=90=88=E6=B7=BB=E5=8A=A0=E5=BD=92=E4=B8=80?=
 =?UTF-8?q?=E5=8C=96?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 ginka/vae_rnn/decoder.py | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/ginka/vae_rnn/decoder.py b/ginka/vae_rnn/decoder.py
index 6a9c679..2317333 100644
--- a/ginka/vae_rnn/decoder.py
+++ b/ginka/vae_rnn/decoder.py
@@ -104,7 +104,11 @@ class DecoderInputFusion(nn.Module):
             num_layers=2
         )
         self.norm = nn.LayerNorm(d_model)
-        self.fusion = nn.Linear(d_model * 2, d_model)
+        self.fusion = nn.Sequential(
+            nn.Linear(d_model * 2, d_model),
+            nn.LayerNorm(d_model),
+            nn.GELU()
+        )
 
     def forward(
         self, tile_embed: torch.Tensor, cond_vec: torch.Tensor,