From dcb85dc1f8c46bda3ed7b4e4c843d86f81fa292d Mon Sep 17 00:00:00 2001 From: unanmed <1319491857@qq.com> Date: Tue, 28 Apr 2026 17:51:39 +0800 Subject: [PATCH] =?UTF-8?q?chore:=20=E8=B0=83=E6=95=B4=E8=B6=85=E5=8F=82?= =?UTF-8?q?=E6=95=B0?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- ginka/train_pretrain.py | 4 ++-- ginka/train_vq.py | 4 ++-- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/ginka/train_pretrain.py b/ginka/train_pretrain.py index 9e304aa..ab2df99 100644 --- a/ginka/train_pretrain.py +++ b/ginka/train_pretrain.py @@ -41,7 +41,7 @@ MAP_H = MAP_W = 13 # VQ-VAE 超参(保持与 train_vq.py 一致) VQ_L = 2 -VQ_K = 4 +VQ_K = 8 VQ_D_Z = 128 VQ_D_MODEL= 192 VQ_NHEAD = 8 @@ -291,7 +291,7 @@ def train(): f"[{datetime.now().strftime('%Y-%m-%d %H:%M:%S')}] " f"Epoch {epoch + 1:4d} | " f"Loss {loss_total/n:.5f} " - f"CE {ce_total/n:.5f} " + f"Focal {ce_total/n:.5f} " f"Commit {commit_total/n:.5f} " f"Entropy {entropy_total/n:.5f} | " f"LR {scheduler.get_last_lr()[0]:.6f}" diff --git a/ginka/train_vq.py b/ginka/train_vq.py index 2f0bc50..3071252 100644 --- a/ginka/train_vq.py +++ b/ginka/train_vq.py @@ -47,7 +47,7 @@ WALL_MASK_RATIO = 0.8 # VQ-VAE 超参 VQ_L = 2 # summary token 数量(即 z 的序列长度) -VQ_K = 4 # codebook 大小 +VQ_K = 8 # codebook 大小 VQ_D_Z = 128 # codebook 嵌入维度 VQ_D_MODEL= 192 VQ_NHEAD = 8 @@ -695,7 +695,7 @@ def train(): f"[{datetime.now().strftime('%Y-%m-%d %H:%M:%S')}] " f"Epoch {epoch + 1:4d} | " f"Loss {loss_total/n:.5f} " - f"CE {ce_total/n:.5f} " + f"Focal {ce_total/n:.5f} " f"VQ {vq_loss_total/n:.5f} " f"Commit {commit_total/n:.5f} " f"Entropy {entropy_total/n:.5f} "