From 6b2b36f20ce542e9a131b3ffd360d73eb4ad280a Mon Sep 17 00:00:00 2001 From: unanmed <1319491857@qq.com> Date: Tue, 28 Apr 2026 15:34:36 +0800 Subject: [PATCH] =?UTF-8?q?chore:=20=E8=B0=83=E6=95=B4=E8=B6=85=E5=8F=82?= =?UTF-8?q?=E6=95=B0?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- ginka/train_vq.py | 22 +++++++++++----------- 1 file changed, 11 insertions(+), 11 deletions(-) diff --git a/ginka/train_vq.py b/ginka/train_vq.py index 9649412..6d9eb37 100644 --- a/ginka/train_vq.py +++ b/ginka/train_vq.py @@ -46,21 +46,21 @@ LABEL_SMOOTHING = 0.0 WALL_MASK_RATIO = 0.8 # VQ-VAE 超参 -VQ_L = 16 # summary token 数量(即 z 的序列长度) -VQ_K = 2 # codebook 大小 -VQ_D_Z = 64 # codebook 嵌入维度 -VQ_D_MODEL= 128 -VQ_NHEAD = 4 -VQ_LAYERS = 3 -VQ_DIM_FF = 256 -VQ_BETA = 0.25 # commit loss 权重 -VQ_GAMMA = 0.1 # entropy loss 权重 +VQ_L = 32 # summary token 数量(即 z 的序列长度) +VQ_K = 1 # codebook 大小 +VQ_D_Z = 128 # codebook 嵌入维度 +VQ_D_MODEL= 192 +VQ_NHEAD = 8 +VQ_LAYERS = 4 +VQ_DIM_FF = 512 +VQ_BETA = 0.5 # commit loss 权重 +VQ_GAMMA = 0.0 # entropy loss 权重 # MaskGIT 超参 MG_D_MODEL = 256 MG_NHEAD = 8 -MG_LAYERS = 4 -MG_DIM_FF = 1024 +MG_LAYERS = 6 +MG_DIM_FF = 2048 MG_Z_DROPOUT = 0.1 # 训练时以此概率把 z 替换为随机噪声 MG_STRUCT_DROPOUT= 0.1 # 训练时以此概率将结构标签替换为 null(无条件占位)