Update 第二章 Transformer架构.md

This commit is contained in:
Logan Zou
2025-07-25 16:20:46 +08:00
committed by GitHub
parent 5ac954f813
commit 1d226be0ff

View File

@@ -813,7 +813,7 @@ class Transformer(nn.Module):
n_params = sum(p.numel() for p in self.parameters())
# 如果不统计 embedding 的参数,就减去
if non_embedding:
- n_params -= self.transformer.wpe.weight.numel()
+ n_params -= self.transformer.wte.weight.numel()
return n_params
'''初始化权重'''