mirror of
https://github.com/deepseek-ai/DeepSeek-V3.git
synced 2025-02-22 05:38:59 -05:00
Fix Linear Layer Bias Initialization
This commit is contained in:
parent
b5d872ead0
commit
6a30b43249
@@ -185,7 +185,7 @@ class Linear(nn.Module):
|
||||
else:
|
||||
self.register_parameter("scale", None)
|
||||
if bias:
|
||||
- self.bias = nn.Parameter(torch.empty(self.part_out_features))
|
||||
+ self.bias = nn.Parameter(torch.empty(out_features))
|
||||
else:
|
||||
self.register_parameter("bias", None)
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user