mirror of
https://github.com/deepseek-ai/DeepSeek-Math.git
synced 2025-06-20 16:33:47 -04:00
Add commented options for output attentions and hidden states in DeepSeekMathConfig
This commit is contained in:
parent
735546a4f9
commit
2b3c49c9cb
@@ -21,6 +21,8 @@ class DeepSeekMathConfig:
|
||||
use_cache: bool = True
|
||||
rope_scaling: Optional[dict] = None
|
||||
tie_word_embeddings: bool = False
|
||||
# output_attentions:bool=True
|
||||
# output_hidden_states:int=12
|
||||
|
||||
class RMSNorm(nn.Module):
|
||||
def __init__(self, hidden_size, eps=1e-6):
|
||||
|
Loading…
Reference in New Issue
Block a user