mirror of
https://github.com/rasbt/LLMs-from-scratch.git
synced 2025-08-04 14:52:17 +00:00
note about dropout
This commit is contained in:
parent
bbb2a0c3d5
commit
85827e0a0b
@ -180,7 +180,7 @@ if __name__ == "__main__":
|
|||||||
"emb_dim": 12, # Embedding dimension
|
"emb_dim": 12, # Embedding dimension
|
||||||
"n_heads": 2, # Number of attention heads
|
"n_heads": 2, # Number of attention heads
|
||||||
"n_layers": 2, # Number of layers
|
"n_layers": 2, # Number of layers
|
||||||
"drop_rate": 0.0, # Dropout rate
|
"drop_rate": 0.0, # Dropout rate, deactivated via 0.0 as dropout in LLMs is not recommended anymore
|
||||||
"qkv_bias": False # Query-key-value bias
|
"qkv_bias": False # Query-key-value bias
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Loading…
x
Reference in New Issue
Block a user