Mirror of https://github.com/rasbt/LLMs-from-scratch.git
Synced 2025-08-28 02:20:13 +00:00
Fix code comment: embed_dim -> d_out (#698)

parent a5ea296259
commit 984cca3f64
@@ -352,7 +352,7 @@
     "    def __init__(self, d_in, d_out, num_heads, context_length, dropout=0.0, qkv_bias=False):\n",
     "        super().__init__()\n",
     "\n",
-    "        assert d_out % num_heads == 0, \"embed_dim is indivisible by num_heads\"\n",
+    "        assert d_out % num_heads == 0, \"d_out is indivisible by num_heads\"\n",
     "\n",
     "        self.num_heads = num_heads\n",
     "        self.context_length = context_length\n",
@@ -588,7 +588,7 @@
     "    def __init__(self, d_in, d_out, num_heads, context_length, dropout=0.0, qkv_bias=False):\n",
     "        super().__init__()\n",
     "\n",
-    "        assert d_out % num_heads == 0, \"embed_dim is indivisible by num_heads\"\n",
+    "        assert d_out % num_heads == 0, \"d_out is indivisible by num_heads\"\n",
     "\n",
     "        self.num_heads = num_heads\n",
     "        self.context_length = context_length\n",
@@ -65,7 +65,7 @@ class PyTorchMultiHeadAttention(nn.Module):
     def __init__(self, d_in, d_out, num_heads, dropout=0.0, qkv_bias=False):
         super().__init__()

-        assert d_out % num_heads == 0, "embed_dim is indivisible by num_heads"
+        assert d_out % num_heads == 0, "d_out is indivisible by num_heads"

         self.num_heads = num_heads
         self.head_dim = d_out // num_heads
@@ -108,7 +108,7 @@ class PyTorchMultiHeadAttention(nn.Module):
     def __init__(self, d_in, d_out, num_heads, dropout=0.0, qkv_bias=False):
         super().__init__()

-        assert d_out % num_heads == 0, "embed_dim is indivisible by num_heads"
+        assert d_out % num_heads == 0, "d_out is indivisible by num_heads"

         self.num_heads = num_heads
         self.head_dim = d_out // num_heads
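
For context on why this assertion exists: multi-head attention splits the d_out output dimension evenly across num_heads heads (head_dim = d_out // num_heads), so d_out must be divisible by num_heads. The new message matches the actual parameter name, d_out; embed_dim does not appear in these signatures. Below is a minimal, self-contained sketch showing the assertion in place. It is not the repository's class: the name MiniMultiHeadAttention and the use of PyTorch's scaled_dot_product_attention (requires PyTorch >= 2.0) are illustrative assumptions.

import torch
import torch.nn as nn


class MiniMultiHeadAttention(nn.Module):
    # Illustrative sketch, not the class changed in this commit.
    def __init__(self, d_in, d_out, num_heads, qkv_bias=False):
        super().__init__()
        assert d_out % num_heads == 0, "d_out is indivisible by num_heads"
        self.num_heads = num_heads
        # Per-head dimension; only an integer if the assert above holds
        self.head_dim = d_out // num_heads
        self.qkv = nn.Linear(d_in, 3 * d_out, bias=qkv_bias)
        self.proj = nn.Linear(d_out, d_out)

    def forward(self, x):
        b, t, _ = x.shape
        # Split the combined q/k/v projection into per-head views of size head_dim
        qkv = self.qkv(x).view(b, t, 3, self.num_heads, self.head_dim)
        q, k, v = qkv.permute(2, 0, 3, 1, 4)  # each: (b, num_heads, t, head_dim)
        out = nn.functional.scaled_dot_product_attention(q, k, v)
        # Merge the heads back into a single d_out dimension
        return self.proj(out.transpose(1, 2).reshape(b, t, -1))


# MiniMultiHeadAttention(d_in=64, d_out=64, num_heads=3) raises
# AssertionError: d_out is indivisible by num_heads (64 % 3 != 0),
# while num_heads=4 constructs fine:
mha = MiniMultiHeadAttention(d_in=64, d_out=64, num_heads=4)
print(mha(torch.randn(2, 8, 64)).shape)  # torch.Size([2, 8, 64])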