We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 2ecea90, commit 768f369 (Copy full SHA for 768f369)
gateloop_transformer/gateloop_transformer.py
@@ -200,8 +200,8 @@ def __init__(
200
self.to_qkv = nn.Linear(dim, dim_inner * 3, bias = False)
201
202
self.to_a = nn.Sequential(
203
- nn.Linear(dim, dim_inner * 2),
204
- Rearrange('b n (h d c) -> (b h) n d c', h = heads, c = 2)
+ nn.Linear(dim, heads * 2),
+ Rearrange('b n (h c) -> (b h) n 1 c', h = heads, c = 2)
205
)
206
207
self.merge_heads = Rearrange('(b h) n d -> b n (h d)', h = heads)
setup.py
@@ -3,7 +3,7 @@
3
setup(
4
name = 'gateloop-transformer',
5
packages = find_packages(exclude=[]),
6
- version = '0.0.15',
+ version = '0.0.16',
7
license='MIT',
8
description = 'GateLoop Transformer',
9
author = 'Phil Wang',
0 commit comments