Skip to content

Commit 78405cc

Browse files
committed
increase default frac gradient for state transition projection
1 parent 4c02b43 commit 78405cc

File tree

2 files changed

+3
-3
lines changed

2 files changed

+3
-3
lines changed

gateloop_transformer/gateloop_transformer.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -181,7 +181,7 @@ def __init__(
181 181   heads = None,
182 182   dim_inner = None,
183 183   checkpoint_gate_looped_attn = True,
184     - frac_gradient_state_transition = 0.5
    184 + frac_gradient_state_transition = 0.9
185 185   ):
186 186   super().__init__()
187 187   self.frac_gradient_state_transition = frac_gradient_state_transition
@@ -259,7 +259,7 @@ def __init__(
259 259   dim_gate_looped_attn = None,
260 260   attn_softmax_normalize = None,
261 261   data_dependent_rel_pos = False,
262     - frac_gradient_state_transition = 0.5,
    262 + frac_gradient_state_transition = 0.9,
263 263   ablate_complex = False,
264 264   ablate_state_transition = False,
265 265   rotary_emb = False

setup.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,7 @@
3 3   setup(
4 4   name = 'gateloop-transformer',
5 5   packages = find_packages(exclude=[]),
6   - version = '0.0.14',
  6 + version = '0.0.15',
7 7   license='MIT',
8 8   description = 'GateLoop Transformer',
9 9   author = 'Phil Wang',

0 commit comments

Comments
 (0)