2 files changed: +3 -3 lines changed
Original file line number | Diff line number | Diff line change
@@ -181,7 +181,7 @@ def __init__(
181181 heads = None ,
182182 dim_inner = None ,
183183 checkpoint_gate_looped_attn = True ,
184- frac_gradient_state_transition = 0.5
184+ frac_gradient_state_transition = 0.9
185185 ):
186186 super ().__init__ ()
187187 self .frac_gradient_state_transition = frac_gradient_state_transition
@@ -259,7 +259,7 @@ def __init__(
259259 dim_gate_looped_attn = None ,
260260 attn_softmax_normalize = None ,
261261 data_dependent_rel_pos = False ,
262- frac_gradient_state_transition = 0.5 ,
262+ frac_gradient_state_transition = 0.9 ,
263263 ablate_complex = False ,
264264 ablate_state_transition = False ,
265265 rotary_emb = False
Original file line number Diff line number Diff line change 33setup (
44 name = 'gateloop-transformer' ,
55 packages = find_packages (exclude = []),
6- version = '0.0.14' ,
6+ version = '0.0.15' ,
77 license = 'MIT' ,
88 description = 'GateLoop Transformer' ,
99 author = 'Phil Wang' ,
You can’t perform that action at this time.
0 commit comments