Skip to content

Commit

Permalink
increase default frac gradient for state transition projection
Browse files Browse the repository at this point in the history
  • Loading branch information
lucidrains committed Nov 10, 2023
1 parent 4c02b43 commit 78405cc
Show file tree
Hide file tree
Showing 2 changed files with 3 additions and 3 deletions.
4 changes: 2 additions & 2 deletions gateloop_transformer/gateloop_transformer.py
Original file line number Diff line number Diff line change
Expand Up @@ -181,7 +181,7 @@ def __init__(
heads = None,
dim_inner = None,
checkpoint_gate_looped_attn = True,
- frac_gradient_state_transition = 0.5
+ frac_gradient_state_transition = 0.9
):
super().__init__()
self.frac_gradient_state_transition = frac_gradient_state_transition
Expand Down Expand Up @@ -259,7 +259,7 @@ def __init__(
dim_gate_looped_attn = None,
attn_softmax_normalize = None,
data_dependent_rel_pos = False,
- frac_gradient_state_transition = 0.5,
+ frac_gradient_state_transition = 0.9,
ablate_complex = False,
ablate_state_transition = False,
rotary_emb = False
Expand Down
2 changes: 1 addition & 1 deletion setup.py
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,7 @@
setup(
name = 'gateloop-transformer',
packages = find_packages(exclude=[]),
- version = '0.0.14',
+ version = '0.0.15',
license='MIT',
description = 'GateLoop Transformer',
author = 'Phil Wang',
Expand Down

0 comments on commit 78405cc

Please sign in to comment.