diff --git a/local_attention/rotary.py b/local_attention/rotary.py index 800223a..7427bad 100644 --- a/local_attention/rotary.py +++ b/local_attention/rotary.py @@ -30,7 +30,7 @@ def __init__( scale = (torch.arange(0, dim, 2) + 0.4 * dim) / (1.4 * dim) self.register_buffer('scale', scale, persistent = False) - self.apply_rotary_pos_emb = apply_rotary_pos_emb + self.apply_rotary_pos_emb = staticmethod(apply_rotary_pos_emb) @autocast(enabled = False) def forward(self, x): diff --git a/setup.py b/setup.py index 9dc348f..901227e 100644 --- a/setup.py +++ b/setup.py @@ -3,7 +3,7 @@ setup( name = 'local-attention', packages = find_packages(), - version = '1.9.9', + version = '1.9.10', license='MIT', description = 'Local attention, window with lookback, for language modeling', long_description_content_type = 'text/markdown',