# Source code for torch_brain.nn.rotary_embedding

import torch
import torch.nn as nn
from einops import repeat, rearrange



# [docs] (documentation-link residue from the rendered source page)
class RotaryEmbedding(nn.Module):
    r"""Custom rotary positional embedding layer. This layer generates the angles of
    sinusoids of different frequencies, which are then used to rotate the input data.
    Half of the dimensions are not rotated.

    The first ``dim // 4`` feature pairs are assigned log-spaced periods

    .. math::
        T(i) = t_{\min} \cdot
        \left(\frac{t_{\max}}{t_{\min}}\right)^{2i / \lfloor dim / 2 \rfloor},
        \qquad i = 0, \dots, \lfloor dim / 4 \rfloor - 1

    and the corresponding angular frequencies are
    :math:`\omega(i) = 2\pi / T(i)`. The remaining pairs keep a frequency of zero,
    so their angle is always zero and they are left unrotated.

    To rotate the input data, use :func:`apply_rotary_pos_emb`.

    Args:
        dim (int): Dimensionality of the input data.
        t_min (float, optional): Minimum period of the sinusoids.
        t_max (float, optional): Maximum period of the sinusoids.
    """

    def __init__(self, dim: int, t_min: float = 1e-4, t_max: float = 4.0):
        super().__init__()
        num_pairs = dim // 2  # one angular frequency per pair of features
        num_rotated = dim // 4  # only the first half of the pairs is rotated

        # Even exponents 0, 2, 4, ... normalised by the number of pairs. The range
        # is sized from ``num_rotated`` so it always has exactly as many entries
        # as the slice filled below; ``arange(0, num_pairs, 2)`` is one element too
        # long whenever ``num_pairs`` is odd, which made e.g. ``dim=6`` crash.
        exponents = torch.arange(0, 2 * num_rotated, 2).float() / num_pairs
        periods = t_min * ((t_max / t_min) ** exponents)

        omega = torch.zeros(num_pairs)
        omega[:num_rotated] = 2 * torch.pi / periods

        # Registered as a buffer: stored with the module, but not a parameter.
        self.register_buffer("omega", omega)

    def forward(self, timestamps: torch.Tensor) -> torch.Tensor:
        r"""Computes the rotation angles for given timestamps.

        Args:
            timestamps (torch.Tensor): timestamps tensor.

        Returns:
            torch.Tensor: Angles ``timestamps * omega`` with one extra trailing
            axis of size ``2 * (dim // 2)``. Every angle appears twice in a row so
            that both features of a pair share the same angle.
        """
        # Outer product: each timestamp is multiplied by every frequency.
        angles = torch.einsum("..., f -> ... f", timestamps, self.omega)
        # Duplicate each angle for the two features of its pair: [a, b] -> [a, a, b, b].
        angles = repeat(angles, "... n -> ... (n r)", r=2)
        return angles




def rotate_half(x):
    r"""Rotate every consecutive pair of features along the last axis.

    The last axis is read as pairs ``(x1, x2)``; each pair is replaced by
    ``(-x2, x1)`` and the pairs are flattened back into the original layout.

    Args:
        x (torch.Tensor): Input whose last axis has an even length.

    Returns:
        torch.Tensor: Tensor of the same shape as ``x`` with each pair rotated.
    """
    # Expose the pairs as a trailing axis of length 2.
    pairs = rearrange(x, "... (d r) -> ... d r", r=2)
    first, second = pairs[..., 0], pairs[..., 1]
    # (x1, x2) -> (-x2, x1)
    swapped = torch.stack((-second, first), dim=-1)
    # Merge the pair axis back into the feature axis.
    return rearrange(swapped, "... d r -> ... (d r)")



# [docs] (documentation-link residue from the rendered source page)
def apply_rotary_pos_emb(pos_emb, x, head_dim=2):
    r"""Apply the rotary positional embedding to the input data.

    Computes ``x * cos(pos_emb) + rotate_half(x) * sin(pos_emb)`` after inserting
    a singleton head axis into ``pos_emb`` so that the same angles broadcast over
    every head of ``x``.

    Args:
        pos_emb (torch.Tensor): Angles for different rotations, without a head
            axis.
        x (torch.Tensor): Input data.
        head_dim (int, optional): Index of the head axis in ``x``; a singleton
            axis is inserted into ``pos_emb`` at this position. Any index accepted
            by :meth:`torch.Tensor.unsqueeze` is supported. Defaults to 2.

    Returns:
        torch.Tensor: The rotated data, in the dtype of ``x``.
    """
    dtype = x.dtype
    # The two former einops patterns ("n ... -> n () ..." and
    # "n m ... -> n m () ...") are exactly unsqueeze(1) and unsqueeze(2). A single
    # unsqueeze also covers other positions, which were previously skipped
    # silently and left ``pos_emb`` without a head axis.
    pos_emb = pos_emb.unsqueeze(head_dim)

    # Trig values are cast to the input dtype so the result keeps the dtype of x.
    cos = pos_emb.cos().to(dtype)
    sin = pos_emb.sin().to(dtype)
    x = (x * cos) + (rotate_half(x) * sin)
    return x