Function bodies 170 total

Name: Aljefra Mapper analysis
Creator: Repobility
License: https://repobility.com/legal/terms/

__init__ method · python · L262-L297 (36 LOC)

models/spatial_rope.py

    def __init__(
        self,
        head_dim: int,
        n_reference_types: int = 7,
        max_seq_len: int = 2048,
        base: float = 10000.0,
        spatial_weight: float = 0.5,  # Balance between spatial and temporal
    ):
        super().__init__()
        self.head_dim = head_dim
        self.spatial_weight = spatial_weight

        # Split head_dim between spatial and temporal
        # Each gets half, then split further for sin/cos
        self.spatial_dim = head_dim // 2
        self.temporal_dim = head_dim - self.spatial_dim

        # Ensure dimensions are even for rotation
        if self.spatial_dim % 4 != 0:
            # Adjust to make spatial_dim divisible by 4
            self.spatial_dim = (self.spatial_dim // 4) * 4
            self.temporal_dim = head_dim - self.spatial_dim

        if self.spatial_dim > 0:
            self.spatial_rope = Spatial2DRoPE(
                head_dim=self.spatial_dim,
                n_reference_types=n_reference_types,

forward method · python · L299-L349 (51 LOC)

models/spatial_rope.py

    def forward(
        self,
        q: torch.Tensor,
        k: torch.Tensor,
        channel_indices: torch.Tensor,
        time_indices: torch.Tensor,
        reference_type_ids: Optional[torch.Tensor] = None,
    ) -> Tuple[torch.Tensor, torch.Tensor]:
        """
        Apply combined spatial and temporal RoPE.

        Args:
            q, k: Shape (batch, n_heads, seq_len, head_dim)
            channel_indices: Which channel each position corresponds to (batch, seq_len)
            time_indices: Which time step each position corresponds to (batch, seq_len)
            reference_type_ids: Reference type IDs (batch,)

        Returns:
            q_rotated, k_rotated: Rotated tensors
        """
        batch_size, n_heads, seq_len, head_dim = q.shape

        # Split into spatial and temporal parts
        q_spatial = q[..., :self.spatial_dim]
        q_temporal = q[..., self.spatial_dim:]
        k_spatial = k[..., :self.spatial_dim]
        k_temporal = k[..., self.spatial_d

SpatialAttention class · python · L352-L447 (96 LOC)

models/spatial_rope.py

class SpatialAttention(nn.Module):
    """
    Multi-Head Attention with 2D Spatial RoPE for EEG.

    This attention operates on channels as positions (not time patches).
    Each channel has a 2D position on the scalp, and the attention learns
    spatial relationships modulated by the reference type.

    Use this for cross-channel attention within a time window.
    """

    def __init__(
        self,
        hidden_dim: int,
        n_heads: int,
        n_reference_types: int = 7,
        dropout: float = 0.1,
        use_qk_norm: bool = True,
    ):
        super().__init__()
        self.hidden_dim = hidden_dim
        self.n_heads = n_heads
        self.head_dim = hidden_dim // n_heads
        self.scale = self.head_dim ** -0.5

        if hidden_dim % n_heads != 0:
            raise ValueError(f"hidden_dim ({hidden_dim}) must be divisible by n_heads ({n_heads})")

        # QKV projection
        self.qkv = nn.Linear(hidden_dim, 3 * hidden_dim, bias=False)
        self.out_p

__init__ method · python · L363-L396 (34 LOC)

models/spatial_rope.py

    def __init__(
        self,
        hidden_dim: int,
        n_heads: int,
        n_reference_types: int = 7,
        dropout: float = 0.1,
        use_qk_norm: bool = True,
    ):
        super().__init__()
        self.hidden_dim = hidden_dim
        self.n_heads = n_heads
        self.head_dim = hidden_dim // n_heads
        self.scale = self.head_dim ** -0.5

        if hidden_dim % n_heads != 0:
            raise ValueError(f"hidden_dim ({hidden_dim}) must be divisible by n_heads ({n_heads})")

        # QKV projection
        self.qkv = nn.Linear(hidden_dim, 3 * hidden_dim, bias=False)
        self.out_proj = nn.Linear(hidden_dim, hidden_dim, bias=False)

        # 2D Spatial RoPE
        self.spatial_rope = Spatial2DRoPE(
            head_dim=self.head_dim,
            n_reference_types=n_reference_types,
        )

        # QK normalization
        self.use_qk_norm = use_qk_norm
        if use_qk_norm:
            self.q_norm = RMSNorm(self.head_dim)
            self.k_no

forward method · python · L398-L447 (50 LOC)

models/spatial_rope.py

    def forward(
        self,
        x: torch.Tensor,
        reference_type_ids: Optional[torch.Tensor] = None,
        mask: Optional[torch.Tensor] = None,
    ) -> torch.Tensor:
        """
        Apply spatial attention.

        Args:
            x: Input tensor of shape (batch, n_channels, hidden_dim)
               where n_channels = 19 for standard EEG
            reference_type_ids: Reference type IDs of shape (batch,)
            mask: Optional attention mask

        Returns:
            Output tensor of shape (batch, n_channels, hidden_dim)
        """
        B, N, D = x.shape

        # QKV projection
        qkv = self.qkv(x).reshape(B, N, 3, self.n_heads, self.head_dim)
        q, k, v = qkv.unbind(2)  # Each: (B, N, n_heads, head_dim)
        q = q.transpose(1, 2)  # (B, n_heads, N, head_dim)
        k = k.transpose(1, 2)
        v = v.transpose(1, 2)

        # QK normalization
        if self.use_qk_norm:
            q = self.q_norm(q)
            k = self.k_norm(

SpatialTransformerBlock class · python · L450-L506 (57 LOC)

models/spatial_rope.py

class SpatialTransformerBlock(nn.Module):
    """
    Transformer block with 2D Spatial RoPE for EEG.

    Pre-norm architecture with RMSNorm and SwiGLU FFN.
    """

    def __init__(
        self,
        hidden_dim: int,
        n_heads: int,
        n_reference_types: int = 7,
        dropout: float = 0.1,
        use_qk_norm: bool = True,
    ):
        """
        Build the attention and feed-forward sublayers of the block.

        Args:
            hidden_dim: Width of the residual stream; the size both RMSNorm
                layers and the FFN input/output projections are built with.
            n_heads: Forwarded to SpatialAttention.
            n_reference_types: Forwarded to SpatialAttention.
            dropout: Forwarded to SpatialAttention and also used as the
                probability of the dropout applied to the FFN output.
            use_qk_norm: Forwarded to SpatialAttention.
        """
        super().__init__()

        # Attention sublayer: normalisation followed by spatial attention.
        attention_config = dict(
            hidden_dim=hidden_dim,
            n_heads=n_heads,
            n_reference_types=n_reference_types,
            dropout=dropout,
            use_qk_norm=use_qk_norm,
        )
        self.norm1 = RMSNorm(hidden_dim)
        self.attn = SpatialAttention(**attention_config)

        # Feed-forward sublayer (SwiGLU): w1 and w3 expand to 4x the hidden
        # width, w2 projects back down. None of the projections has a bias.
        self.norm2 = RMSNorm(hidden_dim)
        ffn_dim = 4 * hidden_dim
        self.w1 = nn.Linear(hidden_dim, ffn_dim, bias=False)
        self.w2 = nn.Linear(ffn_dim, hidden_dim, bias=False)
        self.w3 = nn.Linear(hidden_dim, ffn_dim, bias=False)
        self.dropout = nn.Dropout(dropout)

    def forward(

__init__ method · python · L457-L483 (27 LOC)

models/spatial_rope.py

    def __init__(
        self,
        hidden_dim: int,
        n_heads: int,
        n_reference_types: int = 7,
        dropout: float = 0.1,
        use_qk_norm: bool = True,
    ):
        """
        Build the attention and feed-forward sublayers of the block.

        Args:
            hidden_dim: Width of the residual stream; the size both RMSNorm
                layers and the FFN input/output projections are built with.
            n_heads: Forwarded to SpatialAttention.
            n_reference_types: Forwarded to SpatialAttention.
            dropout: Forwarded to SpatialAttention and also used as the
                probability of the dropout applied to the FFN output.
            use_qk_norm: Forwarded to SpatialAttention.
        """
        super().__init__()

        # Attention sublayer: normalisation followed by spatial attention.
        attention_config = dict(
            hidden_dim=hidden_dim,
            n_heads=n_heads,
            n_reference_types=n_reference_types,
            dropout=dropout,
            use_qk_norm=use_qk_norm,
        )
        self.norm1 = RMSNorm(hidden_dim)
        self.attn = SpatialAttention(**attention_config)

        # Feed-forward sublayer (SwiGLU): w1 and w3 expand to 4x the hidden
        # width, w2 projects back down. None of the projections has a bias.
        self.norm2 = RMSNorm(hidden_dim)
        ffn_dim = 4 * hidden_dim
        self.w1 = nn.Linear(hidden_dim, ffn_dim, bias=False)
        self.w2 = nn.Linear(ffn_dim, hidden_dim, bias=False)
        self.w3 = nn.Linear(hidden_dim, ffn_dim, bias=False)
        self.dropout = nn.Dropout(dropout)

Want this analysis on your repo? https://repobility.com/scan/

forward method · python · L485-L506 (22 LOC)

models/spatial_rope.py

    def forward(
        self,
        x: torch.Tensor,
        reference_type_ids: Optional[torch.Tensor] = None,
        mask: Optional[torch.Tensor] = None,
    ) -> torch.Tensor:
        """
        Run the attention sublayer, then the SwiGLU feed-forward sublayer.

        Both sublayers are applied in pre-norm residual form: the input is
        normalised, transformed, and the result is added back onto the
        un-normalised input.

        Args:
            x: Input of shape (batch, n_channels, hidden_dim)
            reference_type_ids: Reference type IDs of shape (batch,)
            mask: Optional attention mask

        Returns:
            The tensor obtained after both residual additions.
        """
        # Attention sublayer; reference ids and mask are handed straight to
        # the attention module.
        attn_out = self.attn(self.norm1(x), reference_type_ids, mask)
        after_attn = x + attn_out

        # SwiGLU sublayer: SiLU-activated gate (w1) times linear branch (w3),
        # projected back by w2, with dropout applied before the residual add.
        normed = self.norm2(after_attn)
        gate = F.silu(self.w1(normed))
        ffn_out = self.w2(gate * self.w3(normed))
        return after_attn + self.dropout(ffn_out)

SpatialChannelEncoder class · python · L509-L598 (90 LOC)

models/spatial_rope.py

class SpatialChannelEncoder(nn.Module):
    """
    Encode EEG channels with spatial awareness.

    This encoder treats each channel as a position with 2D coordinates.
    It processes each time window across all channels, learning spatial
    relationships that are modulated by the reference type.

    Input: (batch, n_channels, time_samples)
    Output: (batch, n_windows, hidden_dim)
    """

    def __init__(
        self,
        n_channels: int = 19,
        hidden_dim: int = 768,
        n_heads: int = 12,
        n_layers: int = 2,  # Fewer layers for spatial processing
        n_reference_types: int = 7,
        window_size: int = 32,
        dropout: float = 0.1,
    ):
        super().__init__()

        self.n_channels = n_channels
        self.hidden_dim = hidden_dim
        self.window_size = window_size

        # Per-channel embedding (window_size -> hidden_dim)
        self.channel_embed = nn.Linear(window_size, hidden_dim)

        # Spatial transformer blocks

__init__ method · python · L521-L555 (35 LOC)

models/spatial_rope.py

    def __init__(
        self,
        n_channels: int = 19,
        hidden_dim: int = 768,
        n_heads: int = 12,
        n_layers: int = 2,  # Fewer layers for spatial processing
        n_reference_types: int = 7,
        window_size: int = 32,
        dropout: float = 0.1,
    ):
        super().__init__()

        self.n_channels = n_channels
        self.hidden_dim = hidden_dim
        self.window_size = window_size

        # Per-channel embedding (window_size -> hidden_dim)
        self.channel_embed = nn.Linear(window_size, hidden_dim)

        # Spatial transformer blocks
        self.spatial_blocks = nn.ModuleList([
            SpatialTransformerBlock(
                hidden_dim=hidden_dim,
                n_heads=n_heads,
                n_reference_types=n_reference_types,
                dropout=dropout,
            )
            for _ in range(n_layers)
        ])

        # Pool across channels to get window representation
        self.channel_pool = nn.Sequential(

forward method · python · L557-L598 (42 LOC)

models/spatial_rope.py

    def forward(
        self,
        x: torch.Tensor,
        reference_type_ids: Optional[torch.Tensor] = None,
    ) -> torch.Tensor:
        """
        Encode EEG with spatial awareness.

        Args:
            x: Input EEG of shape (batch, n_channels, time_samples)
            reference_type_ids: Reference type IDs of shape (batch,)

        Returns:
            Encoded representation of shape (batch, n_windows, hidden_dim)
        """
        batch_size, n_channels, total_samples = x.shape
        n_windows = total_samples // self.window_size

        # Reshape to windows: (batch, n_channels, n_windows, window_size)
        x = x[:, :, :n_windows * self.window_size]
        x = x.view(batch_size, n_channels, n_windows, self.window_size)

        # Process each window with spatial attention
        outputs = []
        for w in range(n_windows):
            # Get window: (batch, n_channels, window_size)
            window = x[:, :, w, :]

            # Embed each channel: (ba

get_reference_type_tensor function · python · L601-L620 (20 LOC)

models/spatial_rope.py

def get_reference_type_tensor(
    reference_names: list,
    device: Optional[torch.device] = None,
) -> torch.Tensor:
    """
    Convert a list of reference names to type IDs.

    Each name is looked up in ``EEGConfig.REFERENCE_TYPES``; names that are
    not present map to the ID stored under the ``'unknown'`` key.

    Args:
        reference_names: List of reference name strings (e.g., ['A1-A2', 'FCz', 'average'])
        device: Target device. ``None`` leaves the tensor on torch's current
            default device.

    Returns:
        Tensor of shape (len(reference_names),) and dtype ``torch.long``
        holding the reference type IDs.

    Raises:
        KeyError: If ``EEGConfig.REFERENCE_TYPES`` has no ``'unknown'`` entry.
    """
    type_table = EEGConfig.REFERENCE_TYPES
    # The fallback ID is the same for every name, so resolve it once.
    unknown_id = type_table['unknown']
    ids = [type_table.get(name, unknown_id) for name in reference_names]

    # Allocate on the requested device directly instead of building the
    # tensor on the default device and copying it afterwards.
    return torch.tensor(ids, dtype=torch.long, device=device)

VariableSpatial2DRoPE class · python · L28-L105 (78 LOC)