# Source code for alphagenome_pytorch.embeddings

import torch
import torch.nn as nn
import torch.nn.functional as F
from . import layers



[docs]
class OutputEmbedder(nn.Module):
    """Output embedder using Conv1d for NCL format (B, C, S).

    Matches JAX `alphagenome_research.model.embeddings.OutputEmbedder`.

    Logic (in the order `forward` applies it):
    1. Conv1d (kernel_size=1) projection to the output channels.
    2. Optional skip connection addition (projected by `project_skip` and
       repeated along the sequence axis when it is shorter).
    3. Norm (`layers.RMSBatchNorm`).
    4. Add organism embedding, broadcast over the sequence axis.
    5. GELU.

    Args:
        in_channels: Number of channels of the main input.
        out_channels: Number of channels after projection; also the width
            of the organism embedding and of the norm.
        num_organisms: Number of rows in the organism embedding table.
    """

    def __init__(self, in_channels, out_channels, num_organisms=2):
        super().__init__()
        self.num_organisms = num_organisms
        self.out_channels = out_channels

        # Use Conv1d(k=1) instead of Linear - same math, native NCL
        # For 128bp: Input 1536 -> Output 3072
        # For 1bp: Input 768 -> Output 1536
        self.project_in = nn.Conv1d(in_channels, out_channels, kernel_size=1)

        # Skip projection - set externally if needed (e.g., for 1bp embedder).
        # While it is None, any skip_x passed to forward() is ignored.
        self.project_skip = None

        self.organism_embed = nn.Embedding(num_organisms, out_channels)
        self.norm = layers.RMSBatchNorm(channels=out_channels)

    def forward(self, x, organism_index, skip_x=None, channels_last=False):
        """Embed `x`, optionally merging a skip input.

        Args:
            x: Main input in NCL layout, (B, C, S).
            organism_index: Integer tensor of organism ids used to index
                `organism_embed`; one id per batch element, so the lookup
                yields (B, C).
            skip_x: Optional skip input, (B, C_skip, S_skip). Only used when
                `project_skip` has been set; otherwise it is ignored.
            channels_last: If True, return (B, S, C) instead of (B, C, S).

        Returns:
            The embedded activations, (B, C, S), or (B, S, C) when
            `channels_last` is True.

        Raises:
            ValueError: If the projected skip length is zero or does not
                evenly divide the projected main sequence length.
        """
        # Project main input
        x_proj = self.project_in(x)

        if skip_x is not None and self.project_skip is not None:
            # skip_x: (B, C_skip, S_skip)
            s_proj = self.project_skip(skip_x)

            target_len = x_proj.shape[2]
            skip_len = s_proj.shape[2]
            # Fail early with a clear message: without this check a length
            # mismatch surfaces as an opaque shape error in the addition
            # below, or broadcasts silently when target_len == 1.
            if skip_len == 0 or target_len % skip_len != 0:
                raise ValueError(
                    f"Skip sequence length ({skip_len}) must be non-zero and "
                    f"evenly divide the main sequence length ({target_len})."
                )

            # Upsample sequence if needed (dim 2 in NCL)
            repeat_factor = target_len // skip_len
            if repeat_factor > 1:
                s_proj = s_proj.repeat_interleave(repeat_factor, dim=2)

            x_proj = x_proj + s_proj

        # Apply norm before the organism embedding is added
        out = self.norm(x_proj)

        # Add organism embedding: (B, C) -> (B, C, 1) for NCL broadcast
        emb = self.organism_embed(organism_index).unsqueeze(2)
        out = out + emb

        out = layers.gelu(out)

        if channels_last:
            # (B, C, S) -> (B, S, C)
            out = out.transpose(1, 2)

        return out




[docs]
class OutputPair(nn.Module):
    """Output embedder for pair activations (B, S, S, D).

    Note: Pair activations use a different format than sequence data.
    LayerNorm operates over the last dimension (features).

    Logic (in the order `forward` applies it):
    1. Symmetrize over the two sequence axes.
    2. Norm (`layers.LayerNorm` with `rms_norm=True`).
    3. Add organism embedding, broadcast over both sequence axes.
    4. GELU.

    Args:
        dim: Feature size D of the pair activations; also the width of the
            organism embedding.
        num_organisms: Number of rows in the organism embedding table.
    """

    def __init__(self, dim=128, num_organisms=2):
        super().__init__()
        self.num_organisms = num_organisms
        self.organism_embed = nn.Embedding(num_organisms, dim)
        self.norm = layers.LayerNorm(normalized_shape=dim, rms_norm=True)

    def forward(self, x, organism_index):
        """Symmetrize, normalize and organism-condition pair activations.

        Args:
            x: Pair activations, (B, S, S, D).
            organism_index: Integer tensor of organism ids used to index
                `organism_embed`; one id per batch element, so the lookup
                yields (B, D).

        Returns:
            Tensor with the same shape as `x`.
        """
        # Symmetrize: average each (i, j) entry with its (j, i) counterpart
        x = (x + x.transpose(1, 2)) / 2.0

        # Apply norm, then add organism embedding, then gelu
        x = self.norm(x)

        emb = self.organism_embed(organism_index)  # (B, D)
        # (B, D) -> (B, 1, 1, D) so it broadcasts over both sequence axes
        x = x + emb[:, None, None, :]

        return layers.gelu(x)