Mask

DiscreteMaskedPrior

Bases: DiscretePriorDistribution

A discrete prior distribution that places all probability mass on a single mask token.

Source code in bionemo/moco/distributions/prior/discrete/mask.py
class DiscreteMaskedPrior(DiscretePriorDistribution):
    """A subclass representing a Discrete Masked prior distribution."""

    def __init__(self, num_classes: int = 10, mask_dim: Optional[int] = None, inclusive: bool = True) -> None:
        """Discrete Masked prior distribution.

        Theres 3 ways I can think of defining the problem that are hard to mesh together.

        1. [..., M, ....] inclusive anywhere --> exisiting LLM tokenizer where the mask has a specific location not at the end
        2. [......, M] inclusive on end --> mask_dim = None with inclusive set to True default stick on the end
        3. [.....] + [M] exclusive --> the number of classes representes the number of data classes and one wishes to add a separate MASK dimension.
            - Note the pad_sample function is provided to help add this extra external dimension.

        Args:
            num_classes (int): The number of classes in the distribution. Defaults to 10.
            mask_dim (int): The index for the mask token. Defaults to num_classes - 1 if inclusive or num_classes if exclusive.
            inclusive (bool): Whether the mask is included in the specified number of classes.
                                If True, the mask is considered as one of the classes.
                                If False, the mask is considered as an additional class. Defaults to True.
        """
        if inclusive:
            if mask_dim is None:
                mask_dim = num_classes - 1
            elif mask_dim >= num_classes:
                raise ValueError(
                    "When inclusive, the mask is one of the specified num_classes, so mask_dim cannot be >= num_classes"
                )
            prior_dist = torch.zeros(num_classes)
            prior_dist[mask_dim] = 1.0  # all probability mass on the mask token
            super().__init__(num_classes, prior_dist)
            self.mask_dim = mask_dim
        else:
            prior_dist = torch.zeros(num_classes + 1)
            prior_dist[-1] = 1.0  # the appended class is the mask token
            super().__init__(num_classes + 1, prior_dist)
            self.mask_dim = num_classes
        if abs(torch.sum(self.prior_dist).item() - 1.0) >= 1e-5:
            raise ValueError("Invalid probability distribution. Must sum to 1.0")

    def sample(
        self,
        shape: Tuple,
        mask: Optional[Tensor] = None,
        device: Union[str, torch.device] = "cpu",
        rng_generator: Optional[torch.Generator] = None,
    ) -> Tensor:
        """Generates a specified number of samples.

        Args:
            shape (Tuple): The shape of the samples to generate.
            device (str): cpu or gpu.
            mask (Optional[Tensor]): An optional mask to apply to the samples. Defaults to None.
            rng_generator: An optional :class:`torch.Generator` for reproducible sampling. Defaults to None.

        Returns:
            Float: A tensor of samples.
        """
        # Every element is the mask index, so sampling here is deterministic and rng_generator is unused.
        samples = torch.ones(shape, dtype=torch.int64, device=device) * self.mask_dim
        if mask is not None:
            # Broadcast the mask over any trailing dimensions of the samples, zeroing out masked positions.
            samples = samples * mask[(...,) + (None,) * (len(samples.shape) - len(mask.shape))]
        return samples

    def is_masked(self, sample: Tensor) -> Tensor:
        """Creates a mask for whether a state is masked.

        Args:
            sample (Tensor): The sample to check.

        Returns:
            Tensor: A float tensor indicating whether the sample is masked.
        """
        return (sample == self.mask_dim).float()

    def pad_sample(self, sample: Tensor) -> Tensor:
        """Pads the input sample with zeros along the last dimension.

        Args:
            sample (Tensor): The input sample to be padded.

        Returns:
            Tensor: The padded sample.
        """
        # Create a zeros tensor with the same shape as the original tensor, except the last dimension is 1
        zeros = torch.zeros((*sample.shape[:-1], 1), dtype=sample.dtype, device=sample.device)
        # Concatenate along the last dimension to make the shape (..., N+1)
        padded_sample = torch.cat((sample, zeros), dim=-1)
        return padded_sample
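
A minimal end-to-end sketch (hypothetical values; assumes the class is importable from the module path shown above):

import torch
from bionemo.moco.distributions.prior.discrete.mask import DiscreteMaskedPrior

# Inclusive mode (default): 10 classes with the mask token at index 9.
prior = DiscreteMaskedPrior(num_classes=10)

# Every position of the prior sample is the mask token.
samples = prior.sample(shape=(2, 5))
print(samples)                   # a (2, 5) tensor of 9s

# is_masked flags positions equal to the mask index.
print(prior.is_masked(samples))  # a (2, 5) tensor of 1.0s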

__init__(num_classes=10, mask_dim=None, inclusive=True)

Discrete Masked prior distribution.

There are three ways to define the problem, and they are hard to reconcile (see the sketch after the source code below):

  1. [..., M, ...] inclusive, anywhere --> an existing LLM tokenizer where the mask token sits at a specific index that is not at the end.
  2. [......, M] inclusive, at the end --> mask_dim = None with inclusive = True (the default) places the mask at the last index.
  3. [.....] + [M] exclusive --> num_classes counts only the data classes, and a separate MASK dimension is appended.
    • Note: the pad_sample function is provided to help add this extra external dimension.

Parameters:

  num_classes (int, default 10): The number of classes in the distribution.
  mask_dim (Optional[int], default None): The index of the mask token. Defaults to num_classes - 1 if inclusive, or num_classes if exclusive.
  inclusive (bool, default True): Whether the mask is included in the specified number of classes. If True, the mask is counted as one of the num_classes classes; if False, it is an additional class.
Source code in bionemo/moco/distributions/prior/discrete/mask.py
def __init__(self, num_classes: int = 10, mask_dim: Optional[int] = None, inclusive: bool = True) -> None:
    """Discrete Masked prior distribution.

    Theres 3 ways I can think of defining the problem that are hard to mesh together.

    1. [..., M, ....] inclusive anywhere --> exisiting LLM tokenizer where the mask has a specific location not at the end
    2. [......, M] inclusive on end --> mask_dim = None with inclusive set to True default stick on the end
    3. [.....] + [M] exclusive --> the number of classes representes the number of data classes and one wishes to add a separate MASK dimension.
        - Note the pad_sample function is provided to help add this extra external dimension.

    Args:
        num_classes (int): The number of classes in the distribution. Defaults to 10.
        mask_dim (int): The index for the mask token. Defaults to num_classes - 1 if inclusive or num_classes if exclusive.
        inclusive (bool): Whether the mask is included in the specified number of classes.
                            If True, the mask is considered as one of the classes.
                            If False, the mask is considered as an additional class. Defaults to True.
    """
    if inclusive:
        if mask_dim is None:
            mask_dim = num_classes - 1
        elif mask_dim >= num_classes:
            raise ValueError(
                "When inclusive, the mask is one of the specified num_classes, so mask_dim cannot be >= num_classes"
            )
        prior_dist = torch.zeros(num_classes)
        prior_dist[mask_dim] = 1.0  # all probability mass on the mask token
        super().__init__(num_classes, prior_dist)
        self.mask_dim = mask_dim
    else:
        prior_dist = torch.zeros(num_classes + 1)
        prior_dist[-1] = 1.0  # the appended class is the mask token
        super().__init__(num_classes + 1, prior_dist)
        self.mask_dim = num_classes
    if abs(torch.sum(self.prior_dist).item() - 1.0) >= 1e-5:
        raise ValueError("Invalid probability distribution. Must sum to 1.0")
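
The three configurations from the docstring, as a short sketch (hypothetical values; assumes the import path shown above):

from bionemo.moco.distributions.prior.discrete.mask import DiscreteMaskedPrior

# Case 1: inclusive, mask anywhere -- e.g. a tokenizer whose mask token is index 3 of 10.
prior_anywhere = DiscreteMaskedPrior(num_classes=10, mask_dim=3)
assert prior_anywhere.mask_dim == 3

# Case 2: inclusive, mask at the end (the default) -- the mask index is num_classes - 1.
prior_end = DiscreteMaskedPrior(num_classes=10)
assert prior_end.mask_dim == 9

# Case 3: exclusive -- 10 data classes plus an appended MASK class (11 classes total).
prior_extra = DiscreteMaskedPrior(num_classes=10, inclusive=False)
assert prior_extra.mask_dim == 10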

is_masked(sample)

Creates a mask for whether a state is masked.

Parameters:

  sample (Tensor): The sample to check. Required.

Returns:

  Tensor: A float tensor indicating whether the sample is masked.
Source code in bionemo/moco/distributions/prior/discrete/mask.py
def is_masked(self, sample: Tensor) -> Tensor:
    """Creates a mask for whether a state is masked.

    Args:
        sample (Tensor): The sample to check.

    Returns:
        Tensor: A float tensor indicating whether the sample is masked.
    """
    return (sample == self.mask_dim).float()
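
For example (a small sketch with hypothetical values):

import torch
from bionemo.moco.distributions.prior.discrete.mask import DiscreteMaskedPrior

prior = DiscreteMaskedPrior(num_classes=4)  # mask token at index 3
tokens = torch.tensor([[0, 3, 2], [3, 3, 1]])
print(prior.is_masked(tokens))
# tensor([[0., 1., 0.],
#         [1., 1., 0.]])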

pad_sample(sample)

Pads the input sample with zeros along the last dimension.

Parameters:

  sample (Tensor): The input sample to be padded. Required.

Returns:

  Tensor: The padded sample.

Source code in bionemo/moco/distributions/prior/discrete/mask.py
def pad_sample(self, sample: Tensor) -> Tensor:
    """Pads the input sample with zeros along the last dimension.

    Args:
        sample (Tensor): The input sample to be padded.

    Returns:
        Tensor: The padded sample.
    """
    # Create a zeros tensor with the same shape as the original tensor, except the last dimension is 1
    zeros = torch.zeros((*sample.shape[:-1], 1), dtype=sample.dtype, device=sample.device)
    # Concatenate along the last dimension to make the shape (..., N+1)
    padded_sample = torch.cat((sample, zeros), dim=-1)
    return padded_sample
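
A sketch of the exclusive-mode workflow pad_sample supports (hypothetical shapes): a model emits values over the data classes only, and pad_sample appends a zero column for the external MASK dimension.

import torch
from bionemo.moco.distributions.prior.discrete.mask import DiscreteMaskedPrior

prior = DiscreteMaskedPrior(num_classes=10, inclusive=False)  # 10 data classes + MASK

logits = torch.randn(2, 5, 10)     # (batch, length, data classes)
padded = prior.pad_sample(logits)  # zero column appended for the MASK class
print(padded.shape)                # torch.Size([2, 5, 11])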

sample(shape, mask=None, device='cpu', rng_generator=None)

Generates samples of the given shape, filled with the mask index.

Parameters:

  shape (Tuple): The shape of the samples to generate. Required.
  mask (Optional[Tensor], default None): An optional mask to apply to the samples; positions where the mask is 0 are zeroed out.
  device (Union[str, torch.device], default 'cpu'): The device on which to place the samples.
  rng_generator (Optional[Generator], default None): An optional torch.Generator for reproducible sampling.

Returns:

  Tensor: A tensor of samples.

Source code in bionemo/moco/distributions/prior/discrete/mask.py
def sample(
    self,
    shape: Tuple,
    mask: Optional[Tensor] = None,
    device: Union[str, torch.device] = "cpu",
    rng_generator: Optional[torch.Generator] = None,
) -> Tensor:
    """Generates a specified number of samples.

    Args:
        shape (Tuple): The shape of the samples to generate.
        device (str): cpu or gpu.
        mask (Optional[Tensor]): An optional mask to apply to the samples. Defaults to None.
        rng_generator: An optional :class:`torch.Generator` for reproducible sampling. Defaults to None.

    Returns:
        Float: A tensor of samples.
    """
    # Every element is the mask index, so sampling here is deterministic and rng_generator is unused.
    samples = torch.ones(shape, dtype=torch.int64, device=device) * self.mask_dim
    if mask is not None:
        # Broadcast the mask over any trailing dimensions of the samples, zeroing out masked positions.
        samples = samples * mask[(...,) + (None,) * (len(samples.shape) - len(mask.shape))]
    return samples
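
A sketch of sampling with a padding mask (hypothetical shapes): positions where the mask is 0 are multiplied down to token 0, and the mask is broadcast over any extra trailing dimensions of the samples.

import torch
from bionemo.moco.distributions.prior.discrete.mask import DiscreteMaskedPrior

prior = DiscreteMaskedPrior(num_classes=10)  # mask token at index 9

mask = torch.tensor([[1, 1, 0], [1, 0, 0]])  # (batch, length); 0 marks padding
samples = prior.sample(shape=(2, 3), mask=mask)
print(samples)
# tensor([[9, 9, 0],
#         [9, 0, 0]])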