# Source code for llm_samplers.base

from abc import ABC, abstractmethod
from typing import Any

import torch



# [docs]
class BaseSampler(ABC):
    """Base class for all samplers.

    Subclasses must implement :meth:`sample`. The helper methods below cover
    the usual steps of one decoding iteration: fetch next-token logits
    (:meth:`_get_logits`), transform them (:meth:`_apply_sampling`), and draw
    token IDs (:meth:`_sample_from_logits`).
    """

    def __init__(self) -> None:
        """Record the preferred torch device (CUDA when available, else CPU)."""
        # NOTE: the helpers in this base class never move tensors to
        # ``self.device`` themselves; it is only stored here.
        self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

    @abstractmethod
    def sample(
        self,
        model: Any,
        input_ids: torch.Tensor,
        max_length: int = 100,
        num_return_sequences: int = 1,
        **kwargs: Any,
    ) -> torch.Tensor:
        """
        Sample from the model using the specific sampling strategy.

        Args:
            model: The language model to sample from
            input_ids: Input token IDs
            max_length: Maximum length of the generated sequence
            num_return_sequences: Number of sequences to return
            **kwargs: Additional arguments specific to the sampler

        Returns:
            torch.Tensor: Generated token IDs
        """

    def _get_logits(self, model: Any, input_ids: torch.Tensor) -> torch.Tensor:
        """
        Get the logits from the model for the given input.

        The model is called as ``model(input_ids)`` with gradient tracking
        disabled, and its result must expose a ``.logits`` attribute.

        Args:
            model: The language model
            input_ids: Input token IDs

        Returns:
            torch.Tensor: Logits at the last position of the second dimension
            (``outputs.logits[:, -1, :]``)
        """
        with torch.no_grad():
            outputs = model(input_ids)
            # Keep only the final position along dim 1.
            # Assumes logits are laid out as (batch, sequence, vocab) -- TODO confirm.
            logits = outputs.logits[:, -1, :]
        return logits

    def _apply_sampling(self, logits: torch.Tensor) -> torch.Tensor:
        """
        Apply the sampling strategy to the logits.

        The base implementation is the identity: it returns ``logits``
        unchanged.

        Args:
            logits: Raw logits from the model

        Returns:
            torch.Tensor: Processed logits ready for sampling
        """
        return logits

    def _sample_from_logits(
        self, logits: torch.Tensor, num_samples: int = 1
    ) -> torch.Tensor:
        """
        Sample from the processed logits.

        Args:
            logits: Processed logits
            num_samples: Number of samples to generate

        Returns:
            torch.Tensor: Sampled token IDs, with ``num_samples`` entries along
            the last dimension
        """
        # Normalise over the last dimension so each row is a distribution.
        probs = torch.softmax(logits, dim=-1)
        # torch.multinomial draws without replacement by default, so
        # ``num_samples`` must not exceed the number of entries with non-zero
        # probability in any row.
        return torch.multinomial(probs, num_samples=num_samples)