Source code for prompt_optimizer.poptim.pulp_optim

from pulp import LpBinary, LpMinimize, LpProblem, LpVariable, lpSum

from prompt_optimizer.poptim.base import PromptOptim


[docs]class PulpOptim(PromptOptim):
    """
    PulpOptim is a prompt optimization technique based on integer linear programming using the Pulp library.

    It inherits from the PromptOptim base class.

    Example:
        >>> from prompt_optimizer.poptim import PulpOptim
        >>> p_optimizer = PulpOptim(p=0.1)
        >>> res = p_optimizer("example prompt...")
        >>> optimized_prompt = res.content
    """

    def __init__(self, p: float = 0.1, verbose: bool = False, metrics: list = []):
        """
        Initializes the PulpOptim.

        Args:
            p (float, optional): The aggression factor controlling the reduction in the number of tokens. Defaults to 0.1. Higher `p` corresponds to lower token output count.
            verbose (bool, optional): Flag indicating whether to enable verbose output. Defaults to False.
            metrics (list, optional): A list of metric names to evaluate during optimization. Defaults to an empty list.
        """
        super().__init__(verbose, metrics)
        self.aggression = p  # will reduce num tokens by aggression*100%

[docs]    def optimize(self, prompt: str) -> str:
        """
        Runs the prompt optimization technique on the prompt.

        Args:
            prompt (str): The prompt text.

        Returns:
            str: The optimized prompt text.
        """
        tokens = prompt.split()
        target_length = int(len(tokens) * (1 - self.aggression))

        x = LpVariable.dicts("x", range(len(tokens)), cat=LpBinary)

        # Define the objective function to minimize the number of deleted tokens
        model = LpProblem("Extractive Compression", LpMinimize)
        model += lpSum([1 - x[i] for i in range(len(tokens))])

        # Constraints to ensure that the compressed text has the target length
        model += lpSum([x[i] for i in range(len(tokens))]) == target_length

        # Constraints for compressed text is a subsequence of the original text
        for i in range(len(tokens)):
            for j in range(i + 1, len(tokens)):
                if tokens[i] == tokens[j]:
                    model += x[i] <= x[j]

        # Solve the optimization problem
        model.solve()

        # Extract the indices of the selected tokens
        selected_indices = [i for i in range(len(tokens)) if x[i].value() == 1]

        # Generate the compressed text
        opti_prompt = " ".join([tokens[i] for i in selected_indices])
        return opti_prompt