Metric Interfaces - API Reference¶

`warprec.evaluation.metrics.base_metric.BaseMetric` ¶

Bases: Metric, ABC

The base definition of a metric using Torchmetrics.

Source code in warprec/evaluation/metrics/base_metric.py

class BaseMetric(Metric, ABC):
    """The base definition of a metric using Torchmetrics.

    Groups the tensor helpers shared by the concrete metrics (relevance
    transforms, top-k selection, popularity/novelty profiles and AUC-style
    area statistics) and exposes the metric name and the set of
    pre-computed components the metric requires.
    """

    _REQUIRED_COMPONENTS: Set[MetricBlock] = (
        set()
    )  # This defines the data that needs to be pre-computed

    @abstractmethod
    def compute(self) -> dict[str, float]:
        """Compute the final metric value from the accumulated state."""
        pass

    @classmethod
    def binary_relevance(cls, target: Tensor) -> Tensor:
        """Compute the binary relevance tensor.

        Args:
            target (Tensor): The target tensor.

        Returns:
            Tensor: A float tensor holding 1.0 where ``target > 0``
                and 0.0 elsewhere.
        """
        return (target > 0).float()

    @classmethod
    def discounted_relevance(cls, target: Tensor) -> Tensor:
        """Compute the discounted relevance tensor.

        Args:
            target (Tensor): The target tensor.

        Returns:
            Tensor: ``2 ** (target + 1) - 1`` where ``target > 0``;
                the original value elsewhere.
        """
        return torch.where(target > 0, 2 ** (target + 1) - 1, target)

    @classmethod
    def valid_users(cls, target: Tensor) -> Tensor:
        """Compute the per-user validity mask.

        Args:
            target (Tensor): The target tensor.

        Returns:
            Tensor: A float tensor containing 1 for each row that has
                at least one positive entry, or 0 otherwise.
        """
        return (target > 0).any(dim=1).float()

    @classmethod
    def top_k_values_indices(cls, preds: Tensor, k: int) -> Tuple[Tensor, Tensor]:
        """Compute the top k indices and values.

        Args:
            preds (Tensor): The prediction tensor
            k (int): The value of cutoff.

        Returns:
            Tuple[Tensor, Tensor]:
                - Tensor: The values tensor.
                - Tensor: The indices tensor
        """
        return torch.topk(preds, k, dim=1)

    @classmethod
    def top_k_relevance_from_indices(
        cls, target: Tensor, top_k_indices: Tensor
    ) -> Tensor:
        """Compute the top k relevance tensor from pre-computed indices.

        Args:
            target (Tensor): The target tensor.
            top_k_indices (Tensor): The top k indices.

        Returns:
            Tensor: The entries of ``target`` gathered along dim 1
                at ``top_k_indices``.
        """
        return torch.gather(target, dim=1, index=top_k_indices)

    @classmethod
    def top_k_relevance(cls, preds: Tensor, target: Tensor, k: int) -> Tensor:
        """Compute the top k relevance tensor.

        Args:
            preds (Tensor): The prediction tensor
            target (Tensor): The target tensor.
            k (int): The value of cutoff.

        Returns:
            Tensor: The entries of ``target`` at the positions of the
                ``k`` largest predictions of each row.
        """
        _, top_k_indices = torch.topk(preds, k, dim=1)
        return torch.gather(target, dim=1, index=top_k_indices)

    def compute_head_tail(
        self, item_interactions: Tensor, pop_ratio: float = 0.8
    ) -> Tuple[Tensor, Tensor]:
        """Compute popularity as tensors of the short head and long tail.

        Items are ordered by decreasing interaction count; the short head
        is the smallest prefix whose cumulative count exceeds
        ``pop_ratio`` times the total count. When no prefix exceeds that
        threshold (e.g. ``pop_ratio >= 1`` or no interactions at all),
        every item is placed in the short head and the long tail is empty.

        Args:
            item_interactions (Tensor): The counts for item interactions in training set.
            pop_ratio (float): The share of total interactions the short
                head must exceed.

        Returns:
            Tuple[Tensor, Tensor]:
                - Tensor: The tensor containing indices of short head items.
                - Tensor: The tensor containing indices of long tail items.
        """
        # Order item popularity
        sorted_interactions, sorted_indices = torch.sort(
            item_interactions, descending=True
        )

        # Determine short head cutoff based on cumulative popularity
        cumulative_pop = torch.cumsum(sorted_interactions, dim=0)
        total_interactions = item_interactions.sum()
        over_threshold = torch.where(
            cumulative_pop > total_interactions * pop_ratio
        )[0]

        # The threshold may never be exceeded; indexing the first match
        # would fail, so fall back to "everything is short head".
        if over_threshold.numel() == 0:
            return sorted_indices, sorted_indices[:0]

        cutoff_index = over_threshold[0]

        # Extract indexes from sorted interactions
        short_head_indices = sorted_indices[
            : cutoff_index + 1
        ]  # Include the item at the cutoff
        long_tail_indices = sorted_indices[cutoff_index + 1 :]

        return short_head_indices, long_tail_indices

    def compute_popularity(self, item_interactions: Tensor) -> Tensor:
        """Compute popularity tensor based on the interactions.

        Args:
            item_interactions (Tensor): The counts for item interactions in training set.

        Returns:
            Tensor: The interaction count for each item, clamped to a
                minimum of 1.
        """
        # Avoid division by zero: set minimum interaction
        # count to 1 if any item has zero interactions
        item_interactions = torch.clamp(item_interactions, min=1)
        return item_interactions

    def compute_novelty_profile(
        self, item_interactions: Tensor, num_users: int, log_discount: bool = False
    ) -> Tensor:
        """Compute the novelty profile based on the count of interactions.

        Args:
            item_interactions (Tensor): The counts for item interactions in training set.
            num_users (int): Number of users in the training set.
            log_discount (bool): Whether or not to compute the discounted novelty.

        Returns:
            Tensor: A tensor with a leading dimension of size 1 that
                contains the novelty score for each item, followed by
                one extra padding entry.
        """
        # The total is taken before clamping, so it reflects raw counts
        total_interactions = item_interactions.sum()

        # Avoid division by zero: set minimum interaction
        # count to 1 if any item has zero interactions
        item_interactions = torch.clamp(item_interactions, min=1)

        # Add padding value
        padding_value = torch.zeros(1, device=item_interactions.device)
        item_interactions = torch.cat((item_interactions, padding_value), dim=0)

        # Compute novelty scores
        if log_discount:
            return -torch.log2(item_interactions / total_interactions).unsqueeze(0)
        return (1 - (item_interactions / num_users)).unsqueeze(0)

    def compute_area_stats(
        self, preds: Tensor, target: Tensor, num_items: int, k: Optional[int] = None
    ) -> Tuple[Tensor, Tensor]:
        """Computes the Area per user and the Number of Positives per user.

        Args:
            preds (Tensor): Predictions tensor.
            target (Tensor): Binary relevance tensor.
            num_items (int): Total number of items.
            k (Optional[int]): Cutoff for top-k evaluation. If None, considers all items.

        Returns:
            Tuple[Tensor, Tensor]:
                - Tensor: Area per user.
                - Tensor: Number of positives per user.
        """
        device = preds.device
        batch_size = preds.shape[0]

        # Negative samples count
        # Logic: Total - Train(masked) - Target + 1
        # Entries equal to -inf in preds are counted as masked train items
        train_set = torch.isinf(preds).logical_and(preds < 0).sum(dim=1)
        target_set = target.sum(dim=1)
        neg_num = (num_items - train_set - target_set + 1).unsqueeze(1)

        # Sorting
        _, sorted_preds = torch.sort(preds, dim=1, descending=True)
        sorted_target = torch.gather(target, 1, sorted_preds)

        # Optional slicing for top-k
        if k is not None:
            sorted_target = sorted_target[:, :k]

        # Effective Rank and Progressive Position
        # Create column indices [0, 1, 2, ...]
        col_indices = torch.arange(sorted_target.shape[1], device=device).expand(
            batch_size, -1
        )

        # Zero-based rank of each positive; 0 for non-positives
        effective_rank = torch.where(
            sorted_target == 1, col_indices, torch.tensor(0.0, device=device)
        )

        # Number of positives ranked before each positive
        cumsum = torch.cumsum(sorted_target, dim=1)
        progressive_position = torch.where(
            sorted_target == 1, cumsum - 1, sorted_target
        )

        # AUC Matrix Calculation
        # Formula: (Neg - Eff + Prog) / Neg
        auc_matrix = torch.where(
            sorted_target > 0,
            ((neg_num - effective_rank + progressive_position) / neg_num),
            sorted_target,  # This puts 0 where target is 0
        )

        # Aggregation per user
        area_per_user = auc_matrix.sum(dim=1)
        positives_per_user = sorted_target.sum(dim=1)

        return area_per_user, positives_per_user

    @property
    def name(self):
        """The name of the metric."""
        return self.__class__.__name__

    @property
    def components(self):
        """The required components to compute the metric."""
        return self._REQUIRED_COMPONENTS

`components` `property` ¶

The required components to compute the metric.

`name` `property` ¶

The name of the metric.

`binary_relevance(target)` `classmethod` ¶

Compute the binary relevance tensor.

Parameters:

Name	Type	Description	Default
`target`	`Tensor`	The target tensor.	required

Returns:

Name	Type	Description
`Tensor`	`Tensor`	The binary relevance tensor.

Source code in warprec/evaluation/metrics/base_metric.py

@classmethod
def binary_relevance(cls, target: Tensor) -> Tensor:
    """Binarize the target tensor.

    Args:
        target (Tensor): The target tensor.

    Returns:
        Tensor: A float tensor with 1.0 where ``target`` is strictly
            positive and 0.0 elsewhere.
    """
    is_relevant = target > 0
    return is_relevant.float()

`compute_area_stats(preds, target, num_items, k=None)` ¶

Computes the Area per user and the Number of Positives per user.

Parameters:

Name	Type	Description	Default
`preds`	`Tensor`	Predictions tensor.	required
`target`	`Tensor`	Binary relevance tensor.	required
`num_items`	`int`	Total number of items.	required
`k`	`Optional[int]`	Cutoff for top-k evaluation. If None, considers all items.	`None`

Returns:

Type	Description
`Tuple[Tensor, Tensor]`	A pair of tensors: (1) the area per user; (2) the number of positives per user.

Source code in warprec/evaluation/metrics/base_metric.py

def compute_area_stats(
    self, preds: Tensor, target: Tensor, num_items: int, k: Optional[int] = None
) -> Tuple[Tensor, Tensor]:
    """Return the per-user area and the per-user number of positives.

    Args:
        preds (Tensor): Predictions tensor.
        target (Tensor): Binary relevance tensor.
        num_items (int): Total number of items.
        k (Optional[int]): Cutoff for top-k evaluation. If None, considers all items.

    Returns:
        Tuple[Tensor, Tensor]:
            - Tensor: Area per user.
            - Tensor: Number of positives per user.
    """
    n_rows = preds.shape[0]
    dev = preds.device

    # Negatives per user: total - masked (-inf predictions) - positives + 1
    masked_count = (torch.isinf(preds) & (preds < 0)).sum(dim=1)
    positive_count = target.sum(dim=1)
    negatives = (num_items - masked_count - positive_count + 1).unsqueeze(1)

    # Reorder the targets by decreasing prediction score
    ranking = torch.sort(preds, dim=1, descending=True)[1]
    ranked_target = target.gather(1, ranking)

    # Keep only the first k ranked positions when a cutoff is given
    if k is not None:
        ranked_target = ranked_target[:, :k]

    is_hit = ranked_target == 1

    # Zero-based rank of every hit (0 elsewhere)
    positions = torch.arange(ranked_target.shape[1], device=dev).expand(n_rows, -1)
    hit_rank = torch.where(is_hit, positions, torch.tensor(0.0, device=dev))

    # Number of hits ranked before each hit
    running_hits = torch.cumsum(ranked_target, dim=1)
    hits_before = torch.where(is_hit, running_hits - 1, ranked_target)

    # Per-hit contribution: (negatives - rank + hits_before) / negatives
    per_hit_area = (negatives - hit_rank + hits_before) / negatives
    area = torch.where(ranked_target > 0, per_hit_area, ranked_target)

    return area.sum(dim=1), ranked_target.sum(dim=1)

`compute_head_tail(item_interactions, pop_ratio=0.8)` ¶

Compute popularity as tensors of the short head and long tail.

Parameters:

Name	Type	Description	Default
`item_interactions`	`Tensor`	The counts for item interactions in training set.	required
`pop_ratio`	`float`	The share of total interactions that the cumulative count of the short head must exceed.	`0.8`

Returns:

Type	Description
`Tuple[Tensor, Tensor]`	A pair of tensors: (1) the indices of the short head items; (2) the indices of the long tail items.

Source code in warprec/evaluation/metrics/base_metric.py

def compute_head_tail(
    self, item_interactions: Tensor, pop_ratio: float = 0.8
) -> Tuple[Tensor, Tensor]:
    """Compute popularity as tensors of the short head and long tail.

    Items are ordered by decreasing interaction count; the short head is
    the smallest prefix whose cumulative count exceeds ``pop_ratio`` times
    the total count. When no prefix exceeds that threshold (e.g.
    ``pop_ratio >= 1`` or no interactions at all), every item is placed in
    the short head and the long tail is empty.

    Args:
        item_interactions (Tensor): The counts for item interactions in training set.
        pop_ratio (float): The share of total interactions the short
            head must exceed.

    Returns:
        Tuple[Tensor, Tensor]:
            - Tensor: The tensor containing indices of short head items.
            - Tensor: The tensor containing indices of long tail items.
    """
    # Order item popularity
    sorted_interactions, sorted_indices = torch.sort(
        item_interactions, descending=True
    )

    # Determine short head cutoff based on cumulative popularity
    cumulative_pop = torch.cumsum(sorted_interactions, dim=0)
    total_interactions = item_interactions.sum()
    over_threshold = torch.where(
        cumulative_pop > total_interactions * pop_ratio
    )[0]

    # The threshold may never be exceeded; indexing the first match would
    # fail, so fall back to "everything is short head".
    if over_threshold.numel() == 0:
        return sorted_indices, sorted_indices[:0]

    cutoff_index = over_threshold[0]

    # Extract indexes from sorted interactions
    short_head_indices = sorted_indices[
        : cutoff_index + 1
    ]  # Include the item at the cutoff
    long_tail_indices = sorted_indices[cutoff_index + 1 :]

    return short_head_indices, long_tail_indices

`compute_novelty_profile(item_interactions, num_users, log_discount=False)` ¶

Compute the novelty profile based on the count of interactions.

Parameters:

Name	Type	Description	Default
`item_interactions`	`Tensor`	The counts for item interactions in training set.	required
`num_users`	`int`	Number of users in the training set.	required
`log_discount`	`bool`	Whether or not to compute the discounted novelty.	`False`

Returns:

Name	Type	Description
`Tensor`	`Tensor`	A tensor that contains the novelty score for each item.

Source code in warprec/evaluation/metrics/base_metric.py

def compute_novelty_profile(
    self, item_interactions: Tensor, num_users: int, log_discount: bool = False
) -> Tensor:
    """Build the per-item novelty profile from interaction counts.

    Args:
        item_interactions (Tensor): The counts for item interactions in training set.
        num_users (int): Number of users in the training set.
        log_discount (bool): Whether or not to compute the discounted novelty.

    Returns:
        Tensor: A tensor with a leading dimension of size 1 holding the
            novelty score of each item plus one trailing padding entry.
    """
    # Sum the raw counts first: the clamp below must not affect the total
    interaction_sum = item_interactions.sum()

    # Items without interactions count as 1 to avoid division by zero
    clamped = item_interactions.clamp(min=1)

    # Append a single zero entry used as padding
    pad = torch.zeros(1, device=clamped.device)
    padded = torch.cat((clamped, pad), dim=0)

    if not log_discount:
        novelty = 1 - (padded / num_users)
    else:
        novelty = -torch.log2(padded / interaction_sum)
    return novelty.unsqueeze(0)

`compute_popularity(item_interactions)` ¶

Compute popularity tensor based on the interactions.

Parameters:

Name	Type	Description	Default
`item_interactions`	`Tensor`	The counts for item interactions in training set.	required

Returns:

Name	Type	Description
`Tensor`	`Tensor`	The interaction count for each item.

Source code in warprec/evaluation/metrics/base_metric.py

def compute_popularity(self, item_interactions: Tensor) -> Tensor:
    """Return the item interaction counts with a floor of 1.

    Args:
        item_interactions (Tensor): The counts for item interactions in training set.

    Returns:
        Tensor: The interaction count for each item, clamped to a
            minimum of 1.
    """
    # A floor of 1 keeps later divisions by these counts well defined
    return item_interactions.clamp(min=1)

`discounted_relevance(target)` `classmethod` ¶

Compute the discounted relevance tensor.

Parameters:

Name	Type	Description	Default
`target`	`Tensor`	The target tensor.	required

Returns:

Name	Type	Description
`Tensor`	`Tensor`	The discounted relevance tensor.

Source code in warprec/evaluation/metrics/base_metric.py

@classmethod
def discounted_relevance(cls, target: Tensor) -> Tensor:
    """Map positive targets to their exponential gain.

    Args:
        target (Tensor): The target tensor.

    Returns:
        Tensor: ``2 ** (target + 1) - 1`` where ``target`` is strictly
            positive; the original value elsewhere.
    """
    is_positive = target > 0
    gain = 2 ** (target + 1) - 1
    return torch.where(is_positive, gain, target)

`top_k_relevance(preds, target, k)` `classmethod` ¶

Compute the top k relevance tensor.

Parameters:

Name	Type	Description	Default
`preds`	`Tensor`	The prediction tensor	required
`target`	`Tensor`	The target tensor.	required
`k`	`int`	The value of cutoff.	required

Returns:

Name	Type	Description
`Tensor`	`Tensor`	The top k relevance tensor.

Source code in warprec/evaluation/metrics/base_metric.py

@classmethod
def top_k_relevance(cls, preds: Tensor, target: Tensor, k: int) -> Tensor:
    """Gather the target values of the k highest-scored entries per row.

    Args:
        preds (Tensor): The prediction tensor
        target (Tensor): The target tensor.
        k (int): The value of cutoff.

    Returns:
        Tensor: The top k relevance tensor.
    """
    best_positions = preds.topk(k, dim=1)[1]
    return target.gather(dim=1, index=best_positions)

`top_k_relevance_from_indices(target, top_k_indices)` `classmethod` ¶

Compute the top k relevance tensor.

Parameters:

Name	Type	Description	Default
`target`	`Tensor`	The target tensor.	required
`top_k_indices`	`Tensor`	The top k indices.	required

Returns:

Name	Type	Description
`Tensor`	`Tensor`	The top k relevance tensor.

Source code in warprec/evaluation/metrics/base_metric.py

@classmethod
def top_k_relevance_from_indices(
    cls, target: Tensor, top_k_indices: Tensor
) -> Tensor:
    """Gather the target values at already-computed top k positions.

    Args:
        target (Tensor): The target tensor.
        top_k_indices (Tensor): The top k indices.

    Returns:
        Tensor: The top k relevance tensor.
    """
    return target.gather(dim=1, index=top_k_indices)

`top_k_values_indices(preds, k)` `classmethod` ¶

Compute the top k indices and values.

Parameters:

Name	Type	Description	Default
`preds`	`Tensor`	The prediction tensor	required
`k`	`int`	The value of cutoff.	required

Returns:

Type	Description
`Tuple[Tensor, Tensor]`	A pair of tensors: (1) the top k values; (2) the top k indices.

Source code in warprec/evaluation/metrics/base_metric.py

@classmethod
def top_k_values_indices(cls, preds: Tensor, k: int) -> Tuple[Tensor, Tensor]:
    """Select the k largest predictions of each row.

    Args:
        preds (Tensor): The prediction tensor
        k (int): The value of cutoff.

    Returns:
        Tuple[Tensor, Tensor]:
            - Tensor: The values tensor.
            - Tensor: The indices tensor
    """
    return preds.topk(k, dim=1)

`valid_users(target)` `classmethod` ¶

Compute a per-user validity mask: 1 for each user with at least one positive target entry, 0 otherwise.

Parameters:

Name	Type	Description	Default
`target`	`Tensor`	The target tensor.	required

Returns:

Name	Type	Description
`Tensor`	`Tensor`	A Tensor containing 1 if a user is valid or 0 otherwise.

Source code in warprec/evaluation/metrics/base_metric.py

@classmethod
def valid_users(cls, target: Tensor) -> Tensor:
    """Flag the rows that contain at least one positive target.

    Args:
        target (Tensor): The target tensor.

    Returns:
        Tensor: A float tensor containing 1 if a user is valid
            or 0 otherwise.
    """
    has_positive = torch.any(target > 0, dim=1)
    return has_positive.float()

`warprec.evaluation.metrics.base_metric.RatingMetric` ¶

Bases: BaseMetric

The definition of Rating Metric.

Attributes:

Name	Type	Description
`error_sum`	`Tensor`	The tensor to store per-user error sum.
`total_count`	`Tensor`	The tensor to store per-user count of ratings.

Parameters:

Name	Type	Description	Default
`num_users`	`int`	Number of users in the training set.	required
`dist_sync_on_step`	`bool`	Torchmetrics parameter.	`False`
`**kwargs`	`Any`	Additional keyword arguments to pass to the parent class.	`{}`

Source code in warprec/evaluation/metrics/base_metric.py

class RatingMetric(BaseMetric):
    """Base class for rating metrics accumulated per user.

    Subclasses supply the element-wise error through
    ``_compute_element_error``; this class accumulates it per user and
    averages it over the number of rated entries.

    Attributes:
        error_sum (Tensor): The tensor to store per-user error sum.
        total_count (Tensor): The tensor to store per-user count of ratings.

    Args:
        num_users (int): Number of users in the training set.
        dist_sync_on_step (bool): Torchmetrics parameter.
        **kwargs (Any): Additional keyword arguments. They are accepted
            but not forwarded by this constructor.
    """

    error_sum: Tensor
    total_count: Tensor

    def __init__(
        self,
        num_users: int,
        dist_sync_on_step: bool = False,
        **kwargs: Any,
    ):
        super().__init__(dist_sync_on_step=dist_sync_on_step)
        # One zero-initialised, sum-reduced slot per user for each state:
        # the accumulated error and the number of rated entries.
        for state_name in ("error_sum", "total_count"):
            self.add_state(
                state_name, default=torch.zeros(num_users), dist_reduce_fx="sum"
            )

    @abstractmethod
    def _compute_element_error(self, preds: Tensor, target: Tensor) -> Tensor:
        """Computes the error between predictions and target."""
        pass

    def update(self, preds: Tensor, user_indices: Tensor, **kwargs: Any):
        """Accumulate the batch errors into the per-user states.

        The ground truth is read from the ``ground`` keyword argument and
        defaults to zeros shaped like ``preds``.
        """
        ground_truth = kwargs.get("ground", torch.zeros_like(preds))

        # Only strictly positive targets count as rated entries
        rated = ground_truth > 0

        # Element-wise error, zeroed on the unrated entries
        masked_errors = self._compute_element_error(preds, ground_truth) * rated.float()

        # Scatter-add the row totals to the users of this batch
        per_user_error = masked_errors.sum(dim=1)
        per_user_count = rated.sum(dim=1).float()
        self.error_sum.index_add_(0, user_indices, per_user_error)
        self.total_count.index_add_(0, user_indices, per_user_count)

    def compute(self):
        """Return the per-user mean error, with nan for users without ratings."""
        counts = self.total_count
        per_user = self.error_sum / counts
        per_user.masked_fill_(counts == 0, float("nan"))
        return {self.name: per_user}

`compute()` ¶

Computes the final metric value.

Source code in warprec/evaluation/metrics/base_metric.py

def compute(self):
    """Return the per-user mean error, with nan for users without ratings."""
    counts = self.total_count
    per_user = self.error_sum / counts
    # Users that never received a rating have no defined value
    per_user.masked_fill_(counts == 0, float("nan"))
    return {self.name: per_user}

`update(preds, user_indices, **kwargs)` ¶

Unified update logic using index_add_.

Source code in warprec/evaluation/metrics/base_metric.py

def update(self, preds: Tensor, user_indices: Tensor, **kwargs: Any):
    """Accumulate the batch errors into the per-user states.

    The ground truth is read from the ``ground`` keyword argument and
    defaults to zeros shaped like ``preds``.
    """
    ground_truth = kwargs.get("ground", torch.zeros_like(preds))

    # Only strictly positive targets count as rated entries
    rated = ground_truth > 0

    # Element-wise error, zeroed on the unrated entries
    masked_errors = self._compute_element_error(preds, ground_truth) * rated.float()

    # Scatter-add the row totals to the users of this batch
    per_user_error = masked_errors.sum(dim=1)
    per_user_count = rated.sum(dim=1).float()
    self.error_sum.index_add_(0, user_indices, per_user_error)
    self.total_count.index_add_(0, user_indices, per_user_count)

`warprec.evaluation.metrics.base_metric.TopKMetric` ¶

Bases: BaseMetric

The definition of a Top-K metric.

Attributes:

Name	Type	Description
`k`	`int`	The cutoff value.

Parameters:

Name	Type	Description	Default
`k`	`int`	The cutoff for recommendations.	required
`dist_sync_on_step`	`bool`	Torchmetrics parameter.	`False`
`**kwargs`	`Any`	Additional keyword arguments to pass to the parent class.	`{}`

Source code in warprec/evaluation/metrics/base_metric.py

class TopKMetric(BaseMetric):
    """Base class for metrics evaluated at a cutoff ``k``.

    Attributes:
        k (int): The cutoff value.

    Args:
        k (int): The cutoff for recommendations.
        dist_sync_on_step (bool): Torchmetrics parameter.
        **kwargs (Any): Additional keyword arguments. They are accepted
            but not forwarded by this constructor.
    """

    k: int

    def __init__(
        self,
        k: int,
        dist_sync_on_step: bool = False,
        **kwargs: Any,
    ):
        super().__init__(dist_sync_on_step=dist_sync_on_step)
        self.k = k

    def dcg(self, rel: Tensor) -> Tensor:
        """Compute the Discounted Cumulative Gain of each row.

        Args:
            rel (Tensor): The relevance tensor.

        Returns:
            Tensor: The sum over dim 1 of ``rel`` divided by the log2
                discount of each position (log2(2), log2(3), ...).
        """
        positions = torch.arange(2, rel.size(1) + 2, device=rel.device)
        discounts = torch.log2(positions)
        return torch.sum(rel / discounts, dim=1)

    def discounted_sum(self, k: int) -> Tensor:
        """Sum the log2 discounts of the first k positions.

        Args:
            k (int): The length of the tensor to discount.

        Returns:
            Tensor: The sum of the discounts for k values.
        """
        discounts = torch.log2(torch.arange(k).float() + 2)
        return (1.0 / discounts).sum()

    def remap_indices(self, top_k_indices: Tensor, item_indices: Tensor) -> Tensor:
        """Remap local batch indices to global item IDs if item_indices is provided.

        Args:
            top_k_indices (Tensor): The top k indices tensor.
            item_indices (Tensor): The global item indices tensor.

        Returns:
            Tensor: The remapped top k indices tensor, or
                ``top_k_indices`` unchanged when ``item_indices`` is None.
        """
        if item_indices is None:
            return top_k_indices
        return item_indices.gather(1, top_k_indices)

`dcg(rel)` ¶

The Discounted Cumulative Gain definition.

Parameters:

Name	Type	Description	Default
`rel`	`Tensor`	The relevance tensor.	required

Returns:

Name	Type	Description
`Tensor`	`Tensor`	The discounted tensor.

Source code in warprec/evaluation/metrics/base_metric.py

def dcg(self, rel: Tensor) -> Tensor:
    """Compute the Discounted Cumulative Gain of each row.

    Args:
        rel (Tensor): The relevance tensor.

    Returns:
        Tensor: The sum over dim 1 of ``rel`` divided by the log2
            discount of each position (log2(2), log2(3), ...).
    """
    positions = torch.arange(2, rel.size(1) + 2, device=rel.device)
    discounts = torch.log2(positions)
    return torch.sum(rel / discounts, dim=1)

`discounted_sum(k)` ¶

Computes the discounted sum for k values.

Parameters:

Name	Type	Description	Default
`k`	`int`	The length of the tensor to discount.	required

Returns:

Name	Type	Description
`Tensor`	`Tensor`	The sum of the discounts for k values.

Source code in warprec/evaluation/metrics/base_metric.py

def discounted_sum(self, k: int) -> Tensor:
    """Sum the log2 discounts of the first k positions.

    Args:
        k (int): The length of the tensor to discount.

    Returns:
        Tensor: The sum of the discounts for k values.
    """
    discounts = torch.log2(torch.arange(k).float() + 2)
    return (1.0 / discounts).sum()

`remap_indices(top_k_indices, item_indices)` ¶

Remap local batch indices to global item IDs if item_indices is provided.

Parameters:

Name	Type	Description	Default
`top_k_indices`	`Tensor`	The top k indices tensor.	required
`item_indices`	`Tensor`	The global item indices tensor.	required

Returns:

Name	Type	Description
`Tensor`	`Tensor`	The remapped top k indices tensor.

Source code in warprec/evaluation/metrics/base_metric.py

def remap_indices(self, top_k_indices: Tensor, item_indices: Tensor) -> Tensor:
    """Remap local batch indices to global item IDs if item_indices is provided.

    Args:
        top_k_indices (Tensor): The top k indices tensor.
        item_indices (Tensor): The global item indices tensor.

    Returns:
        Tensor: The remapped top k indices tensor, or ``top_k_indices``
            unchanged when ``item_indices`` is None.
    """
    if item_indices is None:
        return top_k_indices
    return item_indices.gather(1, top_k_indices)

`warprec.evaluation.metrics.base_metric.UserAverageTopKMetric` ¶

Bases: TopKMetric

The definition of a User Average Top-K metric.

Attributes:

Name	Type	Description
`scores`	`Tensor`	The tensor to store metric values.
`user_interactions`	`Tensor`	The tensor to store number of interactions per user.

Parameters:

Name	Type	Description	Default
`k`	`int`	The cutoff.	required
`num_users`	`int`	Number of users in the training set.	required
`*args`	`Any`	The argument list.	`()`
`dist_sync_on_step`	`bool`	Torchmetrics parameter.	`False`
`**kwargs`	`Any`	Additional keyword arguments to pass to the parent class.	`{}`

Source code in warprec/evaluation/metrics/base_metric.py

class UserAverageTopKMetric(TopKMetric):
    """The definition of a User Average Top-K metric.

    Subclasses implement ``compute_scores``; this class accumulates the
    returned per-user values and normalizes them in ``compute``.

    Attributes:
        scores (Tensor): The tensor to store metric values.
        user_interactions (Tensor): The tensor to store number of interactions per user.

    Args:
        k (int): The cutoff.
        num_users (int): Number of users in the training set.
        *args (Any): The argument list.
        dist_sync_on_step (bool): Torchmetrics parameter.
        **kwargs (Any): Additional keyword arguments. They are accepted
            but not forwarded by this constructor.
    """

    scores: Tensor
    user_interactions: Tensor

    def __init__(
        self,
        k: int,
        num_users: int,
        *args: Any,
        dist_sync_on_step: bool = False,
        **kwargs: Any,
    ):
        super().__init__(k=k, dist_sync_on_step=dist_sync_on_step)
        self.add_state(
            "scores", default=torch.zeros(num_users), dist_reduce_fx="sum"
        )  # Initialize a tensor to store metric value for each user
        self.add_state(
            "user_interactions", default=torch.zeros(num_users), dist_reduce_fx="sum"
        )  # Initialize a tensor to store number of interactions per user

    def unpack_inputs(
        self, preds: Tensor, **kwargs: Any
    ) -> Tuple[Tensor, Tensor, Tensor]:
        """Default unpacking method used by most metrics.

        Retrieves the binary relevance, valid users and top-k binary relevance.
        Each value is taken from ``kwargs`` when its key is present and is
        computed only when the key is missing, so supplied pre-computed
        tensors are never recomputed.

        Args:
            preds (Tensor): The prediction tensor.
            **kwargs (Any): The keyword argument dictionary. Recognised
                keys: ``binary_relevance``, ``valid_users`` and
                ``top_{k}_binary_relevance``.

        Returns:
            Tuple[Tensor, Tensor, Tensor]:
                - Tensor: The target tensor.
                - Tensor: The valid users tensor.
                - Tensor: The top-k relevance tensor.
        """
        # Fallbacks are built lazily: dict.get(key, default) would evaluate
        # the default (including a full top-k) even when the key is present.
        if "binary_relevance" in kwargs:
            target = kwargs["binary_relevance"]
        else:
            target = torch.zeros_like(preds)

        if "valid_users" in kwargs:
            users = kwargs["valid_users"]
        else:
            users = self.valid_users(target)

        top_k_key = f"top_{self.k}_binary_relevance"
        if top_k_key in kwargs:
            top_k_rel = kwargs[top_k_key]
        else:
            top_k_rel = self.top_k_relevance(preds, target, self.k)

        return target, users, top_k_rel

    @abstractmethod
    def compute_scores(
        self, preds: Tensor, target: Tensor, top_k_rel: Tensor, **kwargs: Any
    ) -> Tensor:
        """Math formula for the specific metric.

        Metrics must implement this method.

        Args:
            preds (Tensor): The prediction tensor.
            target (Tensor): The target tensor.
            top_k_rel (Tensor): The top-k relevance tensor.
            **kwargs (Any): The keyword argument dictionary.

        Returns:
            Tensor: The computed metric values per user.
        """
        pass

    def update(self, preds: Tensor, user_indices: Tensor, **kwargs: Any):
        """Unified update logic.

        Computes the batch scores, zeroes them for users flagged as not
        valid and adds them to the per-user state at ``user_indices``.
        """
        target, users, top_k_data = self.unpack_inputs(preds, **kwargs)
        batch_scores = self.compute_scores(preds, target, top_k_data, **kwargs)

        # Safety masking
        batch_scores = torch.where(
            users > 0, batch_scores, torch.tensor(0.0, device=preds.device)
        )

        # Accumulate per user
        self.scores.index_add_(0, user_indices, batch_scores)
        self.user_interactions.index_add_(0, user_indices, users)

    def compute(self):
        """Computes the final metric value.

        Returns a dictionary mapping the metric name to the per-user
        scores, with nan for users that accumulated no interactions.
        """
        scores = self.scores / self.user_interactions  # Normalize the metric score
        scores[self.user_interactions == 0] = float(
            "nan"
        )  # Set nan for users with no interactions
        return {self.name: scores}

`compute()` ¶

Computes the final metric value.

Source code in warprec/evaluation/metrics/base_metric.py

def compute(self):
    """Computes the final metric value.

    Divides the accumulated scores by the accumulated valid-user counts
    and reports ``nan`` for every position whose count is zero.

    Returns:
        A dictionary with a single entry, keyed by ``self.name``, holding
        the normalized score tensor.
    """
    never_valid = self.user_interactions == 0
    averaged = self.scores / self.user_interactions
    # Positions that never received a valid interaction are reported as nan.
    averaged = averaged.masked_fill(never_valid, float("nan"))
    return {self.name: averaged}

`compute_scores(preds, target, top_k_rel, **kwargs)` `abstractmethod` ¶

Math formula for the specific metric.

Metrics must implement this method.

Parameters:

Name	Type	Description	Default
`preds`	`Tensor`	The prediction tensor.	required
`target`	`Tensor`	The target tensor.	required
`top_k_rel`	`Tensor`	The top-k relevance tensor.	required
`**kwargs`	`Any`	The keyword argument dictionary.	`{}`

Returns:

Name	Type	Description
`Tensor`	`Tensor`	The computed metric values per user.

Source code in warprec/evaluation/metrics/base_metric.py

@abstractmethod
def compute_scores(
    self, preds: Tensor, target: Tensor, top_k_rel: Tensor, **kwargs: Any
) -> Tensor:
    """Math formula for the specific metric.

    Metrics must implement this method. ``update`` calls it once per
    batch with the tensors returned by ``unpack_inputs``, replaces the
    result with zero wherever the valid-users tensor is not positive,
    and accumulates it into ``self.scores`` with ``index_add_`` along
    dimension 0.

    Args:
        preds (Tensor): The prediction tensor.
        target (Tensor): The target tensor.
        top_k_rel (Tensor): The top-k relevance tensor.
        **kwargs (Any): The keyword argument dictionary, forwarded
            unchanged from ``update``.

    Returns:
        Tensor: The computed metric values per user (presumably one
            entry per batch row, aligned with the ``user_indices``
            passed to ``update`` -- TODO confirm against the concrete
            metrics).
    """
    pass

`unpack_inputs(preds, **kwargs)` ¶

Default unpacking method used by most metrics.

Retrieves the binary relevance, valid users and top-k binary relevance.

Parameters:

Name	Type	Description	Default
`preds`	`Tensor`	The prediction tensor.	required
`**kwargs`	`Any`	The keyword argument dictionary.	`{}`

Returns:

Type	Description
`Tuple[Tensor, Tensor, Tensor]`	A tuple of three tensors, in order: the target tensor, the valid users tensor, and the top-k relevance tensor.

Source code in warprec/evaluation/metrics/base_metric.py

def unpack_inputs(
    self, preds: Tensor, **kwargs: Any
) -> Tuple[Tensor, Tensor, Tensor]:
    """Default unpacking method used by most metrics.

    Retrieves the binary relevance, valid users and top-k binary relevance.
    Each value is read from ``kwargs`` when its key is present; a fallback
    is computed only when the key is missing, so callers that pass the
    pre-computed tensors do not pay for the fallback computation.

    Args:
        preds (Tensor): The prediction tensor.
        **kwargs (Any): The keyword argument dictionary. The keys read
            here are ``binary_relevance``, ``valid_users`` and
            ``top_{k}_binary_relevance`` with ``k`` equal to ``self.k``.

    Returns:
        Tuple[Tensor, Tensor, Tensor]:
            - Tensor: The target tensor.
            - Tensor: The valid users tensor.
            - Tensor: The top-k relevance tensor.
    """
    # dict.get() evaluates its default argument eagerly, which would run
    # every fallback (including the top-k selection) even when the value
    # was supplied. Membership checks keep the fallbacks lazy.
    if "binary_relevance" in kwargs:
        target = kwargs["binary_relevance"]
    else:
        # No relevance supplied: fall back to an all-zero target.
        target = torch.zeros_like(preds)

    if "valid_users" in kwargs:
        users = kwargs["valid_users"]
    else:
        users = self.valid_users(target)

    top_k_key = f"top_{self.k}_binary_relevance"
    if top_k_key in kwargs:
        top_k_rel = kwargs[top_k_key]
    else:
        top_k_rel = self.top_k_relevance(preds, target, self.k)

    return target, users, top_k_rel

`update(preds, user_indices, **kwargs)` ¶

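Unified update logic: unpacks the inputs, computes the batch scores, sets the score of every non-valid user to zero, and accumulates both the scores and the valid-user flags at the given user indices.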

Source code in warprec/evaluation/metrics/base_metric.py

def update(self, preds: Tensor, user_indices: Tensor, **kwargs: Any):
    """Accumulate one batch of per-user scores into the metric state.

    The batch is unpacked with ``unpack_inputs``, scored with
    ``compute_scores``, masked so that users whose valid-users entry is
    not positive contribute a score of zero, and finally added to the
    running ``scores`` / ``user_interactions`` accumulators.

    Args:
        preds (Tensor): The prediction tensor.
        user_indices (Tensor): Positions (along dimension 0 of the
            accumulators) that the batch entries are added to.
        **kwargs (Any): The keyword argument dictionary, forwarded to
            ``unpack_inputs`` and ``compute_scores``.
    """
    relevance, valid_mask, top_k_rel = self.unpack_inputs(preds, **kwargs)
    raw_scores = self.compute_scores(preds, relevance, top_k_rel, **kwargs)

    # Users that are not valid must contribute exactly zero, whatever
    # (possibly non-finite) value the metric formula produced for them.
    zero = torch.tensor(0.0, device=preds.device)
    is_valid = valid_mask > 0
    masked_scores = torch.where(is_valid, raw_scores, zero)

    # Scatter-add the batch into the per-user accumulators.
    self.scores.index_add_(0, user_indices, masked_scores)
    self.user_interactions.index_add_(0, user_indices, valid_mask)

Metric Interfaces - API Reference¶

warprec.evaluation.metrics.base_metric.BaseMetric ¶

components property ¶

name property ¶

binary_relevance(target) classmethod ¶

compute_area_stats(preds, target, num_items, k=None) ¶

compute_head_tail(item_interactions, pop_ratio=0.8) ¶

compute_novelty_profile(item_interactions, num_users, log_discount=False) ¶

compute_popularity(item_interactions) ¶

discounted_relevance(target) classmethod ¶

top_k_relevance(preds, target, k) classmethod ¶

top_k_relevance_from_indices(target, top_k_indices) classmethod ¶

top_k_values_indices(preds, k) classmethod ¶

valid_users(target) classmethod ¶

warprec.evaluation.metrics.base_metric.RatingMetric ¶

compute() ¶

update(preds, user_indices, **kwargs) ¶

warprec.evaluation.metrics.base_metric.TopKMetric ¶

dcg(rel) ¶

discounted_sum(k) ¶

remap_indices(top_k_indices, item_indices) ¶

warprec.evaluation.metrics.base_metric.UserAverageTopKMetric ¶

compute() ¶

compute_scores(preds, target, top_k_rel, **kwargs) abstractmethod ¶

unpack_inputs(preds, **kwargs) ¶

update(preds, user_indices, **kwargs) ¶

`warprec.evaluation.metrics.base_metric.BaseMetric` ¶

`components` `property` ¶

`name` `property` ¶

`binary_relevance(target)` `classmethod` ¶

`compute_area_stats(preds, target, num_items, k=None)` ¶

`compute_head_tail(item_interactions, pop_ratio=0.8)` ¶

`compute_novelty_profile(item_interactions, num_users, log_discount=False)` ¶

`compute_popularity(item_interactions)` ¶

`discounted_relevance(target)` `classmethod` ¶

`top_k_relevance(preds, target, k)` `classmethod` ¶

`top_k_relevance_from_indices(target, top_k_indices)` `classmethod` ¶

`top_k_values_indices(preds, k)` `classmethod` ¶

`valid_users(target)` `classmethod` ¶

`warprec.evaluation.metrics.base_metric.RatingMetric` ¶

`compute()` ¶

`update(preds, user_indices, **kwargs)` ¶

`warprec.evaluation.metrics.base_metric.TopKMetric` ¶

`dcg(rel)` ¶

`discounted_sum(k)` ¶

`remap_indices(top_k_indices, item_indices)` ¶

`warprec.evaluation.metrics.base_metric.UserAverageTopKMetric` ¶

`compute()` ¶

`compute_scores(preds, target, top_k_rel, **kwargs)` `abstractmethod` ¶

`unpack_inputs(preds, **kwargs)` ¶

`update(preds, user_indices, **kwargs)` ¶