Source code for transformers4rec.tf.ranking_metric

#
# Copyright (c) 2021, NVIDIA CORPORATION.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

# Adapted from source code: https://github.com/karlhigley/ranking-metrics-torch
from abc import abstractmethod

import tensorflow as tf

from merlin_standard_lib import Registry

from .utils import tf_utils

ranking_metrics_registry = Registry.class_registry("tf.ranking_metrics")

METRIC_PARAMETERS_DOCSTRING = """
    ks : tf.Tensor
        tensor of cutoffs.
    scores : tf.Tensor
        scores of predicted item-ids.
    labels : tf.Tensor
        true item-ids labels.
"""


class RankingMetric(tf.keras.metrics.Metric):
    """
    Metric wrapper for computing ranking metrics@K for session-based tasks.

    Parameters
    ----------
    top_ks : list, default [2, 5]
        list of cutoffs
    labels_onehot : bool
        If enabled, transform the encoded labels into a one-hot representation
    """

    def __init__(self, name=None, dtype=None, top_ks=[2, 5], labels_onehot=False, **kwargs):
        super(RankingMetric, self).__init__(name=name, **kwargs)
        self.top_ks = top_ks
        self.labels_onehot = labels_onehot
        # Store the mean vector of the batch metrics (for each cut-off at topk) in a ListWrapper
        self.metric_mean = []

    def update_state(self, y_true: tf.Tensor, y_pred: tf.Tensor, **kwargs):
        # Compute the metrics at the different cut-offs
        if self.labels_onehot:
            y_true = tf_utils.tranform_label_to_onehot(y_true, y_pred.shape[-1])
        metric = self._metric(
            tf.convert_to_tensor(self.top_ks),
            tf.reshape(y_pred, [-1, y_pred.shape[-1]]),
            y_true,
        )
        self.metric_mean.append(metric)

    def result(self):
        # Compute the mean of the batch metrics (for each cut-off at topk)
        return tf.reduce_mean(tf.concat(self.metric_mean, axis=0), axis=0)

    def reset_state(self):
        self.metric_mean = []

    @abstractmethod
    def _metric(self, ks: tf.Tensor, preds: tf.Tensor, target: tf.Tensor) -> tf.Tensor:
        """
        Compute a ranking metric over the predictions and one-hot targets for different cut-offs.
        This method should be overridden by subclasses.

        Parameters
        ----------
        {METRIC_PARAMETERS_DOCSTRING}
        """
        raise NotImplementedError
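

# Illustrative note (not part of the original module): a concrete subclass such as
# PrecisionAt below behaves like any other Keras metric. Every update_state() call appends
# one (batch_size, len(top_ks)) tensor to self.metric_mean, result() averages all
# accumulated rows per cut-off, and reset_state() clears the accumulator, e.g.
#
#     metric = PrecisionAt(top_ks=[2, 5])
#     metric.update_state(one_hot_labels, predicted_scores)  # hypothetical tensors
#     metric.result()       # -> shape (2,): mean precision@2 and precision@5
#     metric.reset_state()  # start accumulating from scratch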
[docs]@ranking_metrics_registry.register_with_multiple_names("precision_at", "precision") class PrecisionAt(RankingMetric): def __init__(self, top_ks=None, labels_onehot=False): super(PrecisionAt, self).__init__(top_ks=top_ks, labels_onehot=labels_onehot) def _metric(self, ks: tf.Tensor, scores: tf.Tensor, labels: tf.Tensor) -> tf.Tensor: """ Compute precision@K for each provided cutoff in ks Parameters ---------- {METRIC_PARAMETERS_DOCSTRING} """ ks, scores, labels = check_inputs(ks, scores, labels) _, _, topk_labels = tf_utils.extract_topk(ks, scores, labels) precisions = tf_utils.create_output_placeholder(scores, ks) for index, k in enumerate(ks): precisions[:, index].assign(tf.reduce_sum(topk_labels[:, : int(k)], axis=1) / float(k)) return precisions
[docs]@ranking_metrics_registry.register_with_multiple_names("recall_at", "recall") class RecallAt(RankingMetric): def __init__(self, top_ks=None, labels_onehot=False): super(RecallAt, self).__init__(top_ks=top_ks, labels_onehot=labels_onehot) def _metric(self, ks: tf.Tensor, scores: tf.Tensor, labels: tf.Tensor) -> tf.Tensor: """ Compute recall@K for each provided cutoff in ks Parameters ---------- {METRIC_PARAMETERS_DOCSTRING} """ ks, scores, labels = check_inputs(ks, scores, labels) _, _, topk_labels = tf_utils.extract_topk(ks, scores, labels) recalls = tf_utils.create_output_placeholder(scores, ks) # Compute recalls at K num_relevant = tf.reduce_sum(labels, axis=-1) rel_indices = tf.where(num_relevant != 0) rel_count = tf.gather_nd(num_relevant, rel_indices) if rel_indices.shape[0] > 0: for index, k in enumerate(ks): rel_labels = tf.cast( tf.gather_nd(topk_labels, rel_indices)[:, : int(k)], tf.float32 ) batch_recall_k = tf.cast( tf.reshape( tf.math.divide(tf.reduce_sum(rel_labels, axis=-1), rel_count), (len(rel_indices), 1), ), tf.float32, ) # Ensuring type is double, because it can be float if --fp16 update_indices = tf.concat( [ rel_indices, tf.expand_dims(index * tf.ones(rel_indices.shape[0], tf.int64), -1), ], axis=1, ) recalls = tf.tensor_scatter_nd_update( recalls, indices=update_indices, updates=tf.reshape(batch_recall_k, -1) ) return recalls
[docs]@ranking_metrics_registry.register_with_multiple_names("avg_precision_at", "avg_precision", "map") class AvgPrecisionAt(RankingMetric): def __init__(self, top_ks=None, labels_onehot=False): super(AvgPrecisionAt, self).__init__(top_ks=top_ks, labels_onehot=labels_onehot) self.precision_at = PrecisionAt(top_ks)._metric def _metric(self, ks: tf.Tensor, scores: tf.Tensor, labels: tf.Tensor) -> tf.Tensor: """ Compute average precision @K for provided cutoff in ks Parameters ---------- {METRIC_PARAMETERS_DOCSTRING} """ ks, scores, labels = check_inputs(ks, scores, labels) topk_scores, _, topk_labels = tf_utils.extract_topk(ks, scores, labels) avg_precisions = tf_utils.create_output_placeholder(scores, ks) num_relevant = tf.reduce_sum(labels, axis=-1) max_k = tf.reduce_max(ks) precisions = self.precision_at(1 + tf.range(max_k), topk_scores, topk_labels) rel_precisions = precisions * topk_labels for index, k in enumerate(ks): tf_total_prec = tf.reduce_sum(rel_precisions[:, :k], axis=1) clip_value = tf.clip_by_value( num_relevant, clip_value_min=1, clip_value_max=tf.cast(k, tf.float32) ) avg_precisions[:, index].assign(tf_total_prec / clip_value) # Ensuring type is double, because it can be float if --fp16 return avg_precisions
[docs]@ranking_metrics_registry.register_with_multiple_names("dcg_at", "dcg") class DCGAt(RankingMetric): def __init__(self, top_ks=None, labels_onehot=False): super(DCGAt, self).__init__(top_ks=top_ks, labels_onehot=labels_onehot) def _metric( self, ks: tf.Tensor, scores: tf.Tensor, labels: tf.Tensor, log_base: int = 2 ) -> tf.Tensor: """ Compute discounted cumulative gain @K for each provided cutoff in ks (ignoring ties) Parameters ---------- {METRIC_PARAMETERS_DOCSTRING} """ ks, scores, labels = check_inputs(ks, scores, labels) _, _, topk_labels = tf_utils.extract_topk(ks, scores, labels) dcgs = tf_utils.create_output_placeholder(scores, ks) # Compute discounts max_k = tf.reduce_max(ks) discount_positions = tf.cast(tf.range(max_k), tf.float32) discount_log_base = tf.math.log(tf.convert_to_tensor([log_base], dtype=tf.float32)) discounts = 1 / (tf.math.log(discount_positions + 2) / discount_log_base) # Compute DCGs at K for index, k in enumerate(ks): m = topk_labels[:, :k] * tf.repeat( tf.expand_dims(discounts[:k], 0), topk_labels.shape[0], axis=0 ) dcgs[:, index].assign(tf.cast(tf.reduce_sum(m, axis=1), tf.float32)) # Ensuring type is double, because it can be float if --fp16 return dcgs
[docs]@ranking_metrics_registry.register_with_multiple_names("ndcg_at", "ndcg") class NDCGAt(RankingMetric): def __init__(self, top_ks=None, labels_onehot=False): super(NDCGAt, self).__init__(top_ks=top_ks, labels_onehot=labels_onehot) self.dcg_at = DCGAt(top_ks)._metric def _metric( self, ks: tf.Tensor, scores: tf.Tensor, labels: tf.Tensor, log_base: int = 2 ) -> tf.Tensor: """ Compute normalized discounted cumulative gain @K for each provided cutoffs in ks (ignoring ties) Parameters ---------- {METRIC_PARAMETERS_DOCSTRING} """ ks, scores, labels = check_inputs(ks, scores, labels) topk_scores, _, topk_labels = tf_utils.extract_topk(ks, scores, labels) # Compute discounted cumulative gains gains = self.dcg_at(ks, topk_scores, topk_labels, log_base=log_base) normalizing_gains = self.dcg_at(ks, topk_labels, topk_labels, log_base=log_base) # Prevent divisions by zero relevant_pos = tf.where(normalizing_gains != 0) tf.where(normalizing_gains == 0, 0, gains) updates = tf.gather_nd(gains, relevant_pos) / tf.gather_nd(normalizing_gains, relevant_pos) gains = tf.tensor_scatter_nd_update(gains, relevant_pos, updates) return gains


def check_inputs(ks, scores, labels):
    if len(ks.shape) > 1:
        raise ValueError("ks should be a 1-dimensional tensor")

    if len(scores.shape) != 2:
        raise ValueError("scores must be a 2-dimensional tensor")

    if len(labels.shape) != 2:
        raise ValueError("labels must be a 2-dimensional tensor")

    if scores.shape != labels.shape:
        raise ValueError("scores and labels must be the same shape")

    return (
        tf.cast(ks, tf.int32),
        tf.cast(scores, tf.float32),
        tf.cast(labels, tf.float32),
    )
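

if __name__ == "__main__":
    # Illustrative usage sketch (not part of the original module), assuming eager execution.
    # Labels are passed already one-hot encoded, so the default labels_onehot=False is kept;
    # tensors follow the (batch_size, item_cardinality) layout expected by check_inputs above.
    scores = tf.constant(
        [
            [0.20, 0.90, 0.10, 0.40, 0.30, 0.05],  # relevant item (index 1) is ranked 1st
            [0.80, 0.05, 0.10, 0.02, 0.30, 0.60],  # relevant item (index 2) is ranked 4th
        ]
    )
    labels = tf.constant(
        [
            [0.0, 1.0, 0.0, 0.0, 0.0, 0.0],
            [0.0, 0.0, 1.0, 0.0, 0.0, 0.0],
        ]
    )

    ndcg = NDCGAt(top_ks=[2, 5])
    ndcg.update_state(labels, scores)
    # One value per cut-off: NDCG@2 = 0.5 and NDCG@5 ≈ 0.72 for this toy batch
    print(ndcg.result())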