Basic Attention Model

Implementation of an attention-based model for item recommendation.

`AttentionBasedContextEmbedding`

Bases: BaseBasketModel

Class for the attention-based model.

Wang, Shoujin, Liang Hu, Longbing Cao, Xiaoshui Huang, Defu Lian, and Wei Liu. "Attention-based transactional context embedding for next-item recommendation." In Proceedings of the AAAI conference on artificial intelligence, vol. 32, no. 1. 2018.

Source code in choice_learn/basket_models/basic_attention_model.py

class AttentionBasedContextEmbedding(BaseBasketModel):
    """Class for the attention-based model.

    Wang, Shoujin, Liang Hu, Longbing Cao, Xiaoshui Huang, Defu Lian,
    and Wei Liu. "Attention-based transactional context embedding for
    next-item recommendation." In Proceedings of the AAAI conference on
    artificial intelligence, vol. 32, no. 1. 2018.
    """

    def __init__(
        self,
        latent_size: int = 4,
        n_negative_samples: int = 2,
        nce_distribution="natural",
        optimizer: str = "adam",
        callbacks: Union[tf.keras.callbacks.CallbackList, None] = None,
        lr: float = 1e-3,
        epochs: int = 10,
        batch_size: int = 32,
        grad_clip_value: Union[float, None] = None,
        weight_decay: Union[float, None] = None,
        momentum: float = 0.0,
        **kwargs,
    ) -> None:
        """Store the model hyperparameters and configure the parent class.

        The embedding variables are not created here: the model is flagged
        as not instantiated until `instantiate` is called.

        Parameters
        ----------
        latent_size : int
            Size of the item embeddings. Default is 4.
        n_negative_samples : int
            Number of negative samples to use in training. Default is 2.
        nce_distribution: str
            Items distribution to be used to compute the NCE Loss
            Currently available: 'natural' to estimate the distribution
            from the train dataset and 'uniform' where all items have the
            same distribution, 1/n_items. Default is 'natural'.
        optimizer : str
            Optimizer to use for training. Default is "adam".
        callbacks : tf.keras.callbacks.CallbackList or None
            Forwarded unchanged to the parent class constructor.
        lr : float
            Learning rate for the optimizer. Default is 1e-3.
        epochs : int
            Number of training epochs. Default is 10.
        batch_size : int
            Size of the batches for training. Default is 32.
        grad_clip_value : float or None
            Forwarded unchanged to the parent class constructor.
        weight_decay : float or None
            Forwarded unchanged to the parent class constructor.
        momentum : float
            Forwarded unchanged to the parent class constructor.
        **kwargs
            Any additional keyword arguments, forwarded to the parent class
            constructor.
        """
        self.instantiated = False

        self.latent_size, self.n_negative_samples, self.nce_distribution = (
            latent_size,
            n_negative_samples,
            nce_distribution,
        )

        # Everything that is not specific to this model is handled by the parent class
        base_hyperparameters = {
            "optimizer": optimizer,
            "callbacks": callbacks,
            "lr": lr,
            "epochs": epochs,
            "batch_size": batch_size,
            "grad_clip_value": grad_clip_value,
            "weight_decay": weight_decay,
            "momentum": momentum,
        }
        super().__init__(**base_hyperparameters, **kwargs)

    def instantiate(
        self,
        n_items: int,
    ) -> None:
        """Create the trainable variables and the loss of the model.

        Four variables are created, each drawn from a normal distribution
        with standard deviation 0.1: the input item embeddings Wi and the
        output item embeddings Wo (both of shape (n_items, latent_size)),
        the attention vector wa and the embedding used for empty contexts
        (both of shape (latent_size,)).

        Parameters
        ----------
        n_items : int
            Number of unique items in the dataset.
        """
        self.n_items = n_items

        def _draw(shape):
            # Same initialiser for every variable of the model
            return tf.random.normal(shape, stddev=0.1, seed=42)

        matrix_shape = (self.n_items, self.latent_size)
        vector_shape = (self.latent_size,)

        # The draws are kept in this order: Wi, Wo, wa, empty_context_embedding
        self.Wi = tf.Variable(_draw(matrix_shape), name="Wi")
        self.Wo = tf.Variable(_draw(matrix_shape), name="Wo")
        self.wa = tf.Variable(_draw(vector_shape), name="wa")
        self.empty_context_embedding = tf.Variable(
            _draw(vector_shape), name="empty_context_embedding"
        )

        self.loss = NoiseConstrastiveEstimation()
        self.is_trained = False
        self.instantiated = True

    @property
    def trainable_weights(self):
        """Return the trainable weights of the model.

        Returns
        -------
            list
                The four trainable variables, in this order:
                Wi, wa, Wo and empty_context_embedding.
        """
        weight_names = ("Wi", "wa", "Wo", "empty_context_embedding")
        return [getattr(self, weight_name) for weight_name in weight_names]

    @property
    def train_iter_method(self) -> str:
        """Name of the method used to generate sub-baskets from a purchased one.

        Available methods are:
        - 'shopper': randomly orders the purchases and creates the ordered sub-baskets:
                        (1|0); (2|1); (3|1,2); (4|1,2,3); etc...
        - 'aleacarta': creates all the sub-baskets with N-1 items:
                        (4|1,2,3); (3|1,2,4); (2|1,3,4); (1|2,3,4)

        Returns
        -------
        str
            Data generation method; this model always uses 'aleacarta'.
        """
        generation_method = "aleacarta"
        return generation_method

    def embed_context(self, context_items: tf.Tensor) -> tf.Tensor:
        """Return the attention-weighted embedding of each context (basket).

        Each context item is embedded with Wi and scored by a dot product
        with wa; the scores are turned into attention weights by
        softmax_with_availabilities, using a mask that excludes the -1
        entries. The context embedding is the weighted sum of its item
        embeddings. Rows that contain no real item (only -1 entries) get
        the learned empty_context_embedding instead.

        Parameters
        ----------
            context_items : tf.Tensor
                [batch_size, max_context_length] integer item IDs, where -1
                is treated as padding.
                NOTE(review): this was previously documented as a
                tf.RaggedTensor; the -1 masking suggests a padded dense
                tensor -- confirm against the callers.

        Returns
        -------
            tf.Tensor
                [batch_size, latent_size] tf.Tensor
                Tensor containing the matrix of contexts embeddings.
        """
        is_padding = context_items == -1

        # Row 0 of the lookup table is all zeros, so that padding
        # (-1, shifted to index 0) gathers a null embedding.
        lookup_table = tf.concat([tf.zeros((1, self.latent_size)), self.Wi], axis=0)
        context_embedding = tf.gather(lookup_table, context_items + 1)

        e_values = tf.reduce_sum(context_embedding * self.wa, axis=-1)
        alphas = softmax_with_availabilities(
            items_logit_by_choice=e_values,
            available_items_by_choice=tf.where(is_padding, 0.0, 1.0),
        )
        final_embeddings = tf.reduce_sum(
            tf.expand_dims(alphas, axis=-1) * context_embedding, axis=1
        )

        # Detect empty contexts from the padding mask rather than by testing
        # the float embedding sum against 0.0, which could misfire on a real
        # context whose components happen to cancel out.
        has_no_item = tf.reduce_all(is_padding, axis=-1, keepdims=True)

        # tf.where broadcasts the (1, latent_size) fallback over the batch,
        # so no tiling by a Python-level batch length is needed.
        return tf.where(
            has_no_item,
            tf.expand_dims(self.empty_context_embedding, axis=0),
            final_embeddings,
        )

    def compute_batch_utility(
        self,
        item_batch: Union[np.ndarray, tf.Tensor],
        basket_batch: np.ndarray,
        store_batch: np.ndarray,
        week_batch: np.ndarray,
        price_batch: np.ndarray,
        available_item_batch: np.ndarray,
        user_batch: np.ndarray,
    ) -> tf.Tensor:
        """Compute the utility of the items in item_batch given the items in basket_batch.

        The utility of an item is the dot product between the embedding of
        the context (see `embed_context`) and the item's row of Wo.

        Parameters
        ----------
        item_batch: np.ndarray or tf.Tensor
            Batch of item IDs (integers) for which to compute the utility
            Either one item per row, shape (batch_size,), or several
            candidate items per row, shape (batch_size, n_candidates)
        basket_batch: np.ndarray
            Batch of baskets (ID of items already in the baskets) (arrays) for each purchased item
            Shape must be (batch_size, max_basket_size)
        store_batch: np.ndarray
            Batch of store IDs (integers) for each purchased item
            Unused by this model
        week_batch: np.ndarray
            Batch of week numbers (integers) for each purchased item
            Unused by this model
        price_batch: np.ndarray
            Batch of prices (floats) for each purchased item
            Unused by this model
        available_item_batch: np.ndarray
            Batch of availability matrices (indicating the availability (1) or not (0)
            of the products) (arrays) for each purchased item
            Unused by this model
        user_batch: np.ndarray
            Unused by this model

        Returns
        -------
        item_utilities: tf.Tensor
            Utility of all the items in item_batch
            Shape is (batch_size,) for a 1D item_batch,
            (batch_size, n_candidates) otherwise
        """
        # Arguments only present for signature compatibility
        _ = (store_batch, price_batch, week_batch, available_item_batch, user_batch)

        # A 1D batch is temporarily given a candidate axis of length one
        single_item_per_row = len(tf.shape(item_batch)) == 1
        if single_item_per_row:
            item_batch = tf.expand_dims(item_batch, axis=1)

        context_embedding = self.embed_context(basket_batch)
        item_embeddings = tf.gather(self.Wo, tf.cast(item_batch, tf.int32))

        # k: row of the batch, l: candidate item, j: latent dimension
        utilities = tf.einsum("kj,klj->kl", context_embedding, item_embeddings)

        # Drop the candidate axis that was added for 1D inputs
        return tf.gather(utilities, 0, axis=1) if single_item_per_row else utilities

    def get_negative_samples(
        self,
        available_items: np.ndarray,
        purchased_items: np.ndarray,
        next_item: int,
        n_samples: int,
    ) -> list[int]:
        """Draw random negative items for one (basket, next item) pair.

        Candidates are the available items that are neither in the basket
        nor equal to the next item; they are shuffled and the first
        n_samples are kept.

        Parameters
        ----------
        available_items: np.ndarray
            Matrix indicating the availability (1) or not (0) of the products
            Shape must be (n_items,)
        purchased_items: np.ndarray
            List of items already purchased (already in the basket)
        next_item: int
            Next item (to be added in the basket)
        n_samples: int
            Number of samples to draw

        Returns
        -------
        list[int]
            Random sample of items (returned as a 1D int32 tensor slice),
            each of them distinct from the next item and from the items
            already in the basket

        Raises
        ------
        tf.errors.InvalidArgumentError
            Raised by tf.debugging.assert_greater_equal when fewer than
            n_samples candidates are left.
        """

        def _as_int32(value):
            return tf.cast(tf.convert_to_tensor(value), dtype=tf.int32)

        availability = _as_int32(available_items)
        basket = _as_int32(purchased_items)
        target = _as_int32(next_item)

        # IDs of the items flagged as available
        assortment = tf.boolean_mask(tf.range(self.n_items), tf.equal(availability, 1))

        # Items that can never be drawn: the basket content and the next item
        excluded = tf.concat([basket, tf.expand_dims(target, axis=0)], axis=0)

        # Compare every assortment item with every excluded item, then keep
        # the assortment items that differ from all of them
        is_candidate = tf.reduce_all(
            tf.not_equal(tf.expand_dims(assortment, axis=1), excluded), axis=1
        )
        candidates = tf.boolean_mask(tensor=assortment, mask=is_candidate)

        # Fail when there are fewer candidates than requested samples
        tf.debugging.assert_greater_equal(
            tf.size(candidates),
            n_samples,
            message=(
                "The number of negative samples to draw must be less than "
                "the number of available items not already purchased and "
                "distinct from the next item."
            ),
        )

        # Shuffle, then keep only the first n_samples
        return tf.random.shuffle(candidates)[:n_samples]

    def _get_items_frequencies(self, dataset: TripDataset) -> tf.Tensor:
        """Compute the relative frequency of each item in the dataset.

        Every purchase of every trip is counted, then the counts are
        divided by the total number of purchases.

        Parameters
        ----------
            dataset : TripDataset
                Dataset containing the baskets.

        Returns
        -------
            tf.Tensor
                float32 tensor of length n_items containing the share of
                the purchases made on each item.
        """
        occurrences = np.zeros(self.n_items, dtype=np.int32)
        all_purchases = (item for trip in dataset.trips for item in trip.purchases)
        for item in all_purchases:
            occurrences[item] += 1

        total_purchases = occurrences.sum()
        return tf.constant(occurrences / total_purchases, dtype=tf.float32)

    def compute_batch_loss(
        self,
        item_batch: np.ndarray,
        basket_batch: np.ndarray,
        future_batch: np.ndarray,
        store_batch: np.ndarray,
        week_batch: np.ndarray,
        price_batch: np.ndarray,
        available_item_batch: np.ndarray,
        user_batch: np.ndarray,
    ) -> tuple[tf.Variable]:
        """Compute the loss for one batch of items.

        Negative items are drawn for every row of the batch, the utilities
        of the purchased and of the negative items are computed, and both
        are passed to the model loss together with the frequencies of the
        corresponding items in negative_samples_distribution.

        Parameters
        ----------
        item_batch: np.ndarray
            Batch of purchased items ID (integers)
            Shape must be (batch_size,)
        basket_batch: np.ndarray
            Batch of baskets (ID of items already in the baskets) (arrays) for each purchased item
            Shape must be (batch_size, max_basket_size)
        future_batch: np.ndarray
            Batch of items to be purchased in the future (ID of items not yet in the
            basket) (arrays) for each purchased item
            Here for signature reasons, unused for this model
        store_batch: np.ndarray
            Batch of store IDs (integers) for each purchased item
            Forwarded to compute_batch_utility
        week_batch: np.ndarray
            Batch of week numbers (integers) for each purchased item
            Forwarded to compute_batch_utility
        price_batch: np.ndarray
            Batch of prices (floats) for each purchased item
            Forwarded to compute_batch_utility
        available_item_batch: np.ndarray
            List of availability matrices (indicating the availability (1) or not (0)
            of the products) (arrays) for each purchased item
            Shape must be (batch_size, n_items)
        user_batch: np.ndarray
            Forwarded to compute_batch_utility

        Returns
        -------
        tf.Variable
            Value of the loss for the batch, as returned by the model loss
        loglikelihood: float
            Placeholder: the constant 1e-10 is always returned, no
            log-likelihood is computed here
        """
        _ = (future_batch, user_batch)

        def _negatives_for(idx):
            # Negative items for the idx-th row of the batch
            return self.get_negative_samples(
                available_items=available_item_batch[idx],
                purchased_items=basket_batch[idx],
                next_item=item_batch[idx],
                n_samples=self.n_negative_samples,
            )

        negative_samples = tf.stack(
            [_negatives_for(idx) for idx in range(len(item_batch))], axis=0
        )

        # Inputs shared by the positive and the negative utility computations
        shared_inputs = {
            "basket_batch": basket_batch,
            "store_batch": store_batch,
            "week_batch": week_batch,
            "price_batch": price_batch,
            "available_item_batch": available_item_batch,
            "user_batch": user_batch,
        }
        pos_score = self.compute_batch_utility(item_batch=item_batch, **shared_inputs)
        neg_scores = self.compute_batch_utility(item_batch=negative_samples, **shared_inputs)

        distribution = self.negative_samples_distribution
        batch_loss = self.loss(
            logit_true=pos_score,
            logit_negative=neg_scores,
            freq_true=tf.gather(distribution, tf.cast(item_batch, tf.int32)),
            freq_negative=tf.gather(distribution, tf.cast(negative_samples, tf.int32)),
        )
        return batch_loss, 1e-10

    def fit(
        self,
        trip_dataset: TripDataset,
        val_dataset: Union[TripDataset, None] = None,
        verbose: int = 0,
    ):
        """Train the model on a dataset of baskets.

        The model is instantiated from the dataset if needed, the
        distribution used by the NCE loss is set, and the training itself
        is delegated to the parent class.

        Parameters
        ----------
            trip_dataset : TripDataset
                Dataset of baskets to train the model on.
            val_dataset : TripDataset or None
                Forwarded unchanged to the parent class `fit`.
            verbose : int
                Forwarded unchanged to the parent class `fit`.

        Returns
        -------
            The value returned by the parent class `fit` (training history).

        Raises
        ------
            TypeError
                If trip_dataset is not a TripDataset.
            ValueError
                If the largest basket plus the number of negative samples
                exceeds the number of items.
        """
        # Check the type first: everything below reads TripDataset attributes,
        # so a wrong type would otherwise fail with an AttributeError.
        if not isinstance(trip_dataset, TripDataset):
            raise TypeError("Dataset must be a TripDataset.")

        if not self.instantiated:
            self.instantiate(n_items=trip_dataset.n_items)

        # Negative samples are drawn outside of the basket, so the largest
        # basket must leave enough items to sample from.
        largest_basket_size = max(len(trip.purchases) for trip in trip_dataset.trips)
        if largest_basket_size + self.n_negative_samples > self.n_items:
            raise ValueError(
                "The number of items in the dataset is less than the number of negative samples."
            )

        if self.nce_distribution == "natural":
            self.negative_samples_distribution = self._get_items_frequencies(trip_dataset)
        else:
            # Any other value falls back to the uniform distribution 1/n_items
            self.negative_samples_distribution = np.full(
                (trip_dataset.n_items,), 1 / trip_dataset.n_items, dtype="float32"
            )

        history = super().fit(trip_dataset=trip_dataset, val_dataset=val_dataset, verbose=verbose)

        self.is_trained = True

        return history

`train_iter_method: str` `property`

Method used to generate sub-baskets from a purchased one.

Available methods are:

- 'shopper': randomly orders the purchases and creates the ordered sub-baskets: (1|0); (2|1); (3|1,2); (4|1,2,3); etc...
- 'aleacarta': creates all the sub-baskets with N-1 items: (4|1,2,3); (3|1,2,4); (2|1,3,4); (1|2,3,4)

Returns:

Type	Description
`str`	Data generation method.

`trainable_weights` `property`

Return the trainable weights of the model.

Returns:

Type	Description
`list`	List of trainable weights (Wi, wa, Wo, empty_context_embedding).

`__init__(latent_size=4, n_negative_samples=2, nce_distribution='natural', optimizer='adam', callbacks=None, lr=0.001, epochs=10, batch_size=32, grad_clip_value=None, weight_decay=None, momentum=0.0, **kwargs)`

Initialize the model with hyperparameters.

Parameters:

Name	Type	Description	Default
`epochs`	`int`	Number of training epochs.	`10`
`lr`	`float`	Learning rate for the optimizer.	`0.001`
`latent_size`	`int`	Size of the item embeddings.	`4`
`n_negative_samples`	`int`	Number of negative samples to use in training.	`2`
`batch_size`	`int`	Size of the batches for training. Default is 32.	`32`
`optimizer`	`str`	Optimizer to use for training. Default is "Adam".	`'adam'`
`nce_distribution`	`str`	Items distribution to be used to compute the NCE loss. Currently available: 'natural' to estimate the distribution from the train dataset and 'uniform' where all items have the same distribution, 1/n_items. Default is 'natural'.	`'natural'`

Source code in choice_learn/basket_models/basic_attention_model.py

def __init__(
    self,
    latent_size: int = 4,
    n_negative_samples: int = 2,
    nce_distribution="natural",
    optimizer: str = "adam",
    callbacks: Union[tf.keras.callbacks.CallbackList, None] = None,
    lr: float = 1e-3,
    epochs: int = 10,
    batch_size: int = 32,
    grad_clip_value: Union[float, None] = None,
    weight_decay: Union[float, None] = None,
    momentum: float = 0.0,
    **kwargs,
) -> None:
    """Store the model hyperparameters and configure the parent class.

    The model is flagged as not instantiated; only hyperparameters are
    stored here.

    Parameters
    ----------
    latent_size : int
        Size of the item embeddings. Default is 4.
    n_negative_samples : int
        Number of negative samples to use in training. Default is 2.
    nce_distribution: str
        Items distribution to be used to compute the NCE Loss
        Currently available: 'natural' to estimate the distribution
        from the train dataset and 'uniform' where all items have the
        same distribution, 1/n_items. Default is 'natural'.
    optimizer : str
        Optimizer to use for training. Default is "adam".
    callbacks : tf.keras.callbacks.CallbackList or None
        Forwarded unchanged to the parent class constructor.
    lr : float
        Learning rate for the optimizer. Default is 1e-3.
    epochs : int
        Number of training epochs. Default is 10.
    batch_size : int
        Size of the batches for training. Default is 32.
    grad_clip_value : float or None
        Forwarded unchanged to the parent class constructor.
    weight_decay : float or None
        Forwarded unchanged to the parent class constructor.
    momentum : float
        Forwarded unchanged to the parent class constructor.
    **kwargs
        Any additional keyword arguments, forwarded to the parent class
        constructor.
    """
    self.instantiated = False

    self.latent_size, self.n_negative_samples, self.nce_distribution = (
        latent_size,
        n_negative_samples,
        nce_distribution,
    )

    # Everything that is not specific to this model is handled by the parent class
    base_hyperparameters = {
        "optimizer": optimizer,
        "callbacks": callbacks,
        "lr": lr,
        "epochs": epochs,
        "batch_size": batch_size,
        "grad_clip_value": grad_clip_value,
        "weight_decay": weight_decay,
        "momentum": momentum,
    }
    super().__init__(**base_hyperparameters, **kwargs)

`compute_batch_loss(item_batch, basket_batch, future_batch, store_batch, week_batch, price_batch, available_item_batch, user_batch)`

Compute log-likelihood and loss for one batch of items.

Parameters:

Name	Type	Description	Default
`item_batch`	`ndarray`	Batch of purchased items ID (integers) Shape must be (batch_size,)	required
`basket_batch`	`ndarray`	Batch of baskets (ID of items already in the baskets) (arrays) for each purchased item Shape must be (batch_size, max_basket_size)	required
`future_batch`	`ndarray`	Batch of items to be purchased in the future (ID of items not yet in the basket) (arrays) for each purchased item Shape must be (batch_size, max_basket_size) Here for signature reasons, unused for this model	required
`store_batch`	`ndarray`	Batch of store IDs (integers) for each purchased item Shape must be (batch_size,)	required
`week_batch`	`ndarray`	Batch of week numbers (integers) for each purchased item Shape must be (batch_size,)	required
`price_batch`	`ndarray`	Batch of prices (floats) for each purchased item Shape must be (batch_size,)	required
`available_item_batch`	`ndarray`	List of availability matrices (indicating the availability (1) or not (0) of the products) (arrays) for each purchased item Shape must be (batch_size, n_items)	required

Returns:

Name	Type	Description
	`Variable`	Value of the loss for the batch (binary cross-entropy), Shape must be (1,)
`loglikelihood`	`Variable`	Placeholder for the log-likelihood of the batch of items: the current implementation always returns the constant 1e-10 instead of a computed value.

Source code in choice_learn/basket_models/basic_attention_model.py

def compute_batch_loss(
    self,
    item_batch: np.ndarray,
    basket_batch: np.ndarray,
    future_batch: np.ndarray,
    store_batch: np.ndarray,
    week_batch: np.ndarray,
    price_batch: np.ndarray,
    available_item_batch: np.ndarray,
    user_batch: np.ndarray,
) -> tuple[tf.Variable]:
    """Compute the loss for one batch of items.

    Negative items are drawn for every row of the batch, the utilities
    of the purchased and of the negative items are computed, and both
    are passed to the model loss together with the frequencies of the
    corresponding items in negative_samples_distribution.

    Parameters
    ----------
    item_batch: np.ndarray
        Batch of purchased items ID (integers)
        Shape must be (batch_size,)
    basket_batch: np.ndarray
        Batch of baskets (ID of items already in the baskets) (arrays) for each purchased item
        Shape must be (batch_size, max_basket_size)
    future_batch: np.ndarray
        Batch of items to be purchased in the future (ID of items not yet in the
        basket) (arrays) for each purchased item
        Here for signature reasons, unused for this model
    store_batch: np.ndarray
        Batch of store IDs (integers) for each purchased item
        Forwarded to compute_batch_utility
    week_batch: np.ndarray
        Batch of week numbers (integers) for each purchased item
        Forwarded to compute_batch_utility
    price_batch: np.ndarray
        Batch of prices (floats) for each purchased item
        Forwarded to compute_batch_utility
    available_item_batch: np.ndarray
        List of availability matrices (indicating the availability (1) or not (0)
        of the products) (arrays) for each purchased item
        Shape must be (batch_size, n_items)
    user_batch: np.ndarray
        Forwarded to compute_batch_utility

    Returns
    -------
    tf.Variable
        Value of the loss for the batch, as returned by the model loss
    loglikelihood: float
        Placeholder: the constant 1e-10 is always returned, no
        log-likelihood is computed here
    """
    _ = (future_batch, user_batch)

    def _negatives_for(idx):
        # Negative items for the idx-th row of the batch
        return self.get_negative_samples(
            available_items=available_item_batch[idx],
            purchased_items=basket_batch[idx],
            next_item=item_batch[idx],
            n_samples=self.n_negative_samples,
        )

    negative_samples = tf.stack(
        [_negatives_for(idx) for idx in range(len(item_batch))], axis=0
    )

    # Inputs shared by the positive and the negative utility computations
    shared_inputs = {
        "basket_batch": basket_batch,
        "store_batch": store_batch,
        "week_batch": week_batch,
        "price_batch": price_batch,
        "available_item_batch": available_item_batch,
        "user_batch": user_batch,
    }
    pos_score = self.compute_batch_utility(item_batch=item_batch, **shared_inputs)
    neg_scores = self.compute_batch_utility(item_batch=negative_samples, **shared_inputs)

    distribution = self.negative_samples_distribution
    batch_loss = self.loss(
        logit_true=pos_score,
        logit_negative=neg_scores,
        freq_true=tf.gather(distribution, tf.cast(item_batch, tf.int32)),
        freq_negative=tf.gather(distribution, tf.cast(negative_samples, tf.int32)),
    )
    return batch_loss, 1e-10

`compute_batch_utility(item_batch, basket_batch, store_batch, week_batch, price_batch, available_item_batch, user_batch)`

Compute the utility of all the items in item_batch given the items in basket_batch.

Parameters:

Name	Type	Description	Default
`item_batch`	`Union[ndarray, Tensor]`	Batch of the purchased items ID (integers) for which to compute the utility Shape must be (batch_size,) (positive and negative samples concatenated together)	required
`basket_batch`	`ndarray`	Batch of baskets (ID of items already in the baskets) (arrays) for each purchased item Shape must be (batch_size, max_basket_size)	required
`store_batch`	`ndarray`	Batch of store IDs (integers) for each purchased item Shape must be (batch_size,)	required
`week_batch`	`ndarray`	Batch of week numbers (integers) for each purchased item Shape must be (batch_size,)	required
`price_batch`	`ndarray`	Batch of prices (floats) for each purchased item Shape must be (batch_size,)	required
`available_item_batch`	`ndarray`	Batch of availability matrices (indicating the availability (1) or not (0) of the products) (arrays) for each purchased item Shape must be (batch_size, n_items)	required

Returns:

Name	Type	Description
`item_utilities`	`Tensor`	Utility of all the items in item_batch Shape must be (batch_size,)

Source code in choice_learn/basket_models/basic_attention_model.py

def compute_batch_utility(
    self,
    item_batch: Union[np.ndarray, tf.Tensor],
    basket_batch: np.ndarray,
    store_batch: np.ndarray,
    week_batch: np.ndarray,
    price_batch: np.ndarray,
    available_item_batch: np.ndarray,
    user_batch: np.ndarray,
) -> tf.Tensor:
    """Compute the utility of the items in item_batch given the items in basket_batch.

    The utility of an item is the dot product between the embedding of
    the context (see `embed_context`) and the item's row of Wo.

    Parameters
    ----------
    item_batch: np.ndarray or tf.Tensor
        Batch of item IDs (integers) for which to compute the utility
        Either one item per row, shape (batch_size,), or several
        candidate items per row, shape (batch_size, n_candidates)
    basket_batch: np.ndarray
        Batch of baskets (ID of items already in the baskets) (arrays) for each purchased item
        Shape must be (batch_size, max_basket_size)
    store_batch: np.ndarray
        Batch of store IDs (integers) for each purchased item
        Unused by this model
    week_batch: np.ndarray
        Batch of week numbers (integers) for each purchased item
        Unused by this model
    price_batch: np.ndarray
        Batch of prices (floats) for each purchased item
        Unused by this model
    available_item_batch: np.ndarray
        Batch of availability matrices (indicating the availability (1) or not (0)
        of the products) (arrays) for each purchased item
        Unused by this model
    user_batch: np.ndarray
        Unused by this model

    Returns
    -------
    item_utilities: tf.Tensor
        Utility of all the items in item_batch
        Shape is (batch_size,) for a 1D item_batch,
        (batch_size, n_candidates) otherwise
    """
    # Arguments only present for signature compatibility
    _ = (store_batch, price_batch, week_batch, available_item_batch, user_batch)

    # A 1D batch is temporarily given a candidate axis of length one
    single_item_per_row = len(tf.shape(item_batch)) == 1
    if single_item_per_row:
        item_batch = tf.expand_dims(item_batch, axis=1)

    context_embedding = self.embed_context(basket_batch)
    item_embeddings = tf.gather(self.Wo, tf.cast(item_batch, tf.int32))

    # k: row of the batch, l: candidate item, j: latent dimension
    utilities = tf.einsum("kj,klj->kl", context_embedding, item_embeddings)

    # Drop the candidate axis that was added for 1D inputs
    return tf.gather(utilities, 0, axis=1) if single_item_per_row else utilities

`embed_context(context_items)`

Return the context embedding matrix.

Returns:

Type	Description
`tf.Tensor`	[batch_size, latent_size] tf.Tensor Tensor containing the matrix of contexts embeddings.

Source code in choice_learn/basket_models/basic_attention_model.py

def embed_context(self, context_items: tf.Tensor) -> tf.Tensor:
    """Return the attention-weighted embedding of each context (basket).

    Each context item is embedded with Wi and scored by a dot product
    with wa; the scores are turned into attention weights by
    softmax_with_availabilities, using a mask that excludes the -1
    entries. The context embedding is the weighted sum of its item
    embeddings. Rows that contain no real item (only -1 entries) get
    the learned empty_context_embedding instead.

    Parameters
    ----------
        context_items : tf.Tensor
            [batch_size, max_context_length] integer item IDs, where -1
            is treated as padding.
            NOTE(review): this was previously documented as a
            tf.RaggedTensor; the -1 masking suggests a padded dense
            tensor -- confirm against the callers.

    Returns
    -------
        tf.Tensor
            [batch_size, latent_size] tf.Tensor
            Tensor containing the matrix of contexts embeddings.
    """
    is_padding = context_items == -1

    # Row 0 of the lookup table is all zeros, so that padding
    # (-1, shifted to index 0) gathers a null embedding.
    lookup_table = tf.concat([tf.zeros((1, self.latent_size)), self.Wi], axis=0)
    context_embedding = tf.gather(lookup_table, context_items + 1)

    e_values = tf.reduce_sum(context_embedding * self.wa, axis=-1)
    alphas = softmax_with_availabilities(
        items_logit_by_choice=e_values,
        available_items_by_choice=tf.where(is_padding, 0.0, 1.0),
    )
    final_embeddings = tf.reduce_sum(
        tf.expand_dims(alphas, axis=-1) * context_embedding, axis=1
    )

    # Detect empty contexts from the padding mask rather than by testing
    # the float embedding sum against 0.0, which could misfire on a real
    # context whose components happen to cancel out.
    has_no_item = tf.reduce_all(is_padding, axis=-1, keepdims=True)

    # tf.where broadcasts the (1, latent_size) fallback over the batch,
    # so no tiling by a Python-level batch length is needed.
    return tf.where(
        has_no_item,
        tf.expand_dims(self.empty_context_embedding, axis=0),
        final_embeddings,
    )

`fit(trip_dataset, val_dataset=None, verbose=0)`

Trains the model for a specified number of epochs.

Source code in choice_learn/basket_models/basic_attention_model.py

def fit(
    self,
    trip_dataset: TripDataset,
    val_dataset: Union[TripDataset, None] = None,
    verbose: int = 0,
):
    """Train the model on a dataset of baskets.

    The model is instantiated from the dataset if needed, the
    distribution used by the NCE loss is set, and the training itself
    is delegated to the parent class.

    Parameters
    ----------
        trip_dataset : TripDataset
            Dataset of baskets to train the model on.
        val_dataset : TripDataset or None
            Forwarded unchanged to the parent class `fit`.
        verbose : int
            Forwarded unchanged to the parent class `fit`.

    Returns
    -------
        The value returned by the parent class `fit` (training history).

    Raises
    ------
        TypeError
            If trip_dataset is not a TripDataset.
        ValueError
            If the largest basket plus the number of negative samples
            exceeds the number of items.
    """
    # Check the type first: everything below reads TripDataset attributes,
    # so a wrong type would otherwise fail with an AttributeError.
    if not isinstance(trip_dataset, TripDataset):
        raise TypeError("Dataset must be a TripDataset.")

    if not self.instantiated:
        self.instantiate(n_items=trip_dataset.n_items)

    # Negative samples are drawn outside of the basket, so the largest
    # basket must leave enough items to sample from.
    largest_basket_size = max(len(trip.purchases) for trip in trip_dataset.trips)
    if largest_basket_size + self.n_negative_samples > self.n_items:
        raise ValueError(
            "The number of items in the dataset is less than the number of negative samples."
        )

    if self.nce_distribution == "natural":
        self.negative_samples_distribution = self._get_items_frequencies(trip_dataset)
    else:
        # Any other value falls back to the uniform distribution 1/n_items
        self.negative_samples_distribution = np.full(
            (trip_dataset.n_items,), 1 / trip_dataset.n_items, dtype="float32"
        )

    history = super().fit(trip_dataset=trip_dataset, val_dataset=val_dataset, verbose=verbose)

    self.is_trained = True

    return history

`get_negative_samples(available_items, purchased_items, next_item, n_samples)`

Sample randomly a set of items.

(set of items not already purchased and not necessarily from the basket)

Parameters:

Name	Type	Description	Default
`available_items`	`ndarray`	Matrix indicating the availability (1) or not (0) of the products Shape must be (n_items,)	required
`purchased_items`	`ndarray`	List of items already purchased (already in the basket)	required
`next_item`	`int`	Next item (to be added in the basket)	required
`n_samples`	`int`	Number of samples to draw	required

Returns:

Type	Description
`list[int]`	Random sample of items, each of them distinct from the next item and from the items already in the basket

Source code in choice_learn/basket_models/basic_attention_model.py

def get_negative_samples(
    self,
    available_items: np.ndarray,
    purchased_items: np.ndarray,
    next_item: int,
    n_samples: int,
) -> list[int]:
    """Draw random negative items for one (basket, next item) pair.

    Candidates are the available items that are neither already in the
    basket nor equal to the next item; they are shuffled and the first
    ``n_samples`` are kept.

    Parameters
    ----------
    available_items: np.ndarray
        Availability flags of the products, 1 for available and 0 otherwise.
        Shape must be (n_items,)
    purchased_items: np.ndarray
        Items already purchased (already in the basket)
    next_item: int
        Next item (to be added in the basket)
    n_samples: int
        Number of samples to draw

    Returns
    -------
    list[int]
        Random sample of items, each of them distinct from the next item
        and from the items already in the basket.
        NOTE: despite the annotation, the returned object is a slice of the
        tensor produced by ``tf.random.shuffle``, not a Python list.
    """
    # Bring every input to an int32 tensor so the equality tests below agree on dtype
    availability = tf.cast(tf.convert_to_tensor(available_items), dtype=tf.int32)
    basket = tf.cast(tf.convert_to_tensor(purchased_items), dtype=tf.int32)
    target = tf.cast(tf.convert_to_tensor(next_item), dtype=tf.int32)

    # Ids of the items whose availability flag equals 1
    assortment = tf.boolean_mask(tf.range(self.n_items), tf.equal(availability, 1))

    # Items that must never be drawn: the basket content plus the next item
    excluded = tf.concat([basket, tf.expand_dims(target, axis=0)], axis=0)

    # Compare each assortment item against each excluded item, then collapse
    # the comparison along the excluded axis to obtain a 1D flag per item
    is_excluded = tf.reduce_any(
        tf.equal(tf.expand_dims(assortment, axis=1), excluded), axis=1
    )
    candidates = tf.boolean_mask(tensor=assortment, mask=tf.logical_not(is_excluded))

    # Fail when there are fewer candidates than requested samples
    tf.debugging.assert_greater_equal(
        tf.size(candidates),
        n_samples,
        message=(
            "The number of negative samples to draw must be less than "
            "the number of available items not already purchased and "
            "distinct from the next item."
        ),
    )

    # Shuffle, then truncate to the requested number of samples
    return tf.random.shuffle(candidates)[:n_samples]

`instantiate(n_items)`

Initialize the model parameters.

Parameters:

Name	Type	Description	Default
`n_items`	`int`	Number of unique items in the dataset.	required

Source code in choice_learn/basket_models/basic_attention_model.py

def instantiate(
    self,
    n_items: int,
) -> None:
    """Create the trainable variables and the loss of the model.

    Creates two (n_items, latent_size) variables ``Wi`` and ``Wo`` and two
    (latent_size,) variables ``wa`` and ``empty_context_embedding``, all
    drawn from a normal distribution with standard deviation 0.1, then
    marks the model as instantiated and not yet trained.

    Parameters
    ----------
    n_items : int
        Number of unique items in the dataset.
    """
    self.n_items = n_items

    def _random_normal(shape):
        # Shared initializer: same stddev and op seed for every variable
        return tf.random.normal(shape, stddev=0.1, seed=42)

    per_item_shape = (self.n_items, self.latent_size)
    latent_shape = (self.latent_size,)

    # NOTE: the creation order below is kept on purpose, since the random
    # draws are made sequentially with the same seed.
    # Presumably Wi / Wo are the input / output item embeddings and wa the
    # attention vector -- TODO confirm against the forward pass.
    self.Wi = tf.Variable(_random_normal(per_item_shape), name="Wi")
    self.Wo = tf.Variable(_random_normal(per_item_shape), name="Wo")
    self.wa = tf.Variable(_random_normal(latent_shape), name="wa")

    self.empty_context_embedding = tf.Variable(
        _random_normal(latent_shape),
        name="empty_context_embedding",
    )

    self.loss = NoiseConstrastiveEstimation()
    self.is_trained = False
    self.instantiated = True

Basic Attention Model

AttentionBasedContextEmbedding

train_iter_method: str property

trainable_weights property

__init__(latent_size=4, n_negative_samples=2, nce_distribution='natural', optimizer='adam', callbacks=None, lr=0.001, epochs=10, batch_size=32, grad_clip_value=None, weight_decay=None, momentum=0.0, **kwargs)

compute_batch_loss(item_batch, basket_batch, future_batch, store_batch, week_batch, price_batch, available_item_batch, user_batch)

compute_batch_utility(item_batch, basket_batch, store_batch, week_batch, price_batch, available_item_batch, user_batch)

embed_context(context_items)

fit(trip_dataset, val_dataset=None, verbose=0)

get_negative_samples(available_items, purchased_items, next_item, n_samples)

instantiate(n_items)

`AttentionBasedContextEmbedding`

`train_iter_method: str` `property`

`trainable_weights` `property`

`__init__(latent_size=4, n_negative_samples=2, nce_distribution='natural', optimizer='adam', callbacks=None, lr=0.001, epochs=10, batch_size=32, grad_clip_value=None, weight_decay=None, momentum=0.0, **kwargs)`

`compute_batch_loss(item_batch, basket_batch, future_batch, store_batch, week_batch, price_batch, available_item_batch, user_batch)`

`compute_batch_utility(item_batch, basket_batch, store_batch, week_batch, price_batch, available_item_batch, user_batch)`

`embed_context(context_items)`

`fit(trip_dataset, val_dataset=None, verbose=0)`

`get_negative_samples(available_items, purchased_items, next_item, n_samples)`

`instantiate(n_items)`