# Copyright 2018 The Cornac Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ============================================================================
import numpy as np
from ...exception import ScoreException
from .recom_ncf_base import NCFBase
[docs]
class NeuMF(NCFBase):
"""Neural Matrix Factorization.
Parameters
----------
num_factors: int, optional, default: 8
Embedding size of MF model.
layers: list, optional, default: [64, 32, 16, 8]
MLP layers. Note that the first layer is the concatenation of
user and item embeddings. So layers[0]/2 is the embedding size.
act_fn: str, default: 'relu'
Name of the activation function used for the MLP layers.
Supported functions: ['sigmoid', 'tanh', 'elu', 'relu', 'selu, 'relu6', 'leaky_relu']
reg: float, optional, default: 0.
Regularization (weight_decay).
reg_layers: list, optional, default: [0., 0., 0., 0.]
Regularization for each MLP layer,
reg_layers[0] is the regularization for embeddings.
num_epochs: int, optional, default: 20
Number of epochs.
batch_size: int, optional, default: 256
Batch size.
num_neg: int, optional, default: 4
Number of negative instances to pair with a positive instance.
lr: float, optional, default: 0.001
Learning rate.
learner: str, optional, default: 'adam'
Specify an optimizer: adagrad, adam, rmsprop, sgd
backend: str, optional, default: 'tensorflow'
Backend used for model training: tensorflow, pytorch
early_stopping: {min_delta: float, patience: int}, optional, default: None
If `None`, no early stopping. Meaning of the arguments:
- `min_delta`: the minimum increase in monitored value on validation set to be considered as improvement, \
i.e. an increment of less than min_delta will count as no improvement.
- `patience`: number of epochs with no improvement after which training should be stopped.
name: string, optional, default: 'NeuMF'
Name of the recommender model.
trainable: boolean, optional, default: True
When False, the model is not trained and Cornac assumes that the model is already \
pre-trained.
verbose: boolean, optional, default: False
When True, some running logs are displayed.
seed: int, optional, default: None
Random seed for parameters initialization.
References
----------
* He, X., Liao, L., Zhang, H., Nie, L., Hu, X., & Chua, T. S. (2017, April). Neural collaborative filtering. \
In Proceedings of the 26th international conference on world wide web (pp. 173-182).
"""
def __init__(
self,
name="NeuMF",
num_factors=8,
layers=(64, 32, 16, 8),
act_fn="relu",
reg=0.0,
num_epochs=20,
batch_size=256,
num_neg=4,
lr=0.001,
learner="adam",
backend="tensorflow",
early_stopping=None,
trainable=True,
verbose=True,
seed=None,
):
super().__init__(
name=name,
trainable=trainable,
verbose=verbose,
num_epochs=num_epochs,
batch_size=batch_size,
num_neg=num_neg,
lr=lr,
learner=learner,
backend=backend,
early_stopping=early_stopping,
seed=seed,
)
self.num_factors = num_factors
self.layers = layers
self.act_fn = act_fn
self.reg = reg
self.pretrained = False
self.ignored_attrs.extend(
[
"gmf_user_id",
"mlp_user_id",
"pretrained_gmf",
"pretrained_mlp",
"alpha",
]
)
[docs]
def from_pretrained(self, pretrained_gmf, pretrained_mlp, alpha=0.5):
"""Provide pre-trained GMF and MLP models. Section 3.4.1 of the paper.
Parameters
----------
pretrained_gmf: object of type GMF, required
Reference to trained/fitted GMF model.
pretrained_mlp: object of type MLP, required
Reference to trained/fitted MLP model.
alpha: float, optional, default: 0.5
Hyper-parameter determining the trade-off between the two pre-trained models.
Details are described in the section 3.4.1 of the paper.
"""
self.pretrained = True
self.pretrained_gmf = pretrained_gmf
self.pretrained_mlp = pretrained_mlp
self.alpha = alpha
return self
########################
## TensorFlow backend ##
########################
def _build_model_tf(self):
import tensorflow as tf
from .backend_tf import GMFLayer, MLPLayer
# Define inputs
user_input = tf.keras.layers.Input(shape=(1,), dtype=tf.int32, name="user_input")
item_input = tf.keras.layers.Input(shape=(1,), dtype=tf.int32, name="item_input")
# GMF layer
gmf_layer = GMFLayer(
num_users=self.num_users,
num_items=self.num_items,
emb_size=self.num_factors,
reg_user=self.reg,
reg_item=self.reg,
seed=self.seed,
name="gmf_layer"
)
# MLP layer
mlp_layer = MLPLayer(
num_users=self.num_users,
num_items=self.num_items,
layers=self.layers,
reg_layers=[self.reg] * len(self.layers),
act_fn=self.act_fn,
seed=self.seed,
name="mlp_layer"
)
# Get embeddings and element-wise product
gmf_vector = gmf_layer([user_input, item_input])
mlp_vector = mlp_layer([user_input, item_input])
# Concatenate GMF and MLP vectors
concat_vector = tf.keras.layers.Concatenate(axis=-1)([gmf_vector, mlp_vector])
# Output layer
logits = tf.keras.layers.Dense(
1,
kernel_initializer=tf.keras.initializers.LecunUniform(seed=self.seed),
name="logits"
)(concat_vector)
prediction = tf.keras.layers.Activation('sigmoid', name="prediction")(logits)
# Create model
model = tf.keras.Model(
inputs=[user_input, item_input],
outputs=prediction,
name="NeuMF"
)
# Handle pretrained models
if self.pretrained:
# Get GMF and MLP models
gmf_model = self.pretrained_gmf.model
mlp_model = self.pretrained_mlp.model
# Copy GMF embeddings
model.get_layer('gmf_layer').user_embedding.set_weights(
gmf_model.get_layer('gmf_layer').user_embedding.get_weights()
)
model.get_layer('gmf_layer').item_embedding.set_weights(
gmf_model.get_layer('gmf_layer').item_embedding.get_weights()
)
# Copy MLP embeddings and layers
model.get_layer('mlp_layer').user_embedding.set_weights(
mlp_model.get_layer('mlp_layer').user_embedding.get_weights()
)
model.get_layer('mlp_layer').item_embedding.set_weights(
mlp_model.get_layer('mlp_layer').item_embedding.get_weights()
)
# Copy dense layers in MLP
for i, layer in enumerate(model.get_layer('mlp_layer').dense_layers):
layer.set_weights(mlp_model.get_layer('mlp_layer').dense_layers[i].get_weights())
# Combine weights for output layer
gmf_logits_weights = gmf_model.get_layer('logits').get_weights()
mlp_logits_weights = mlp_model.get_layer('logits').get_weights()
# Combine kernel weights
combined_kernel = np.concatenate([
self.alpha * gmf_logits_weights[0],
(1.0 - self.alpha) * mlp_logits_weights[0]
], axis=0)
# Combine bias weights
combined_bias = self.alpha * gmf_logits_weights[1] + (1.0 - self.alpha) * mlp_logits_weights[1]
# Set combined weights to output layer
model.get_layer('logits').set_weights([combined_kernel, combined_bias])
return model
#####################
## PyTorch backend ##
#####################
def _build_model_pt(self):
from .backend_pt import NeuMF
model = NeuMF(
num_users=self.num_users,
num_items=self.num_items,
layers=self.layers,
num_factors=self.num_factors,
act_fn=self.act_fn,
)
if self.pretrained:
model.from_pretrained(
self.pretrained_gmf.model, self.pretrained_mlp.model, self.alpha
)
return model
def _score_pt(self, user_idx, item_idx):
import torch
with torch.no_grad():
if item_idx is None:
users = torch.from_numpy(np.ones(self.num_items, dtype=int) * user_idx)
items = (torch.from_numpy(np.arange(self.num_items))).to(self.device)
else:
users = torch.tensor(user_idx).unsqueeze(0)
items = torch.tensor(item_idx).unsqueeze(0)
gmf_users = torch.tensor(user_idx).unsqueeze(0).to(self.device)
output = self.model(
users.to(self.device), items.to(self.device), gmf_users.to(self.device)
)
return output.squeeze().cpu().numpy()