# @Time : 2020/12/17
# @Author : Yuanhang Zhou
# @Email : sdzyh002@gmail
# UPDATE
# @Time : 2021/1/7, 2021/1/4
# @Author : Xiaolei Wang, Yuanhang Zhou
# @email : wxl1999@foxmail.com, sdzyh002@gmail.com
r"""
Profile_BERT
============
References:
Zhou, Kun, et al. `"Towards Topic-Guided Conversational Recommender System."`_ in COLING 2020.
.. _`"Towards Topic-Guided Conversational Recommender System."`:
https://www.aclweb.org/anthology/2020.coling-main.365/
"""
import os
import torch
from torch import nn
from transformers import BertModel
from crslab.config import PRETRAIN_PATH
from crslab.data import dataset_language_map
from crslab.model.base import BaseModel
from crslab.model.pretrained_models import resources
[docs]class ProfileBERTModel(BaseModel):
"""
Attributes:
topic_class_num: A integer indicating the number of topic.
n_sent: A integer indicating sequence length in user profile.
"""
def __init__(self, opt, device, vocab, side_data):
"""
Args:
opt (dict): A dictionary record the hyper parameters.
device (torch.device): A variable indicating which device to place the data and model.
vocab (dict): A dictionary record the vocabulary information.
side_data (dict): A dictionary record the side data.
"""
self.topic_class_num = vocab['n_topic']
self.n_sent = opt.get('n_sent', 10)
language = dataset_language_map[opt['dataset']]
resource = resources['bert'][language]
dpath = os.path.join(PRETRAIN_PATH, "bert", language)
super(ProfileBERTModel, self).__init__(opt, device, dpath, resource)
[docs] def build_model(self, *args, **kwargs):
"""build model"""
self.profile_bert = BertModel.from_pretrained(self.dpath)
self.bert_hidden_size = self.profile_bert.config.hidden_size
self.state2topic_id = nn.Linear(self.bert_hidden_size,
self.topic_class_num)
self.loss = nn.CrossEntropyLoss()
[docs] def forward(self, batch, mode):
# conv_id, message_id, context, context_mask, topic_path_kw, tp_mask, user_profile, profile_mask, y = batch
context, context_mask, topic_path_kw, tp_mask, user_profile, profile_mask, y = batch
bs = user_profile.size(0) // self.n_sent
profile_rep = self.profile_bert(
user_profile, profile_mask).pooler_output # (bs, word_num, hidden)
profile_rep = profile_rep.view(bs, self.n_sent, -1)
profile_rep = torch.mean(profile_rep, dim=1) # (bs, hidden)
topic_scores = self.state2topic_id(profile_rep)
topic_loss = self.loss(topic_scores, y)
return topic_loss, topic_scores