前往小程序,Get更优阅读体验!
立即前往
首页
学习
活动
专区
工具
TVP
发布
社区首页 >专栏 >深度推荐算法——DeepFM [IJCAI 17][Huawei]

深度推荐算法——DeepFM [IJCAI 17][Huawei]

作者头像
小爷毛毛_卓寿杰
发布2021-03-20 14:32:19
5060
发布2021-03-20 14:32:19
举报
文章被收录于专栏:Soul Joy Hub

视频讲解:https://www.yuque.com/chudi/tzqav9/ny150b#aalY8

在这里插入图片描述
在这里插入图片描述
代码语言:javascript
复制
import tensorflow as tf
from tensorflow import keras
from utils import *

EPOCH = 10
BATCH_SIZE = 32
VEC_DIM = 10
DNN_LAYERS = [64, 128, 64]
DROPOUT_RATE = 0.5

base, test = loadData()
# 所有的特征各个类别值个数之和
FEAT_CATE_NUM = base.shape[1] - 1
K = tf.keras.backend


class CrossLayer(keras.layers.Layer):
    def __init__(self, feat_num, vec_dim, **kwargs):
        self.feat_num = feat_num
        self.vec_dim = vec_dim
        super(CrossLayer, self).__init__(**kwargs)

    def build(self, input_shape):
        self.V = self.add_weight(name='V', shape=(self.feat_num, self.vec_dim), initializer='uniform', trainable=True)
        super(CrossLayer, self).build(input_shape)

    def call(self, inputs, **kwargs):
        a = K.pow(K.dot(inputs, self.V), 2)
        b = K.dot(K.pow(inputs, 2), K.pow(self.V, 2))
        return 0.5 * K.mean(a - b, 1, keepdims=True)


def run():
    # 返回id化特征 和 one-hot特征
    val_x_id, val_x_hot, val_y = getAllData(test)
    train_x_id, train_x_hot, train_y = getAllData(base)
    cate_num = val_x_id[0].shape[0]
    hot_num = val_x_hot[0].shape[0]
    sub_emb_arr = []
    product_list = []

    # Deep 部分
    inputs_id = keras.Input((cate_num,))
    emb = keras.layers.Embedding(FEAT_CATE_NUM, VEC_DIM, input_length=cate_num)(inputs_id)
    deep = keras.layers.Flatten()(emb)
    deep = keras.layers.Dropout(DROPOUT_RATE)(deep)
    for units in DNN_LAYERS:
        deep = keras.layers.Dense(units, activation='relu')(deep)
        deep = keras.layers.Dropout(DROPOUT_RATE)(deep)

    # FM 部分
    # 将emb切分成各个field的小emb
    split_arr = tf.split(emb, cate_num, 1)
    for split in split_arr:
        sub_emb_arr.append(keras.layers.Flatten()(split))
    # 内积
    for i in range(0, len(sub_emb_arr)):
        for j in range(i + 1, len(sub_emb_arr)):
            product_list.append(keras.layers.Dot(axes=1)([sub_emb_arr[i], sub_emb_arr[j]]))
    wide = keras.Input((hot_num,))

    deep_fm = keras.layers.concatenate(product_list + [wide] + [deep])
    deep_fm = keras.layers.Dropout(DROPOUT_RATE)(deep_fm)
    outputs = keras.layers.Dense(1, activation='sigmoid',kernel_regularizer=keras.regularizers.l2(0.001))(deep_fm)

    model = keras.Model(inputs=[inputs_id, wide], outputs=outputs)
    model.compile(loss='binary_crossentropy', optimizer=tf.train.AdamOptimizer(0.001), metrics=[keras.metrics.AUC()])
    tbCallBack = keras.callbacks.TensorBoard(log_dir='./logs',
                                             histogram_freq=0,
                                             write_graph=True,
                                             write_grads=True,
                                             write_images=True,
                                             embeddings_freq=0,
                                             embeddings_layer_names=None,
                                             embeddings_metadata=None)

    model.fit([train_x_id, train_x_hot], train_y, batch_size=BATCH_SIZE, epochs=EPOCH, verbose=2,
              validation_data=([val_x_id, val_x_hot], val_y),
              callbacks=[tbCallBack])


run()
本文参与 腾讯云自媒体同步曝光计划,分享自作者个人站点/博客。
原始发表:2021/02/14 ,如有侵权请联系 cloudcommunity@tencent.com 删除

本文分享自 作者个人站点/博客 前往查看

如有侵权,请联系 cloudcommunity@tencent.com 删除。

本文参与 腾讯云自媒体同步曝光计划  ,欢迎热爱写作的你一起参与!

评论
登录后参与评论
0 条评论
热度
最新
推荐阅读
领券
问题归档专栏文章快讯文章归档关键词归档开发者手册归档开发者手册 Section 归档