forked from wangzhegeek/EGES
-
Notifications
You must be signed in to change notification settings - Fork 2
/
EGES_model.py
71 lines (64 loc) · 2.94 KB
/
EGES_model.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
import numpy as np
import tensorflow as tf
class EGES_Model:
def __init__(self, num_nodes, num_feat, feature_lens, n_sampled=100, embedding_dim=128, lr=0.001):
self.n_samped = n_sampled
self.num_feat = num_feat
self.feature_lens = feature_lens
self.embedding_dim = embedding_dim
self.num_nodes = num_nodes
self.lr = lr
self.softmax_w = tf.Variable(tf.truncated_normal((num_nodes, embedding_dim), stddev=0.1), name='softmax_w')
self.softmax_b = tf.Variable(tf.zeros(num_nodes), name='softmax_b')
self.inputs = self.input_init()
self.embedding = self.embedding_init()
self.alpha_embedding = tf.Variable(tf.random_uniform((num_nodes, num_feat), -1, 1))
self.merge_emb = self.attention_merge()
self.cost = self.make_skipgram_loss()
# self.train_op = tf.train.AdagradOptimizer(lr).minimize(self.cost)
self.train_op = tf.train.AdamOptimizer(lr).minimize(self.cost)
def embedding_init(self):
cat_embedding_vars = []
for i in range(self.num_feat):
embedding_var = tf.Variable(tf.random_uniform((self.feature_lens[i], self.embedding_dim), -1, 1), name='embedding'+str(i),
trainable=True)
cat_embedding_vars.append(embedding_var)
return cat_embedding_vars
def attention_merge(self):
embed_list = []
num_embed_list = []
for i in range(self.num_feat):
cat_embed = tf.nn.embedding_lookup(self.embedding[i], self.inputs[i])
embed_list.append(cat_embed)
stack_embed = tf.stack(embed_list, axis=-1)
# attention merge
alpha_embed = tf.nn.embedding_lookup(self.alpha_embedding, self.inputs[0])
alpha_embed_expand = tf.expand_dims(alpha_embed, 1)
alpha_i_sum = tf.reduce_sum(tf.exp(alpha_embed_expand), axis=-1)
merge_emb = tf.reduce_sum(stack_embed * tf.exp(alpha_embed_expand), axis=-1) / alpha_i_sum
return merge_emb
def input_init(self):
input_list = []
for i in range(self.num_feat):
input_col = tf.placeholder(tf.int32, [None], name='inputs_'+str(i))
input_list.append(input_col)
input_list.append(tf.placeholder(tf.int32, shape=[None, 1], name='label'))
return input_list
def make_skipgram_loss(self):
loss = tf.reduce_mean(tf.nn.sampled_softmax_loss(
weights=self.softmax_w,
biases=self.softmax_b,
labels=self.inputs[-1],
inputs=self.merge_emb,
num_sampled=self.n_samped,
num_classes=self.num_nodes,
num_true=1,
sampled_values=tf.random.uniform_candidate_sampler(
true_classes=tf.cast(self.inputs[-1], tf.int64),
num_true=1,
num_sampled=self.n_samped,
unique=True,
range_max=self.num_nodes
)
))
return loss