import tensorflow as tf
import numpy as np
from tf_utils import *
from preprocess import standardize_kpi, complete_timestamp
from math import factorial, pi, pow, log
from tensorflow.python import debug as tf_debug
from tensorflow.contrib.layers import batch_norm, layer_norm
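
# Buzz: a variational autoencoder over fixed-length sliding windows of a
# univariate KPI series, trained adversarially against a WGAN-style critic
# with a gradient penalty. Windows of length 128 are reshaped to 8x16 "images"
# for the convolutional encoder and critic. The `conv`, `deconv` and `fc`
# helpers are expected to come from the project's tf_utils module.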
tf.reset_default_graph()


class Buzz():
    def __init__(self, z_dim):
        self._z_dim = z_dim

    # `x \in [-10, 10]`
    def build_q_net(self, x, outdimension=64):
        # x -> z (encoder)
        with tf.variable_scope('build_q_net', reuse=tf.AUTO_REUSE):
            lz_x = tf.reshape(x, [-1, 8, 16, 1])
            # 4 conv layers
            lz_x = conv(lz_x, outdimension*4, 'conv1', stride_size=2, activation_func=tf.nn.leaky_relu, batch_normalization=True)
            lz_x = conv(lz_x, outdimension*2, 'conv2', activation_func=tf.nn.leaky_relu, batch_normalization=True)
            lz_x = conv(lz_x, outdimension*2, 'conv3', stride_size=2, activation_func=tf.nn.leaky_relu, batch_normalization=True)
            lz_x = conv(lz_x, outdimension, 'conv4', activation_func=tf.nn.leaky_relu, batch_normalization=True)
            # get z_mean and z_std from fully connected layers,
            # each of shape [batch_size, z_dimension]
            with tf.name_scope('ZMEAN'):
                z_mean = fc(lz_x, self._z_dim, 'z_mean', activation_func=None, batch_normalization=False)
                # z_mean = tf.layers.batch_normalization(z_mean)
            with tf.name_scope('ZSTD'):
                z_std = fc(lz_x, self._z_dim, 'z_std', activation_func=tf.nn.softplus, batch_normalization=False)
            return z_mean, z_std
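
    # Decoder/generator: maps a latent z back to a window of length
    # output_num, mirroring the encoder with deconvolutions; the output is
    # clipped to the same [-10, 10] range as the standardized input.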
    def genModel(self, z, in_dimension=64, output_num=128):
        with tf.variable_scope('genModel', reuse=tf.AUTO_REUSE):
            batch_size = z.get_shape().as_list()[0]
            # fully connected layer
            lx_z = fc(z, 512, 'fc', activation_func=None)
            # reshape and 4 deconv layers
            lx_z = tf.reshape(lx_z, [-1, 2, 4, in_dimension])
            lx_z = deconv(lx_z, in_dimension*2, 'deconv1', activation_func=tf.nn.leaky_relu, batch_normalization=True)
            lx_z = deconv(lx_z, in_dimension*2, 'deconv2', stride_size=2, activation_func=tf.nn.leaky_relu, batch_normalization=True)
            lx_z = deconv(lx_z, in_dimension*4, 'deconv3', activation_func=tf.nn.leaky_relu, batch_normalization=True)
            lx_z = deconv(lx_z, 1, 'deconv4', stride_size=2, activation_func=tf.nn.leaky_relu, batch_normalization=False)
            resShape = lx_z.get_shape().as_list()
            lx_z = tf.reshape(lx_z, [batch_size, resShape[1] * resShape[2] * resShape[3]])
            lx_z = fc(lx_z, output_num, 'deconvOut', activation_func=None, batch_normalization=False)
            lx_z = tf.clip_by_value(lx_z, -10, 10)
            return lx_z
    # chain the q_net (encoder) and the generative model (decoder)
    def autoEncoder(self, x, outDimension=64):
        with tf.name_scope('Variational_Net'):
            mu, sigma = self.build_q_net(x, outDimension)
        with tf.name_scope('Z_GenNetInput'):
            # reparameterization trick: z = mu + sigma * eps, eps ~ N(0, I)
            z = mu + sigma * tf.random.normal(tf.shape(mu), 0, 1, dtype=tf.float32)
        with tf.name_scope('GenerationNet'):
            Xhat = self.genModel(z, outDimension)
        with tf.name_scope('KL_divergence'):
            # negative KL(q(z|x) || N(0, I)), averaged over the batch
            negKL = 0.5 * tf.reduce_mean(tf.reduce_sum(
                1 + tf.log(1e-8 + tf.square(sigma)) - tf.square(mu) - tf.square(sigma), 1))
        # Xhat has shape [batch_size, window_size]; negKL is a scalar
        return Xhat, negKL
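
    # Critic: the same convolutional trunk as the encoder, ending in a single
    # scalar score per window.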
    def discNet(self, x, outdimension=32):
        with tf.variable_scope('discNet', reuse=tf.AUTO_REUSE):
            lz_x = tf.reshape(x, [-1, 8, 16, 1])
            # 4 conv layers
            lz_x = conv(lz_x, outdimension*4, 'conv1', stride_size=2, activation_func=tf.nn.leaky_relu, batch_normalization=True)
            lz_x = conv(lz_x, outdimension*2, 'conv2', activation_func=tf.nn.leaky_relu, batch_normalization=True)
            lz_x = conv(lz_x, outdimension*2, 'conv3', stride_size=2, activation_func=tf.nn.leaky_relu, batch_normalization=True)
            lz_x = conv(lz_x, outdimension, 'conv4', activation_func=tf.nn.leaky_relu, batch_normalization=True)
            dis = fc(lz_x, 1, 'dis', batch_normalization=False, activation_func=None)
            # shape [batch_size, 1]
            return dis
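
    # Losses, as built below:
    #   wgan_loss = E[D(x)] - E[D(Xhat)]
    #   vloss     = |wgan_loss| - eta * GP          (the critic ascends this)
    #   Wloss     = -la * |wgan_loss| - KL - logZ   (the VAE ascends this)
    # where GP is the WGAN-GP gradient penalty on random interpolates between
    # x and Xhat, and la (lambda) is a trainable scale clipped to [1e-3, 10].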
    def getLoss(self, x, eta, window_size=128):
        Xhat, negKL = self.autoEncoder(x)
        with tf.name_scope('DisX'):
            dis1 = self.discNet(x)
        with tf.name_scope('DisGenZ'):
            dis2 = self.discNet(Xhat)
        with tf.name_scope('wgan_loss'):
            wgan_loss = tf.reduce_mean(dis1 - dis2)  # scalar
        # gradient penalty on random interpolates between x and Xhat
        batch_size = x.get_shape().as_list()[0]
        kxi = tf.random_uniform(shape=[batch_size, window_size])
        with tf.name_scope('hatX'):
            Xnew = kxi * (x - Xhat) + Xhat
        with tf.name_scope('get_gradient_penalty'):
            gradients = tf.gradients(self.discNet(Xnew), [Xnew])[0]
            # gradients = tf.clip_by_value(gradients, -10, 10)
            slopes = tf.sqrt(tf.reduce_sum(tf.square(gradients), axis=1))
            gradientPenalty = tf.reduce_mean((slopes - 1.) ** 2)  # scalar
        # vloss = |wgan_loss| - eta * GP
        with tf.variable_scope('vloss'):
            vloss = tf.math.abs(wgan_loss) - eta * gradientPenalty
        # Wloss = -la * |wgan_loss| - KL - logZ
        with tf.variable_scope('omegaLoss', reuse=tf.AUTO_REUSE):
            la = tf.get_variable('lambda', shape=(), initializer=tf.constant_initializer(0.5))
            la = tf.clip_by_value(la, 1e-3, 10)
            # log normalizing constant: the la-independent part is computed in
            # plain Python, the la-dependent part in the graph
            logZ = log(factorial(window_size) / factorial(int(window_size / 2)) * 2 * pow(pi, window_size / 2)) \
                - window_size * tf.math.log(la)
            Wloss = -la * tf.math.abs(wgan_loss) + negKL - logZ
        return Xhat, negKL, wgan_loss, gradientPenalty, vloss, Wloss, logZ, la
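
# Read a labeled KPI CSV with a header row and rows of the form
# `timestamp,value,label`; nonzero labels mark anomalous points (they are
# excluded from standardization below).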
def readData(fileName):
    with open(fileName) as fileObj:
        next(fileObj)  # skip the header line
        timestamp = []
        values = []
        labels = []
        for line in fileObj:
            tmpList = line.split(',')
            timestamp.append(int(tmpList[0]))
            values.append(float(tmpList[1]))
            labels.append(int(tmpList[2]))
    return timestamp, values, labels

if __name__ == "__main__":
    '''
    parameters
    '''
    z_dimension = 13
    eta = 10           # gradient penalty weight
    window_size = 128
    n_critic = 3       # critic iterations per generator iteration
    s0 = 32            # initial neighborhood size
    b0 = 8             # initial batch size
    # parameters for the Adam optimizers
    alpha0 = 1e-3
    beta1 = 0.9
    beta2 = 0.999
    # load the data
    fileName = './cpu4.csv'
    timestamp, values, labels = readData(fileName)
    # labels = np.zeros_like(values, dtype=np.int32)
    # complete the timestamps and obtain the missing-point indicators
    timestamp, missing, (values, labels) = complete_timestamp(timestamp, (values, labels))
    # split the data into training and testing sets
    test_portion = 0.3
    test_n = int(len(values) * test_portion)
    train_values, test_values = values[:-test_n], values[-test_n:]
    train_labels, test_labels = labels[:-test_n], labels[-test_n:]
    train_missing, test_missing = missing[:-test_n], missing[-test_n:]
    # standardize the training and testing data (excluding anomalous and
    # missing points from the mean/std estimate) and clip them to [-10, 10]
    train_values, mean, std = standardize_kpi(
        train_values, excludes=np.logical_or(train_labels, train_missing))
    test_values, _, _ = standardize_kpi(test_values, mean=mean, std=std)
    # build the computation graph
    x = tf.placeholder(tf.float32, shape=[s0 * b0, window_size], name='inputData')
    DisOptimizer = tf.train.AdamOptimizer(learning_rate=alpha0, beta1=beta1, beta2=beta2)
    GenOptimizer = tf.train.AdamOptimizer(learning_rate=alpha0, beta1=beta1, beta2=beta2)
    model = Buzz(z_dimension)
    Xhat, negKL, wgan_loss, gradientPenalty, vloss, Wloss, logZ, la = model.getLoss(x, eta)
    # each optimizer updates only its own sub-network: the critic ascends
    # vloss over the discNet variables, and the VAE (encoder, decoder and
    # lambda) ascends Wloss over the remaining variables
    dis_vars = tf.get_collection(tf.GraphKeys.TRAINABLE_VARIABLES, scope='discNet')
    gen_vars = [v for v in tf.trainable_variables() if not v.name.startswith('discNet')]
    Dis_loss = DisOptimizer.minimize(-vloss, var_list=dis_vars)
    Gen_loss = GenOptimizer.minimize(-Wloss, var_list=gen_vars)
    trainDataLen = len(train_values)
    gpu_options = tf.GPUOptions(per_process_gpu_memory_fraction=0.5)
    sess = tf.Session(config=tf.ConfigProto(gpu_options=gpu_options))
    # sess = tf.Session()
    sess.run(tf.global_variables_initializer())
    # writer = tf.summary.FileWriter('./logs', sess.graph)
    # sess = tf_debug.LocalCLIDebugWrapperSession(sess=sess)
    epoch = 0
    while s0 > 0:
        # shuffle the candidate window positions (omega); skip the first
        # window_size points so every window is complete
        stopNum = (trainDataLen - window_size) // s0
        NC = [window_size + i * s0 for i in range(stopNum)]
        np.random.shuffle(NC)
        for critic in range(stopNum // b0):
            selectedOmega = NC[b0 * critic: b0 * (critic + 1)]
            # build the input batch: for each selected position, take its s0
            # neighboring windows, giving shape [s0 * b0, window_size]
            inputs = []
            for i in range(b0):
                for j in range(s0):
                    inputs.append(train_values[selectedOmega[i] + j - window_size + 1: selectedOmega[i] + j + 1])
            if critic % 4 == 3:
                # one generator (VAE) step after every n_critic = 3 critic steps
                _, GenLoss, WL, GP, _KL, LZ, barX, LAM = sess.run(
                    [Gen_loss, -Wloss, wgan_loss, gradientPenalty, negKL, logZ, Xhat, la],
                    feed_dict={x: inputs})
                print('epoch: {} GenLoss: {} s0: {} b0: {}, wgan_loss: {}, GP: {}, -KL: {}, LZ: {}, LAM: {}'.format(
                    epoch, GenLoss, s0, b0, WL, GP, _KL, LZ, LAM))
            else:
                _, DisLoss, WL, GP, barX, LAM = sess.run(
                    [Dis_loss, -vloss, wgan_loss, gradientPenalty, Xhat, la],
                    feed_dict={x: inputs})
                print('epoch: {} DisLoss: {} s0: {} b0: {}, wgan_loss: {}, GP: {}, LAM: {}'.format(
                    epoch, DisLoss, s0, b0, WL, GP, LAM))
        epoch += 1
        print('epoch: {} GenLoss: {} DisLoss: {} s0: {} b0: {}'.format(epoch, GenLoss, DisLoss, s0, b0))
        # every 40 epochs halve the neighborhood size and double the batch
        # size; s0 * b0 stays constant, matching the placeholder shape, and
        # training stops once s0 reaches 0
        if epoch % 40 == 0:
            s0 = s0 // 2
            b0 = b0 * 2