|
|
|
@ -105,7 +105,7 @@ class MNIST(fluid.imperative.Layer):
|
|
|
|
|
class TestImperativeMnist(unittest.TestCase):
|
|
|
|
|
def test_mnist_float32(self):
|
|
|
|
|
seed = 90
|
|
|
|
|
batch_num = 2
|
|
|
|
|
epoch_num = 1
|
|
|
|
|
with fluid.imperative.guard():
|
|
|
|
|
fluid.default_startup_program().random_seed = seed
|
|
|
|
|
fluid.default_main_program().random_seed = seed
|
|
|
|
@ -113,39 +113,40 @@ class TestImperativeMnist(unittest.TestCase):
|
|
|
|
|
mnist = MNIST("mnist")
|
|
|
|
|
sgd = SGDOptimizer(learning_rate=1e-3)
|
|
|
|
|
train_reader = paddle.batch(
|
|
|
|
|
paddle.dataset.mnist.train(), batch_size=128)
|
|
|
|
|
paddle.dataset.mnist.train(), batch_size=128, drop_last=True)
|
|
|
|
|
|
|
|
|
|
dy_param_init_value = {}
|
|
|
|
|
for batch_id, data in enumerate(train_reader()):
|
|
|
|
|
if batch_id >= batch_num:
|
|
|
|
|
break
|
|
|
|
|
|
|
|
|
|
dy_x_data = np.array(
|
|
|
|
|
[x[0].reshape(1, 28, 28) for x in data]).astype('float32')
|
|
|
|
|
y_data = np.array([x[1] for x in data]).astype('int64').reshape(
|
|
|
|
|
128, 1)
|
|
|
|
|
|
|
|
|
|
img = to_variable(dy_x_data)
|
|
|
|
|
label = to_variable(y_data)
|
|
|
|
|
label._stop_gradient = True
|
|
|
|
|
|
|
|
|
|
cost = mnist(img)
|
|
|
|
|
loss = fluid.layers.cross_entropy(cost, label)
|
|
|
|
|
avg_loss = fluid.layers.mean(loss)
|
|
|
|
|
dy_out = avg_loss._numpy()
|
|
|
|
|
|
|
|
|
|
if batch_id == 0:
|
|
|
|
|
for param in fluid.default_main_program().global_block(
|
|
|
|
|
).all_parameters():
|
|
|
|
|
dy_param_init_value[param.name] = param._numpy()
|
|
|
|
|
|
|
|
|
|
avg_loss._backward()
|
|
|
|
|
sgd.minimize(avg_loss)
|
|
|
|
|
mnist.clear_gradients()
|
|
|
|
|
dy_param_value = {}
|
|
|
|
|
for param in fluid.default_main_program().global_block(
|
|
|
|
|
).all_parameters():
|
|
|
|
|
dy_param_value[param.name] = param._numpy()
|
|
|
|
|
for epoch in range(epoch_num):
|
|
|
|
|
for batch_id, data in enumerate(train_reader()):
|
|
|
|
|
dy_x_data = np.array(
|
|
|
|
|
[x[0].reshape(1, 28, 28)
|
|
|
|
|
for x in data]).astype('float32')
|
|
|
|
|
y_data = np.array(
|
|
|
|
|
[x[1] for x in data]).astype('int64').reshape(128, 1)
|
|
|
|
|
|
|
|
|
|
img = to_variable(dy_x_data)
|
|
|
|
|
label = to_variable(y_data)
|
|
|
|
|
label._stop_gradient = True
|
|
|
|
|
|
|
|
|
|
cost = mnist(img)
|
|
|
|
|
loss = fluid.layers.cross_entropy(cost, label)
|
|
|
|
|
avg_loss = fluid.layers.mean(loss)
|
|
|
|
|
|
|
|
|
|
dy_out = avg_loss._numpy()
|
|
|
|
|
|
|
|
|
|
if epoch == 0 and batch_id == 0:
|
|
|
|
|
for param in mnist.parameters():
|
|
|
|
|
dy_param_init_value[param.name] = param._numpy()
|
|
|
|
|
|
|
|
|
|
avg_loss._backward()
|
|
|
|
|
sgd.minimize(avg_loss)
|
|
|
|
|
mnist.clear_gradients()
|
|
|
|
|
|
|
|
|
|
fluid.default_main_program().global_block()._clear_block()
|
|
|
|
|
|
|
|
|
|
dy_param_value = {}
|
|
|
|
|
for param in mnist.parameters():
|
|
|
|
|
dy_param_value[param.name] = param._numpy()
|
|
|
|
|
|
|
|
|
|
with new_program_scope():
|
|
|
|
|
fluid.default_startup_program().random_seed = seed
|
|
|
|
@ -157,7 +158,7 @@ class TestImperativeMnist(unittest.TestCase):
|
|
|
|
|
mnist = MNIST("mnist")
|
|
|
|
|
sgd = SGDOptimizer(learning_rate=1e-3)
|
|
|
|
|
train_reader = paddle.batch(
|
|
|
|
|
paddle.dataset.mnist.train(), batch_size=128)
|
|
|
|
|
paddle.dataset.mnist.train(), batch_size=128, drop_last=True)
|
|
|
|
|
|
|
|
|
|
img = fluid.layers.data(
|
|
|
|
|
name='pixel', shape=[1, 28, 28], dtype='float32')
|
|
|
|
@ -170,8 +171,7 @@ class TestImperativeMnist(unittest.TestCase):
|
|
|
|
|
# initialize params and fetch them
|
|
|
|
|
static_param_init_value = {}
|
|
|
|
|
static_param_name_list = []
|
|
|
|
|
for param in fluid.default_startup_program().global_block(
|
|
|
|
|
).all_parameters():
|
|
|
|
|
for param in mnist.parameters():
|
|
|
|
|
static_param_name_list.append(param.name)
|
|
|
|
|
|
|
|
|
|
out = exe.run(fluid.default_startup_program(),
|
|
|
|
@ -180,26 +180,29 @@ class TestImperativeMnist(unittest.TestCase):
|
|
|
|
|
for i in range(len(static_param_name_list)):
|
|
|
|
|
static_param_init_value[static_param_name_list[i]] = out[i]
|
|
|
|
|
|
|
|
|
|
for batch_id, data in enumerate(train_reader()):
|
|
|
|
|
if batch_id >= batch_num:
|
|
|
|
|
break
|
|
|
|
|
|
|
|
|
|
static_x_data = np.array(
|
|
|
|
|
[x[0].reshape(1, 28, 28) for x in data]).astype('float32')
|
|
|
|
|
y_data = np.array([x[1] for x in data]).astype('int64').reshape(
|
|
|
|
|
[128, 1])
|
|
|
|
|
|
|
|
|
|
fetch_list = [avg_loss.name]
|
|
|
|
|
fetch_list.extend(static_param_name_list)
|
|
|
|
|
out = exe.run(fluid.default_main_program(),
|
|
|
|
|
feed={"pixel": static_x_data,
|
|
|
|
|
"label": y_data},
|
|
|
|
|
fetch_list=fetch_list)
|
|
|
|
|
|
|
|
|
|
static_param_value = {}
|
|
|
|
|
static_out = out[0]
|
|
|
|
|
for i in range(1, len(out)):
|
|
|
|
|
static_param_value[static_param_name_list[i - 1]] = out[i]
|
|
|
|
|
for epoch in range(epoch_num):
|
|
|
|
|
for batch_id, data in enumerate(train_reader()):
|
|
|
|
|
static_x_data = np.array(
|
|
|
|
|
[x[0].reshape(1, 28, 28)
|
|
|
|
|
for x in data]).astype('float32')
|
|
|
|
|
y_data = np.array(
|
|
|
|
|
[x[1] for x in data]).astype('int64').reshape([128, 1])
|
|
|
|
|
|
|
|
|
|
fetch_list = [avg_loss.name]
|
|
|
|
|
fetch_list.extend(static_param_name_list)
|
|
|
|
|
out = exe.run(
|
|
|
|
|
fluid.default_main_program(),
|
|
|
|
|
feed={"pixel": static_x_data,
|
|
|
|
|
"label": y_data},
|
|
|
|
|
fetch_list=fetch_list)
|
|
|
|
|
|
|
|
|
|
static_param_value = {}
|
|
|
|
|
static_out = out[0]
|
|
|
|
|
for i in range(1, len(out)):
|
|
|
|
|
static_param_value[static_param_name_list[i - 1]] = out[
|
|
|
|
|
i]
|
|
|
|
|
|
|
|
|
|
self.assertTrue(np.allclose(dy_x_data.all(), static_x_data.all()))
|
|
|
|
|
|
|
|
|
|
for key, value in six.iteritems(static_param_init_value):
|
|
|
|
|
self.assertTrue(np.allclose(value, dy_param_init_value[key]))
|
|
|
|
@ -207,7 +210,7 @@ class TestImperativeMnist(unittest.TestCase):
|
|
|
|
|
self.assertTrue(np.allclose(static_out, dy_out))
|
|
|
|
|
|
|
|
|
|
for key, value in six.iteritems(static_param_value):
|
|
|
|
|
self.assertTrue(np.allclose(value, dy_param_value[key]))
|
|
|
|
|
self.assertTrue(np.allclose(value, dy_param_value[key], atol=1e-5))
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if __name__ == '__main__':
|
|
|
|
|