|
|
@ -36,7 +36,7 @@ class TestMomentumOptimizer(unittest.TestCase):
|
|
|
|
def get_velocity_str(self):
|
|
|
|
def get_velocity_str(self):
|
|
|
|
return self._velocity_acc_str
|
|
|
|
return self._velocity_acc_str
|
|
|
|
|
|
|
|
|
|
|
|
def test_momentum_optimizer(self):
|
|
|
|
def test_vanilla_momentum_optimizer(self):
|
|
|
|
program = framework.Program()
|
|
|
|
program = framework.Program()
|
|
|
|
block = program.global_block()
|
|
|
|
block = program.global_block()
|
|
|
|
mul_x = block.create_parameter(
|
|
|
|
mul_x = block.create_parameter(
|
|
|
@ -60,6 +60,42 @@ class TestMomentumOptimizer(unittest.TestCase):
|
|
|
|
self.assertEqual(len(opts), 1)
|
|
|
|
self.assertEqual(len(opts), 1)
|
|
|
|
sgd_op = opts[0]
|
|
|
|
sgd_op = opts[0]
|
|
|
|
self.assertEqual(sgd_op.type, "momentum")
|
|
|
|
self.assertEqual(sgd_op.type, "momentum")
|
|
|
|
|
|
|
|
self.assertFalse(sgd_op.attr('useNesterov'))
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Check accumulators
|
|
|
|
|
|
|
|
accumulators = momentum_optimizer.get_accumulators()
|
|
|
|
|
|
|
|
self.assertEqual(len(accumulators), 1)
|
|
|
|
|
|
|
|
self.assertTrue(momentum_optimizer.get_velocity_str() in accumulators)
|
|
|
|
|
|
|
|
velocity_acc = accumulators[momentum_optimizer.get_velocity_str()]
|
|
|
|
|
|
|
|
self.assertEqual(len(velocity_acc), 1)
|
|
|
|
|
|
|
|
self.assertTrue(mul_x.name in velocity_acc)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def test_nesterov_momentum_optimizer(self):
|
|
|
|
|
|
|
|
program = framework.Program()
|
|
|
|
|
|
|
|
block = program.global_block()
|
|
|
|
|
|
|
|
mul_x = block.create_parameter(
|
|
|
|
|
|
|
|
dtype="float32", shape=[5, 10], lod_level=0, name="mul.x")
|
|
|
|
|
|
|
|
mul_y = block.create_var(
|
|
|
|
|
|
|
|
dtype="float32", shape=[10, 8], lod_level=0, name="mul.y")
|
|
|
|
|
|
|
|
mul_out = block.create_var(
|
|
|
|
|
|
|
|
dtype="float32", shape=[5, 8], lod_level=0, name="mul.out")
|
|
|
|
|
|
|
|
block.append_op(
|
|
|
|
|
|
|
|
type="mul",
|
|
|
|
|
|
|
|
inputs={"X": mul_x,
|
|
|
|
|
|
|
|
"Y": mul_y},
|
|
|
|
|
|
|
|
outputs={"Out": mul_out},
|
|
|
|
|
|
|
|
attrs={"x_num_col_dims": 1})
|
|
|
|
|
|
|
|
momentum_optimizer = self.MockMomentum(
|
|
|
|
|
|
|
|
learning_rate=0.01, momentum=0.2, use_nesterov=True)
|
|
|
|
|
|
|
|
params_grads = append_backward_ops(mul_out)
|
|
|
|
|
|
|
|
self.assertEqual(len(params_grads), 1)
|
|
|
|
|
|
|
|
self.assertEqual(len(momentum_optimizer.get_accumulators()), 0)
|
|
|
|
|
|
|
|
opts = momentum_optimizer.create_optimization_pass(params_grads,
|
|
|
|
|
|
|
|
mul_out)
|
|
|
|
|
|
|
|
self.assertEqual(len(opts), 1)
|
|
|
|
|
|
|
|
sgd_op = opts[0]
|
|
|
|
|
|
|
|
self.assertEqual(sgd_op.type, "momentum")
|
|
|
|
|
|
|
|
self.assertTrue(sgd_op.attr('useNesterov'))
|
|
|
|
|
|
|
|
|
|
|
|
# Check accumulators
|
|
|
|
# Check accumulators
|
|
|
|
accumulators = momentum_optimizer.get_accumulators()
|
|
|
|
accumulators = momentum_optimizer.get_accumulators()
|
|
|
|