Merge pull request #16868 from chengduoZH/speedup_test_parallel_executor_transformer

Reduce the number of layers in the transformer model
revert-16839-cmakelist_change
Tao Luo 6 years ago committed by GitHub
commit 485bc6a055
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

@@ -65,7 +65,9 @@ class ModelHyperParams(object):
# number of heads used in multi-head attention.
n_head = 8
# number of sub-layers to be stacked in the encoder and decoder.
n_layer = 6
# NOTE(zcd): the original number of layers is 6; to make this unit test faster,
# we reduce the number of layers to 4.
n_layer = 4
# dropout rate used by all dropout layers.
dropout = 0.1

Loading…
Cancel
Save