From 8f93919f51e3c647dac3d7a2b7c48e2a38f7b095 Mon Sep 17 00:00:00 2001 From: LiuChiaChi <709153940@qq.com> Date: Wed, 12 May 2021 09:40:28 +0000 Subject: [PATCH] Upgrade the usage of sublayers --- seq2seq/utility.py | 2 +- transformer/transformer.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/seq2seq/utility.py b/seq2seq/utility.py index fc446ef..d56f6b7 100644 --- a/seq2seq/utility.py +++ b/seq2seq/utility.py @@ -90,7 +90,7 @@ def get_model_cls(model_cls): @functools.wraps(model_cls.__init__) def __lstm_patch__(self, *args, **kwargs): self._raw_init(*args, **kwargs) - layers = self.sublayers(include_sublayers=True) + layers = self.sublayers(include_self=False) for layer in layers: if isinstance(layer, BasicLSTMCell): layer._forget_bias.stop_gradient = False diff --git a/transformer/transformer.py b/transformer/transformer.py index 8359bf5..1c8b03c 100644 --- a/transformer/transformer.py +++ b/transformer/transformer.py @@ -58,7 +58,7 @@ def __init__(self, process_cmd, d_model, dropout_rate): self.functors.append( self.add_sublayer( "layer_norm_%d" % len( - self.sublayers(include_sublayers=False)), + self.sublayers(include_self=True)), LayerNorm( normalized_shape=d_model, param_attr=fluid.ParamAttr(