diff --git a/paddlenlp/transformers/sequence_parallel_utils.py b/paddlenlp/transformers/sequence_parallel_utils.py index 5a73c998eed4b48251491eb43fa0d547a22677d0..2e43a48e44136fdb7446a1d5092462d2d54903ae 100644 --- a/paddlenlp/transformers/sequence_parallel_utils.py +++ b/paddlenlp/transformers/sequence_parallel_utils.py @@ -24,7 +24,8 @@ from paddle.distributed.fleet.utils.hybrid_parallel_util import ( ) from paddle.fluid import core from paddle.nn import functional as F -from paddle.nn.layer.layers import Layer +# from paddle.nn.layer.layers import Layer +from paddle.nn import Layer __all__ = [ "GatherOp",