File tree (expand / collapse): 5 files changed, +52 -34 lines changed
Original file line number Diff line number Diff line change 2929from .feature_extraction_utils import BatchFeature , FeatureExtractionMixin
3030from .image_processing_utils import ImageProcessingMixin
3131from .attention_utils import create_bigbird_rand_mask_idx_list
32- from paddle .distributed .fleet .utils .sequence_parallel_utils import (
33- GatherOp ,
34- ScatterOp ,
35- AllGatherOp ,
36- ReduceScatterOp ,
37- ColumnSequenceParallelLinear ,
38- RowSequenceParallelLinear ,
39- mark_as_sequence_parallel_parameter ,
40- register_sequence_parallel_allreduce_hooks ,
41- )
32+
33+ try :
34+ from paddle .distributed .fleet .utils .sequence_parallel_utils import (
35+ GatherOp ,
36+ ScatterOp ,
37+ AllGatherOp ,
38+ ReduceScatterOp ,
39+ ColumnSequenceParallelLinear ,
40+ RowSequenceParallelLinear ,
41+ mark_as_sequence_parallel_parameter ,
42+ register_sequence_parallel_allreduce_hooks ,
43+ )
44+ except :
45+ pass
4246from .export import export_model
4347
4448# isort: split
Original file line number Diff line number Diff line change 2929from paddle .distributed import fleet
3030from paddle .distributed .fleet .meta_parallel import get_rng_state_tracker
3131from paddle .distributed .fleet .utils import recompute
32- from paddle .distributed .fleet .utils .sequence_parallel_utils import (
33- ColumnSequenceParallelLinear ,
34- GatherOp ,
35- RowSequenceParallelLinear ,
36- ScatterOp ,
37- mark_as_sequence_parallel_parameter ,
38- )
32+
33+ try :
34+ from paddle .distributed .fleet .utils .sequence_parallel_utils import (
35+ ColumnSequenceParallelLinear ,
36+ GatherOp ,
37+ RowSequenceParallelLinear ,
38+ ScatterOp ,
39+ mark_as_sequence_parallel_parameter ,
40+ )
41+ except :
42+ pass
3943from paddle .nn import BCEWithLogitsLoss , CrossEntropyLoss , MSELoss
4044
4145from ...utils .converter import StateDictNameMapping
Original file line number Diff line number Diff line change 2020 SharedLayerDesc ,
2121)
2222from paddle .distributed .fleet .utils import recompute
23- from paddle .distributed .fleet .utils .sequence_parallel_utils import (
24- mark_as_sequence_parallel_parameter ,
25- )
23+
24+ try :
25+ from paddle .distributed .fleet .utils .sequence_parallel_utils import (
26+ mark_as_sequence_parallel_parameter ,
27+ )
28+ except :
29+ pass
2630
2731from paddlenlp .transformers .model_utils import PipelinePretrainedModel
2832
Original file line number Diff line number Diff line change @@ -44,13 +44,16 @@ def swiglu(x, y=None):
4444 return F .silu (x ) * y
4545
4646
47- from paddle .distributed .fleet .utils .sequence_parallel_utils import (
48- ColumnSequenceParallelLinear ,
49- GatherOp ,
50- RowSequenceParallelLinear ,
51- ScatterOp ,
52- mark_as_sequence_parallel_parameter ,
53- )
47+ try :
48+ from paddle .distributed .fleet .utils .sequence_parallel_utils import (
49+ ColumnSequenceParallelLinear ,
50+ GatherOp ,
51+ RowSequenceParallelLinear ,
52+ ScatterOp ,
53+ mark_as_sequence_parallel_parameter ,
54+ )
55+ except :
56+ pass
5457from paddle .utils import try_import
5558
5659from paddlenlp .transformers .conversion_utils import (
Original file line number Diff line number Diff line change 3333except ImportError :
3434 fused_rotary_position_embedding = None
3535
36- from paddle .distributed .fleet .utils .sequence_parallel_utils import (
37- ColumnSequenceParallelLinear ,
38- GatherOp ,
39- RowSequenceParallelLinear ,
40- ScatterOp ,
41- mark_as_sequence_parallel_parameter ,
42- )
36+ try :
37+ from paddle .distributed .fleet .utils .sequence_parallel_utils import (
38+ ColumnSequenceParallelLinear ,
39+ GatherOp ,
40+ RowSequenceParallelLinear ,
41+ ScatterOp ,
42+ mark_as_sequence_parallel_parameter ,
43+ )
44+ except :
45+ pass
4346
4447from paddlenlp .transformers .conversion_utils import (
4548 StateDictNameMapping ,
You can’t perform that action at this time.
0 commit comments