@@ -1232,6 +1232,7 @@ def create_predictor(
12321232 dtype = predictor_args .dtype ,
12331233 tensor_parallel_degree = tensor_parallel_degree ,
12341234 tensor_parallel_rank = tensor_parallel_rank ,
1235+ tensor_parallel_output = False ,
12351236 )
12361237 elif model_args .model_type == "ernie-3.5-se" :
12371238 sys .path .append ("./ernie-3.5-se" )
@@ -1244,6 +1245,7 @@ def create_predictor(
12441245 dtype = predictor_args .dtype ,
12451246 tensor_parallel_degree = tensor_parallel_degree ,
12461247 tensor_parallel_rank = tensor_parallel_rank ,
1248+ tensor_parallel_output = False ,
12471249 )
12481250 else :
12491251 model = AutoModelForCausalLM .from_pretrained (
@@ -1252,6 +1254,7 @@ def create_predictor(
12521254 use_flash_attention = predictor_args .use_flash_attention ,
12531255 tensor_parallel_degree = tensor_parallel_degree ,
12541256 tensor_parallel_rank = tensor_parallel_rank ,
1257+ tensor_parallel_output = False ,
12551258 )
12561259
12571260 predictor = DygraphPredictor (predictor_args , model = model , tokenizer = tokenizer )
0 commit comments