@@ -1232,6 +1232,7 @@ def create_predictor(
1232
1232
dtype = predictor_args .dtype ,
1233
1233
tensor_parallel_degree = tensor_parallel_degree ,
1234
1234
tensor_parallel_rank = tensor_parallel_rank ,
1235
+ tensor_parallel_output = False ,
1235
1236
)
1236
1237
elif model_args .model_type == "ernie-3.5-se" :
1237
1238
sys .path .append ("./ernie-3.5-se" )
@@ -1244,6 +1245,7 @@ def create_predictor(
1244
1245
dtype = predictor_args .dtype ,
1245
1246
tensor_parallel_degree = tensor_parallel_degree ,
1246
1247
tensor_parallel_rank = tensor_parallel_rank ,
1248
+ tensor_parallel_output = False ,
1247
1249
)
1248
1250
else :
1249
1251
model = AutoModelForCausalLM .from_pretrained (
@@ -1252,6 +1254,7 @@ def create_predictor(
1252
1254
use_flash_attention = predictor_args .use_flash_attention ,
1253
1255
tensor_parallel_degree = tensor_parallel_degree ,
1254
1256
tensor_parallel_rank = tensor_parallel_rank ,
1257
+ tensor_parallel_output = False ,
1255
1258
)
1256
1259
1257
1260
predictor = DygraphPredictor (predictor_args , model = model , tokenizer = tokenizer )
0 commit comments