diff --git a/src/fastertransformer/triton_backend/t5/T5TritonModel.cc b/src/fastertransformer/triton_backend/t5/T5TritonModel.cc index 85138fa6f..31981ae86 100644 --- a/src/fastertransformer/triton_backend/t5/T5TritonModel.cc +++ b/src/fastertransformer/triton_backend/t5/T5TritonModel.cc @@ -190,7 +190,7 @@ T5TritonModel::createModelInstance(int ft::getAttentionType(encoder_size_per_head_, sm_, true, encoder_num_bucket_or_max_pos_seq_len_, false); ft::NcclParam tensor_para_ = nccl_params.first[comms_rank]; - ft::NcclParam pipeline_para_ = nccl_params.first[comms_rank]; + ft::NcclParam pipeline_para_ = nccl_params.second[comms_rank]; auto encoder = std::make_unique>(ft::T5Encoder(0, 0,