diff --git a/optimum/neuron/modeling_seq2seq.py b/optimum/neuron/modeling_seq2seq.py index e936e8f5f..c6b1253c9 100644 --- a/optimum/neuron/modeling_seq2seq.py +++ b/optimum/neuron/modeling_seq2seq.py @@ -429,7 +429,7 @@ def _combine_encoder_decoder_config(self, encoder_config: "PretrainedConfig", de from transformers import {processor_class} from optimum.neuron import {model_class} # 1. compile - if __name__ == "__main__": # compulsory for parallel tracing since the API will spawn multiple processes + if __name__ == "__main__": # compulsory for parallel tracing since the API will spawn multiple processes. neuron_model = {model_class}.from_pretrained( {checkpoint_tp}, export=True, tensor_parallel_size=8, dynamic_batch_size=False, batch_size=1, sequence_length=128, num_beams=4, )