Skip to content

Commit

Permalink
Fix pipeline parallelism (PP) issue
Browse files (browse the repository at this point in the history)
  • Loading branch information
michaelbenayoun committed Sep 24, 2024
1 parent 3748a06 commit b0cc1d1
Showing 1 changed file with 2 additions and 1 deletion.
3 changes: 2 additions & 1 deletion optimum/neuron/distributed/decoder_models.py
Original file line number Diff line number Diff line change
Expand Up @@ -29,6 +29,7 @@
LlamaDecoderLayer,
LlamaForQuestionAnswering,
LlamaRMSNorm,
+ LlamaRotaryEmbedding,
repeat_kv,
)
from transformers.models.mistral.modeling_mistral import (
Expand Down Expand Up @@ -554,7 +555,7 @@ class LlamaPipelineParallelismSpecs(PipelineParallelismSpecs):
"LlamaForQuestionAnswering": ("input_ids", "attention_mask", "start_positions", "end_positions"),
}

- LEAF_MODULE_CLASSES_NAMES = [LlamaRMSNorm]
+ LEAF_MODULE_CLASSES_NAMES = [LlamaRMSNorm, LlamaRotaryEmbedding]


class LlamaParallelizer(Parallelizer):
Expand Down

0 comments on commit b0cc1d1

Please sign in to comment.